xmlwriter.py 5.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175
  1. # -*- Mode: Python -*-
  2. # GObject-Introspection - a framework for introspecting GObject libraries
  3. # Copyright (C) 2008 Johan Dahlin
  4. #
  5. # This library is free software; you can redistribute it and/or
  6. # modify it under the terms of the GNU Lesser General Public
  7. # License as published by the Free Software Foundation; either
  8. # version 2 of the License, or (at your option) any later version.
  9. #
  10. # This library is distributed in the hope that it will be useful,
  11. # but WITHOUT ANY WARRANTY; without even the implied warranty of
  12. # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  13. # Lesser General Public License for more details.
  14. #
  15. # You should have received a copy of the GNU Lesser General Public
  16. # License along with this library; if not, write to the
  17. # Free Software Foundation, Inc., 59 Temple Place - Suite 330,
  18. # Boston, MA 02111-1307, USA.
  19. #
  20. from __future__ import with_statement
  21. from __future__ import absolute_import
  22. from __future__ import division
  23. from __future__ import print_function
  24. from __future__ import unicode_literals
  25. import os
  26. import sys
  27. from contextlib import contextmanager
  28. from xml.sax.saxutils import escape
  29. from .libtoolimporter import LibtoolImporter
  30. if sys.version_info.major < 3:
  31. from StringIO import StringIO
  32. else:
  33. from io import StringIO
  34. unicode = str
  35. with LibtoolImporter(None, None):
  36. if 'UNINSTALLED_INTROSPECTION_SRCDIR' in os.environ:
  37. from _giscanner import collect_attributes
  38. else:
  39. from giscanner._giscanner import collect_attributes
  40. def build_xml_tag(tag_name, attributes=None, data=None, self_indent=0,
  41. self_indent_char=' '):
  42. if attributes is None:
  43. attributes = []
  44. prefix = '<%s' % (tag_name, )
  45. if data is not None:
  46. if isinstance(data, bytes):
  47. data = data.decode('UTF-8')
  48. suffix = '>%s</%s>' % (escape(data), tag_name)
  49. else:
  50. suffix = '/>'
  51. attrs = collect_attributes(
  52. tag_name, attributes,
  53. self_indent,
  54. self_indent_char,
  55. len(prefix) + len(suffix))
  56. return prefix + attrs + suffix
  57. class XMLWriter(object):
  58. def __init__(self):
  59. # Build up the XML buffer as unicode strings. When writing to disk,
  60. # we can assume the lack of a Byte Order Mark (BOM) and lack
  61. # of an "encoding" xml property means utf-8.
  62. # See: http://www.opentag.com/xfaq_enc.htm#enc_default
  63. self._data = StringIO()
  64. self._data.write('<?xml version="1.0"?>\n')
  65. self._tag_stack = []
  66. self._indent = 0
  67. self._indent_unit = 2
  68. self.enable_whitespace()
  69. # Private
  70. def _open_tag(self, tag_name, attributes=None):
  71. if attributes is None:
  72. attributes = []
  73. attrs = collect_attributes(tag_name, attributes,
  74. self._indent, self._indent_char, len(tag_name) + 2)
  75. self.write_line('<%s%s>' % (tag_name, attrs))
  76. def _close_tag(self, tag_name):
  77. self.write_line('</%s>' % (tag_name, ))
  78. # Public API
  79. def enable_whitespace(self):
  80. self._indent_char = ' '
  81. self._newline_char = '\n'
  82. def disable_whitespace(self):
  83. self._indent_char = ''
  84. self._newline_char = ''
  85. def get_xml(self):
  86. """Returns a unicode string containing the XML."""
  87. return self._data.getvalue()
  88. def get_encoded_xml(self):
  89. """Returns a utf-8 encoded bytes object containing the XML."""
  90. return self._data.getvalue().encode('utf-8')
  91. def write_line(self, line='', indent=True, do_escape=False):
  92. if isinstance(line, bytes):
  93. line = line.decode('utf-8')
  94. assert isinstance(line, unicode)
  95. if do_escape:
  96. line = escape(line)
  97. if indent:
  98. self._data.write('%s%s%s' % (self._indent_char * self._indent,
  99. line,
  100. self._newline_char))
  101. else:
  102. self._data.write('%s%s' % (line, self._newline_char))
  103. def write_comment(self, text):
  104. self.write_line('<!-- %s -->' % (text, ))
  105. def write_tag(self, tag_name, attributes, data=None):
  106. self.write_line(build_xml_tag(tag_name, attributes, data,
  107. self._indent, self._indent_char))
  108. def push_tag(self, tag_name, attributes=None):
  109. if attributes is None:
  110. attributes = []
  111. self._open_tag(tag_name, attributes)
  112. self._tag_stack.append(tag_name)
  113. self._indent += self._indent_unit
  114. def pop_tag(self):
  115. self._indent -= self._indent_unit
  116. tag_name = self._tag_stack.pop()
  117. self._close_tag(tag_name)
  118. return tag_name
  119. @contextmanager
  120. def tagcontext(self, tag_name, attributes=None):
  121. self.push_tag(tag_name, attributes)
  122. try:
  123. yield
  124. finally:
  125. self.pop_tag()
  126. def test():
  127. w = XMLWriter()
  128. w.push_tag('repository')
  129. w.push_tag('namespace')
  130. w.push_tag('enumeration')
  131. w.push_tag('member',
  132. [('name', 'west'),
  133. ('value', '7'),
  134. ('c:identifier', 'GTK_ANCHOR_WEST'),
  135. ('glib:nick', 'west')])
  136. w.pop_tag()
  137. w.pop_tag()
  138. w.pop_tag()
  139. x = w.get_xml()
  140. lines = x.split('\n')
  141. import pprint
  142. pprint.pprint(lines)
  143. assert len(lines[3]) < 80, len(lines[3])
  144. if __name__ == '__main__':
  145. test()