sourcescanner.py 9.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323
  1. # -*- Mode: Python -*-
  2. # GObject-Introspection - a framework for introspecting GObject libraries
  3. # Copyright (C) 2008 Johan Dahlin
  4. #
  5. # This library is free software; you can redistribute it and/or
  6. # modify it under the terms of the GNU Lesser General Public
  7. # License as published by the Free Software Foundation; either
  8. # version 2 of the License, or (at your option) any later version.
  9. #
  10. # This library is distributed in the hope that it will be useful,
  11. # but WITHOUT ANY WARRANTY; without even the implied warranty of
  12. # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  13. # Lesser General Public License for more details.
  14. #
  15. # You should have received a copy of the GNU Lesser General Public
  16. # License along with this library; if not, write to the
  17. # Free Software Foundation, Inc., 59 Temple Place - Suite 330,
  18. # Boston, MA 02111-1307, USA.
  19. #
  20. from __future__ import with_statement
  21. from __future__ import absolute_import
  22. from __future__ import division
  23. from __future__ import print_function
  24. from __future__ import unicode_literals
  25. import os
  26. import subprocess
  27. import tempfile
  28. from .libtoolimporter import LibtoolImporter
  29. from .message import Position
  30. from .ccompiler import CCompiler
  31. with LibtoolImporter(None, None):
  32. if 'UNINSTALLED_INTROSPECTION_SRCDIR' in os.environ:
  33. from _giscanner import SourceScanner as CSourceScanner
  34. else:
  35. from giscanner._giscanner import SourceScanner as CSourceScanner
  36. HEADER_EXTS = ['.h', '.hpp', '.hxx']
  37. SOURCE_EXTS = ['.c', '.cpp', '.cc', '.cxx']
  38. ALL_EXTS = SOURCE_EXTS + HEADER_EXTS
  39. (CSYMBOL_TYPE_INVALID,
  40. CSYMBOL_TYPE_ELLIPSIS,
  41. CSYMBOL_TYPE_CONST,
  42. CSYMBOL_TYPE_OBJECT,
  43. CSYMBOL_TYPE_FUNCTION,
  44. CSYMBOL_TYPE_STRUCT,
  45. CSYMBOL_TYPE_UNION,
  46. CSYMBOL_TYPE_ENUM,
  47. CSYMBOL_TYPE_TYPEDEF,
  48. CSYMBOL_TYPE_MEMBER) = range(10)
  49. (CTYPE_INVALID,
  50. CTYPE_VOID,
  51. CTYPE_BASIC_TYPE,
  52. CTYPE_TYPEDEF,
  53. CTYPE_STRUCT,
  54. CTYPE_UNION,
  55. CTYPE_ENUM,
  56. CTYPE_POINTER,
  57. CTYPE_ARRAY,
  58. CTYPE_FUNCTION) = range(10)
  59. STORAGE_CLASS_NONE = 0
  60. STORAGE_CLASS_TYPEDEF = 1 << 1
  61. STORAGE_CLASS_EXTERN = 1 << 2
  62. STORAGE_CLASS_STATIC = 1 << 3
  63. STORAGE_CLASS_AUTO = 1 << 4
  64. STORAGE_CLASS_REGISTER = 1 << 5
  65. TYPE_QUALIFIER_NONE = 0
  66. TYPE_QUALIFIER_CONST = 1 << 1
  67. TYPE_QUALIFIER_RESTRICT = 1 << 2
  68. TYPE_QUALIFIER_VOLATILE = 1 << 3
  69. TYPE_QUALIFIER_EXTENSION = 1 << 4
  70. FUNCTION_NONE = 0
  71. FUNCTION_INLINE = 1 << 1
  72. (UNARY_ADDRESS_OF,
  73. UNARY_POINTER_INDIRECTION,
  74. UNARY_PLUS,
  75. UNARY_MINUS,
  76. UNARY_BITWISE_COMPLEMENT,
  77. UNARY_LOGICAL_NEGATION) = range(6)
  78. def symbol_type_name(symbol_type):
  79. return {
  80. CSYMBOL_TYPE_INVALID: 'invalid',
  81. CSYMBOL_TYPE_ELLIPSIS: 'ellipsis',
  82. CSYMBOL_TYPE_CONST: 'const',
  83. CSYMBOL_TYPE_OBJECT: 'object',
  84. CSYMBOL_TYPE_FUNCTION: 'function',
  85. CSYMBOL_TYPE_STRUCT: 'struct',
  86. CSYMBOL_TYPE_UNION: 'union',
  87. CSYMBOL_TYPE_ENUM: 'enum',
  88. CSYMBOL_TYPE_TYPEDEF: 'typedef',
  89. CSYMBOL_TYPE_MEMBER: 'member'}.get(symbol_type)
  90. def ctype_name(ctype):
  91. return {
  92. CTYPE_INVALID: 'invalid',
  93. CTYPE_VOID: 'void',
  94. CTYPE_BASIC_TYPE: 'basic',
  95. CTYPE_TYPEDEF: 'typedef',
  96. CTYPE_STRUCT: 'struct',
  97. CTYPE_UNION: 'union',
  98. CTYPE_ENUM: 'enum',
  99. CTYPE_POINTER: 'pointer',
  100. CTYPE_ARRAY: 'array',
  101. CTYPE_FUNCTION: 'function'}.get(ctype)
  102. class SourceType(object):
  103. __members__ = ['type', 'base_type', 'name', 'type_qualifier',
  104. 'child_list', 'is_bitfield']
  105. def __init__(self, scanner, stype):
  106. self._scanner = scanner
  107. self._stype = stype
  108. def __repr__(self):
  109. return "<%s type='%s' name='%s'>" % (
  110. self.__class__.__name__,
  111. ctype_name(self.type),
  112. self.name)
  113. @property
  114. def type(self):
  115. return self._stype.type
  116. @property
  117. def base_type(self):
  118. if self._stype.base_type is not None:
  119. return SourceType(self._scanner, self._stype.base_type)
  120. @property
  121. def name(self):
  122. return self._stype.name
  123. @property
  124. def type_qualifier(self):
  125. return self._stype.type_qualifier
  126. @property
  127. def child_list(self):
  128. for symbol in self._stype.child_list:
  129. if symbol is None:
  130. continue
  131. yield SourceSymbol(self._scanner, symbol)
  132. @property
  133. def is_bitfield(self):
  134. return self._stype.is_bitfield
  135. class SourceSymbol(object):
  136. __members__ = ['const_int', 'const_double', 'const_string', 'const_boolean',
  137. 'ident', 'type', 'base_type']
  138. def __init__(self, scanner, symbol):
  139. self._scanner = scanner
  140. self._symbol = symbol
  141. def __repr__(self):
  142. src = self.source_filename
  143. if src:
  144. line = self.line
  145. if line:
  146. src += ":'%s'" % (line, )
  147. return "<%s type='%s' ident='%s' src='%s'>" % (
  148. self.__class__.__name__,
  149. symbol_type_name(self.type),
  150. self.ident,
  151. src)
  152. @property
  153. def const_int(self):
  154. return self._symbol.const_int
  155. @property
  156. def const_double(self):
  157. return self._symbol.const_double
  158. @property
  159. def const_string(self):
  160. return self._symbol.const_string
  161. @property
  162. def const_boolean(self):
  163. return self._symbol.const_boolean
  164. @property
  165. def ident(self):
  166. return self._symbol.ident
  167. @property
  168. def type(self):
  169. return self._symbol.type
  170. @property
  171. def base_type(self):
  172. if self._symbol.base_type is not None:
  173. return SourceType(self._scanner, self._symbol.base_type)
  174. @property
  175. def source_filename(self):
  176. return self._symbol.source_filename
  177. @property
  178. def line(self):
  179. return self._symbol.line
  180. @property
  181. def private(self):
  182. return self._symbol.private
  183. @property
  184. def position(self):
  185. return Position(self._symbol.source_filename,
  186. self._symbol.line)
  187. class SourceScanner(object):
  188. def __init__(self):
  189. self._scanner = CSourceScanner()
  190. self._filenames = []
  191. self._cpp_options = []
  192. # Public API
  193. def set_cpp_options(self, includes, defines, undefines, cflags=[]):
  194. self._cpp_options.extend(cflags)
  195. for prefix, args in [('-I', [os.path.realpath(f) for f in includes]),
  196. ('-D', defines),
  197. ('-U', undefines)]:
  198. for arg in (args or []):
  199. opt = prefix + arg
  200. if opt not in self._cpp_options:
  201. self._cpp_options.append(opt)
  202. def parse_files(self, filenames):
  203. for filename in filenames:
  204. # self._scanner expects file names to be canonicalized and symlinks to be resolved
  205. filename = os.path.realpath(filename)
  206. self._scanner.append_filename(filename)
  207. self._filenames.append(filename)
  208. headers = []
  209. for filename in self._filenames:
  210. if os.path.splitext(filename)[1] in SOURCE_EXTS:
  211. self._scanner.lex_filename(filename)
  212. else:
  213. headers.append(filename)
  214. self._parse(headers)
  215. def parse_macros(self, filenames):
  216. self._scanner.set_macro_scan(True)
  217. # self._scanner expects file names to be canonicalized and symlinks to be resolved
  218. self._scanner.parse_macros([os.path.realpath(f) for f in filenames])
  219. self._scanner.set_macro_scan(False)
  220. def get_symbols(self):
  221. for symbol in self._scanner.get_symbols():
  222. yield SourceSymbol(self._scanner, symbol)
  223. def get_comments(self):
  224. return self._scanner.get_comments()
  225. def dump(self):
  226. print('-' * 30)
  227. for symbol in self._scanner.get_symbols():
  228. print(symbol.ident, symbol.base_type.name, symbol.type)
  229. # Private
  230. def _parse(self, filenames):
  231. if not filenames:
  232. return
  233. defines = ['__GI_SCANNER__']
  234. undefs = []
  235. cc = CCompiler()
  236. tmp_fd_cpp, tmp_name_cpp = tempfile.mkstemp(prefix='g-ir-cpp-', suffix='.c')
  237. with os.fdopen(tmp_fd_cpp, 'wb') as fp_cpp:
  238. self._write_preprocess_src(fp_cpp, defines, undefs, filenames)
  239. tmpfile_basename = os.path.basename(os.path.splitext(tmp_name_cpp)[0])
  240. # Output file name of the preprocessor, only really used on non-MSVC,
  241. # so we want the name to match the output file name of the MSVC preprocessor
  242. tmpfile_output = tmpfile_basename + '.i'
  243. cc.preprocess(tmp_name_cpp,
  244. tmpfile_output,
  245. self._cpp_options)
  246. os.unlink(tmp_name_cpp)
  247. fp = open(tmpfile_output, 'r')
  248. self._scanner.parse_file(fp.fileno())
  249. fp.close()
  250. os.unlink(tmpfile_output)
  251. def _write_preprocess_src(self, fp, defines, undefs, filenames):
  252. # Write to the temp file for feeding into the preprocessor
  253. for define in defines:
  254. fp.write(('#ifndef %s\n' % (define, )).encode())
  255. fp.write(('# define %s\n' % (define, )).encode())
  256. fp.write('#endif\n'.encode())
  257. for undef in undefs:
  258. fp.write(('#undef %s\n' % (undef, )).encode())
  259. for filename in filenames:
  260. fp.write(('#include <%s>\n' % (filename, )).encode())