blob: 98db1e2557d37f26e0f0d49bfbe68524f0fc0d7a [file] [log] [blame]
Jeremy Hylton816e1492001-03-22 23:32:22 +00001"""Interface to the compiler's internal symbol tables"""
Jeremy Hylton816e1492001-03-22 23:32:22 +00002
3import _symtable
Pablo Galindod5b4f1b2018-10-20 01:46:00 +01004from _symtable import (USE, DEF_GLOBAL, DEF_NONLOCAL, DEF_LOCAL, DEF_PARAM,
Yury Selivanovf8cb8a12016-09-08 20:50:03 -07005 DEF_IMPORT, DEF_BOUND, DEF_ANNOT, SCOPE_OFF, SCOPE_MASK, FREE,
Benjamin Peterson500c6ef2009-06-28 19:30:36 +00006 LOCAL, GLOBAL_IMPLICIT, GLOBAL_EXPLICIT, CELL)
Jeremy Hylton816e1492001-03-22 23:32:22 +00007
8import weakref
9
Benjamin Peterson3938a902008-08-20 02:33:00 +000010__all__ = ["symtable", "SymbolTable", "Class", "Function", "Symbol"]
Jeremy Hylton816e1492001-03-22 23:32:22 +000011
def symtable(code, filename, compile_type):
    """Build the symbol tables for *code* and return the toplevel one.

    *filename* is the name of the file the code comes from and
    *compile_type* is the mode argument, as for *compile()*.  Both are
    handed to the low-level ``_symtable.symtable()`` call; the raw result
    is wrapped through the shared ``_newSymbolTable`` factory.
    """
    return _newSymbolTable(
        _symtable.symtable(code, filename, compile_type), filename)
Jeremy Hylton816e1492001-03-22 23:32:22 +000020
class SymbolTableFactory:
    """Create wrapper objects for raw tables, reusing live ones.

    Wrappers are remembered in a weak-value dictionary keyed by
    ``(table, filename)``, so asking twice for the same pair returns the
    same object for as long as something else keeps it alive.
    """

    def __init__(self):
        self.__memo = weakref.WeakValueDictionary()

    def new(self, table, filename):
        """Return a fresh wrapper whose class matches ``table.type``."""
        kind = table.type
        if kind == _symtable.TYPE_FUNCTION:
            wrapper_cls = Function
        elif kind == _symtable.TYPE_CLASS:
            wrapper_cls = Class
        else:
            # Every other table type gets the generic wrapper.
            wrapper_cls = SymbolTable
        return wrapper_cls(table, filename)

    def __call__(self, table, filename):
        """Return the memoized wrapper for the pair, creating it if needed."""
        memo_key = (table, filename)
        cached = self.__memo.get(memo_key)
        if cached is not None:
            return cached
        created = self.new(table, filename)
        self.__memo[memo_key] = created
        return created


# Module-wide factory instance used to wrap raw tables.
_newSymbolTable = SymbolTableFactory()
Tim Petersa19a1682001-03-29 04:36:09 +000040
Jeremy Hylton816e1492001-03-22 23:32:22 +000041
class SymbolTable:
    """Python-level view of one raw symbol table produced by ``_symtable``.

    Wraps the raw table object together with the filename it was compiled
    from, and lazily creates *Symbol* objects for the names it contains.
    """

    def __init__(self, raw_table, filename):
        """Wrap *raw_table*, remembering the *filename* it belongs to."""
        self._table = raw_table
        self._filename = filename
        # Cache of Symbol instances built by lookup(), keyed by name.
        self._symbols = {}

    def __repr__(self):
        """Return a short description naming the table kind, scope and file."""
        # Subclasses put their own class name in front of "SymbolTable".
        if self.__class__ == SymbolTable:
            kind = ""
        else:
            kind = "%s " % self.__class__.__name__

        if self._table.name == "top":
            return "<{0}SymbolTable for module {1}>".format(kind, self._filename)
        return "<{0}SymbolTable for {1} in {2}>".format(kind,
                                                         self._table.name,
                                                         self._filename)

    def get_type(self):
        """Return the type of the symbol table.

        The values returned are 'class', 'module' and
        'function'.

        Raises AssertionError if the raw table has any other type.
        """
        table_type = self._table.type
        if table_type == _symtable.TYPE_MODULE:
            return "module"
        if table_type == _symtable.TYPE_FUNCTION:
            return "function"
        if table_type == _symtable.TYPE_CLASS:
            return "class"
        # Reaching this point means the type matched none of the known
        # constants.  Raise explicitly (same exception type as the former
        # assert) so the failure is neither skipped under -O nor turned
        # into a silent None result.
        raise AssertionError("unexpected type: {0}".format(table_type))

    def get_id(self):
        """Return an identifier for the table.
        """
        return self._table.id

    def get_name(self):
        """Return the table's name.

        This corresponds to the name of the class, function
        or 'top' if the table is for a class, function or
        global respectively.
        """
        return self._table.name

    def get_lineno(self):
        """Return the number of the first line in the
        block for the table.
        """
        return self._table.lineno

    def is_optimized(self):
        """Return *True* if the locals in the table
        are optimizable.

        This is the case exactly when the table is a function table.
        """
        return bool(self._table.type == _symtable.TYPE_FUNCTION)

    def is_nested(self):
        """Return *True* if the block is a nested class
        or function."""
        return bool(self._table.nested)

    def has_children(self):
        """Return *True* if the block has nested namespaces.
        """
        return bool(self._table.children)

    def get_identifiers(self):
        """Return the names of the symbols in the table.

        The result is whatever ``keys()`` of the raw symbol mapping
        returns (a view for a dict), not a list.
        """
        return self._table.symbols.keys()

    def lookup(self, name):
        """Lookup a *name* in the table.

        Returns a *Symbol* instance.  The instance is created on first
        request and cached, so repeated lookups return the same object.
        A name missing from the raw symbol mapping propagates that
        mapping's lookup error.
        """
        sym = self._symbols.get(name)
        if sym is None:
            flags = self._table.symbols[name]
            namespaces = self.__check_children(name)
            # Symbols of the toplevel table are flagged as module scope.
            module_scope = (self._table.name == "top")
            sym = self._symbols[name] = Symbol(name, flags, namespaces,
                                               module_scope=module_scope)
        return sym

    def get_symbols(self):
        """Return a list of *Symbol* instances for
        names in the table.
        """
        return [self.lookup(ident) for ident in self.get_identifiers()]

    def __check_children(self, name):
        """Return wrappers for the child tables whose name equals *name*."""
        return [_newSymbolTable(st, self._filename)
                for st in self._table.children
                if st.name == name]

    def get_children(self):
        """Return a list of the nested symbol tables.
        """
        return [_newSymbolTable(st, self._filename)
                for st in self._table.children]
148
Benjamin Peterson55e00f22008-08-17 18:02:44 +0000149
class Function(SymbolTable):
    """Symbol table of a function, with lazily computed groups of names."""

    # Per-group caches; None means the group has not been computed yet.
    __params = None
    __locals = None
    __frees = None
    __globals = None
    __nonlocals = None

    def __idents_matching(self, test_func):
        """Return a tuple of the identifiers whose raw flags pass *test_func*."""
        selected = []
        for ident in self.get_identifiers():
            if test_func(self._table.symbols[ident]):
                selected.append(ident)
        return tuple(selected)

    def get_parameters(self):
        """Return a tuple of the names flagged as parameters.
        """
        if self.__params is None:
            def is_param(flags):
                return flags & DEF_PARAM
            self.__params = self.__idents_matching(is_param)
        return self.__params

    def get_locals(self):
        """Return a tuple of the names whose scope is LOCAL or CELL.
        """
        if self.__locals is None:
            local_scopes = (LOCAL, CELL)

            def is_local(flags):
                return ((flags >> SCOPE_OFF) & SCOPE_MASK) in local_scopes
            self.__locals = self.__idents_matching(is_local)
        return self.__locals

    def get_globals(self):
        """Return a tuple of the names whose scope is implicitly or
        explicitly global.
        """
        if self.__globals is None:
            global_scopes = (GLOBAL_IMPLICIT, GLOBAL_EXPLICIT)

            def is_global(flags):
                return ((flags >> SCOPE_OFF) & SCOPE_MASK) in global_scopes
            self.__globals = self.__idents_matching(is_global)
        return self.__globals

    def get_nonlocals(self):
        """Return a tuple of the names flagged as nonlocal.
        """
        if self.__nonlocals is None:
            def is_nonlocal(flags):
                return flags & DEF_NONLOCAL
            self.__nonlocals = self.__idents_matching(is_nonlocal)
        return self.__nonlocals

    def get_frees(self):
        """Return a tuple of the names whose scope is FREE.
        """
        if self.__frees is None:
            def is_free(flags):
                return ((flags >> SCOPE_OFF) & SCOPE_MASK) == FREE
            self.__frees = self.__idents_matching(is_free)
        return self.__frees
202
Benjamin Peterson55e00f22008-08-17 18:02:44 +0000203
class Class(SymbolTable):
    """Symbol table of a class body."""

    # Cached result of get_methods(); None until first requested.
    __methods = None

    def get_methods(self):
        """Return a tuple of the names of the tables nested in the class.

        Each child table name appears once, in first-seen order.  The
        tuple is computed on the first call and reused afterwards.
        """
        names = self.__methods
        if names is None:
            unique = dict.fromkeys(child.name for child in self._table.children)
            names = self.__methods = tuple(unique)
        return names
217
Benjamin Peterson55e00f22008-08-17 18:02:44 +0000218
class Symbol:
    """Information about one name as recorded in a single symbol table.

    *flags* is the raw integer stored for the name; the scope is decoded
    from it.  *namespaces* holds the nested tables bound to the name and
    *module_scope* records whether the name belongs to the toplevel table.
    """

    def __init__(self, name, flags, namespaces=None, *, module_scope=False):
        self.__name = name
        self.__flags = flags
        self.__scope = (flags >> SCOPE_OFF) & SCOPE_MASK # like PyST_GetScope()
        # A missing or empty value is normalised to an empty tuple.
        self.__namespaces = namespaces or ()
        self.__module_scope = module_scope

    def __repr__(self):
        return "<symbol {0!r}>".format(self.__name)

    def get_name(self):
        """Return a name of a symbol.
        """
        return self.__name

    def is_referenced(self):
        """Return *True* if the symbol is used in
        its block.
        """
        return bool(self.__flags & _symtable.USE)

    def is_parameter(self):
        """Return *True* if the symbol is a parameter.
        """
        return bool(self.__flags & DEF_PARAM)

    def is_global(self):
        """Return *True* if the symbol is global.

        That is, its scope is implicitly or explicitly global, or it is
        bound in a module-scope table.
        """
        return bool(self.__scope in (GLOBAL_IMPLICIT, GLOBAL_EXPLICIT)
                    or (self.__module_scope and self.__flags & DEF_BOUND))

    def is_nonlocal(self):
        """Return *True* if the symbol is nonlocal."""
        return bool(self.__flags & DEF_NONLOCAL)

    def is_declared_global(self):
        """Return *True* if the symbol is declared global
        with a global statement."""
        return bool(self.__scope == GLOBAL_EXPLICIT)

    def is_local(self):
        """Return *True* if the symbol is local.

        That is, its scope is LOCAL or CELL, or it is bound in a
        module-scope table.
        """
        return bool(self.__scope in (LOCAL, CELL)
                    or (self.__module_scope and self.__flags & DEF_BOUND))

    def is_annotated(self):
        """Return *True* if the symbol is annotated.
        """
        return bool(self.__flags & DEF_ANNOT)

    def is_free(self):
        """Return *True* if a referenced symbol is
        not assigned to.
        """
        return bool(self.__scope == FREE)

    def is_imported(self):
        """Return *True* if the symbol is created from
        an import statement.
        """
        return bool(self.__flags & DEF_IMPORT)

    def is_assigned(self):
        """Return *True* if a symbol is assigned to."""
        return bool(self.__flags & DEF_LOCAL)

    def is_namespace(self):
        """Returns *True* if name binding introduces new namespace.

        If the name is used as the target of a function or class
        statement, this will be true.

        Note that a single name can be bound to multiple objects.  If
        is_namespace() is true, the name may also be bound to other
        objects, like an int or list, that does not introduce a new
        namespace.
        """
        return bool(self.__namespaces)

    def get_namespaces(self):
        """Return the sequence of namespaces bound to this name.

        This is the value given at construction, or an empty tuple when
        none was given.
        """
        return self.__namespaces

    def get_namespace(self):
        """Return the single namespace bound to this name.

        Raises ValueError if the name is bound to multiple namespaces
        or to none at all.
        """
        count = len(self.__namespaces)
        if count == 0:
            # Distinguish "nothing bound" from "too many bound" so the
            # message matches the actual situation.
            raise ValueError("name is not bound to any namespaces")
        if count > 1:
            raise ValueError("name is bound to multiple namespaces")
        return self.__namespaces[0]
314
if __name__ == "__main__":
    # Demo: build the symbol table of this very script and print, for each
    # toplevel name, whether it is local and whether it is a namespace.
    import os
    import sys

    script_path = sys.argv[0]
    with open(script_path) as source_file:
        source_text = source_file.read()
    module_table = symtable(source_text, os.path.basename(script_path), "exec")
    for identifier in module_table.get_identifiers():
        symbol = module_table.lookup(identifier)
        print(symbol, symbol.is_local(), symbol.is_namespace())