blob: cde937b75355119c7bc291187bbdd2cedb3e7975 [file] [log] [blame]
Jeremy Hylton8b966dc2001-04-09 04:35:35 +00001"""Module symbol-table generator"""
2
3from compiler import ast
Jeremy Hylton364f9b92001-04-12 06:40:42 +00004from compiler.consts import SC_LOCAL, SC_GLOBAL, SC_FREE, SC_CELL, SC_UNKNOWN
Jeremy Hyltonf870c952001-04-09 13:57:32 +00005import types
Jeremy Hylton8b966dc2001-04-09 04:35:35 +00006
Jeremy Hylton364f9b92001-04-12 06:40:42 +00007import sys
8
Jeremy Hyltonf870c952001-04-09 13:57:32 +00009MANGLE_LEN = 256
Jeremy Hylton8b966dc2001-04-09 04:35:35 +000010
class Scope:
    """Symbol information collected for a single namespace.

    Each of defs, uses, globals, params, frees and cells is a dict used
    as a set (name -> 1).  Names are passed through mangle() before
    being recorded by the add_* methods.

    name     -- label for the scope, used in __repr__ and error messages
    module   -- scope that receives a definition for every name declared
                global here (see add_global)
    klass    -- name of the enclosing class, or None; leading
                underscores are dropped before it is stored
    children -- scopes registered through add_child()
    """
    # XXX how much information do I need about each name?
    def __init__(self, name, module, klass=None):
        self.name = name
        self.module = module
        self.defs = {}
        self.uses = {}
        self.globals = {}
        self.params = {}
        self.frees = {}
        self.cells = {}
        self.children = []
        # nested is true if the class could contain free variables,
        # i.e. if it is nested within another function.
        self.nested = None
        # Keep the class name without its leading underscores; a name
        # made only of underscores (or an empty one) leaves klass as
        # None, which turns mangling off.
        self.klass = None
        if klass is not None:
            self.klass = klass.lstrip('_') or None

    def __repr__(self):
        return "<%s: %s>" % (self.__class__.__name__, self.name)

    def mangle(self, name):
        """Return name with private-name mangling applied.

        The name is returned unchanged when the scope has no class
        name, when it does not start with two underscores, when
        len(name) + 2 reaches MANGLE_LEN, or when it also ends with two
        underscores.  Otherwise "_<klass>" is prepended.
        """
        if self.klass is None or not name.startswith('__'):
            return name
        if len(name) + 2 >= MANGLE_LEN or name.endswith('__'):
            return name
        return "_%s%s" % (self.klass, name)

    def add_def(self, name):
        """Record name as defined (bound) in this scope."""
        self.defs[self.mangle(name)] = 1

    def add_use(self, name):
        """Record name as referenced in this scope."""
        self.uses[self.mangle(name)] = 1

    def add_global(self, name):
        """Record name as declared global in this scope.

        The name is also added as a definition of self.module.  Raises
        SyntaxError if the name is already a parameter of this scope.
        """
        name = self.mangle(name)
        if name in self.uses or name in self.defs:
            pass # XXX warn about global following def/use
        if name in self.params:
            raise SyntaxError("%s in %s is global and parameter"
                              % (name, self.name))
        self.globals[name] = 1
        self.module.add_def(name)

    def add_param(self, name):
        """Record name as a parameter; parameters also count as defs."""
        name = self.mangle(name)
        self.defs[name] = 1
        self.params[name] = 1

    def get_names(self):
        """Return every name recorded in defs, uses or globals."""
        d = {}
        d.update(self.defs)
        d.update(self.uses)
        d.update(self.globals)
        return d.keys()

    def add_child(self, child):
        """Register child as a scope nested directly inside this one."""
        self.children.append(child)

    def get_children(self):
        """Return the list of registered child scopes (not a copy)."""
        return self.children

    def DEBUG(self):
        """Dump the scope's tables to stderr (currently disabled)."""
        # The early return switches the dump off; remove it to get the
        # output below.
        return
        print >> sys.stderr, self.name, self.nested and "nested" or ""
        print >> sys.stderr, "\tglobals: ", self.globals
        print >> sys.stderr, "\tcells: ", self.cells
        print >> sys.stderr, "\tdefs: ", self.defs
        print >> sys.stderr, "\tuses: ", self.uses
        print >> sys.stderr, "\tfrees:", self.frees

    def check_name(self, name):
        """Return scope of name.

        The scope of a name could be LOCAL, GLOBAL, FREE, or CELL.
        SC_UNKNOWN is returned for a name a nested scope has no record
        of; a scope that is not nested reports such names as GLOBAL.
        """
        # The order of these tests matters: an explicit global wins
        # over a cell, which wins over a plain local definition.
        if name in self.globals:
            return SC_GLOBAL
        if name in self.cells:
            return SC_CELL
        if name in self.defs:
            return SC_LOCAL
        if self.nested and (name in self.frees or name in self.uses):
            return SC_FREE
        if self.nested:
            return SC_UNKNOWN
        else:
            return SC_GLOBAL

    def get_free_vars(self):
        """Return the names this scope needs from an enclosing scope.

        A scope that is not nested has none and returns an empty tuple.
        Otherwise the result holds the recorded frees plus every used
        name that is neither defined nor declared global here.
        """
        if not self.nested:
            return ()
        free = {}
        free.update(self.frees)
        for name in self.uses.keys():
            if not (name in self.defs or name in self.globals):
                free[name] = 1
        return free.keys()

    def handle_children(self):
        """Resolve the free variables of every direct child scope.

        Names that add_frees() reports back are forced to be global in
        the child that asked for them.
        """
        for child in self.children:
            frees = child.get_free_vars()
            child_globals = self.add_frees(frees)
            for name in child_globals:
                child.force_global(name)

    def force_global(self, name):
        """Force name to be global in scope.

        Some child of the current node had a free reference to name.
        When the child was processed, it was labelled a free
        variable.  Now that all its enclosing scope have been
        processed, the name is known to be a global or builtin.  So
        walk back down the child chain and set the name to be global
        rather than free.

        Be careful to stop if a child does not think the name is
        free.
        """
        self.globals[name] = 1
        if name in self.frees:
            del self.frees[name]
        for child in self.children:
            if child.check_name(name) == SC_FREE:
                child.force_global(name)

    def add_frees(self, names):
        """Process list of free vars from nested scope.

        Returns a list of names that are either 1) declared global in the
        parent or 2) undefined in a top-level parent.  In either case,
        the nested scope should treat them as globals.
        """
        child_globals = []
        for name in names:
            sc = self.check_name(name)
            if self.nested:
                # A nested scope passes unresolved names further out;
                # a class scope does so for every name.
                if sc == SC_UNKNOWN or sc == SC_FREE \
                   or isinstance(self, ClassScope):
                    self.frees[name] = 1
                elif sc == SC_GLOBAL:
                    child_globals.append(name)
                elif isinstance(self, FunctionScope) and sc == SC_LOCAL:
                    # A local of this function used by a child becomes
                    # a cell variable.
                    self.cells[name] = 1
                else:
                    child_globals.append(name)
            else:
                if sc == SC_LOCAL:
                    self.cells[name] = 1
                else:
                    child_globals.append(name)
        return child_globals

    def get_cell_vars(self):
        """Return the names recorded as cell variables."""
        return self.cells.keys()
176
class ModuleScope(Scope):
    """Scope of the module itself.

    It is always named "global" and is passed to Scope.__init__ as its
    own module.
    """
    __super_init = Scope.__init__

    def __init__(self):
        self.__super_init(name="global", module=self)
Jeremy Hylton8b966dc2001-04-09 04:35:35 +0000182
class FunctionScope(Scope):
    """Scope of a function body.

    Adds nothing to Scope; the separate class lets other code pick out
    function scopes with isinstance().
    """
185
class LambdaScope(FunctionScope):
    """Function scope for a lambda, named "lambda.<n>".

    <n> comes from a counter shared by all instances, so each lambda
    scope created in a process gets a distinct name.
    """
    __super_init = Scope.__init__

    # Number handed to the next lambda scope.
    __counter = 1

    def __init__(self, module, klass=None):
        i = LambdaScope.__counter
        # Advance the class attribute itself.  "self.__counter += 1"
        # would only bind a new instance attribute and leave the shared
        # counter at 1, naming every lambda scope "lambda.1".
        LambdaScope.__counter = i + 1
        self.__super_init("lambda.%d" % i, module, klass)
Jeremy Hylton8b966dc2001-04-09 04:35:35 +0000195
class ClassScope(Scope):
    """Scope of a class body.

    The class name is passed to Scope.__init__ both as the scope name
    and as the class name used for private-name mangling.
    """
    __super_init = Scope.__init__

    def __init__(self, name, module):
        self.__super_init(name, module, klass=name)
Jeremy Hylton8b966dc2001-04-09 04:35:35 +0000201
class SymbolVisitor:
    """AST visitor that builds a Scope for each namespace-defining node.

    self.scopes maps the module, function, lambda and class nodes to
    their Scope objects.  self.klass holds the name of the class whose
    body is currently being visited, or None.

    The methods call self.visit(), which is not defined in this class;
    presumably the compiler's walk() machinery supplies it -- confirm
    against the caller.
    """

    def __init__(self):
        self.scopes = {}
        self.klass = None

    def _register_scope(self, node, scope, parent):
        # Flag scope as nested when its parent is nested or is a
        # function, then remember it under its defining node.
        if parent.nested or isinstance(parent, FunctionScope):
            scope.nested = 1
        self.scopes[node] = scope

    # node that define new scopes

    def visitModule(self, node):
        module_scope = ModuleScope()
        self.scopes[node] = module_scope
        self.module = module_scope
        self.visit(node.node, module_scope)

    def visitFunction(self, node, parent):
        # The function name and its default values belong to the
        # enclosing scope, not to the new one.
        parent.add_def(node.name)
        for default in node.defaults:
            self.visit(default, parent)
        func_scope = FunctionScope(node.name, self.module, self.klass)
        self._register_scope(node, func_scope, parent)
        self._do_args(func_scope, node.argnames)
        self.visit(node.code, func_scope)
        self.handle_free_vars(func_scope, parent)
        func_scope.DEBUG()

    def visitLambda(self, node, parent):
        for default in node.defaults:
            self.visit(default, parent)
        lambda_scope = LambdaScope(self.module, self.klass)
        self._register_scope(node, lambda_scope, parent)
        self._do_args(lambda_scope, node.argnames)
        self.visit(node.code, lambda_scope)
        self.handle_free_vars(lambda_scope, parent)

    def _do_args(self, scope, args):
        # Tuple entries are nested argument lists; flatten them.
        for arg in args:
            if type(arg) != types.TupleType:
                scope.add_param(arg)
            else:
                self._do_args(scope, arg)

    def handle_free_vars(self, scope, parent):
        """Attach scope to parent and resolve its children's free vars."""
        parent.add_child(scope)
        if not scope.children:
            return
        scope.DEBUG()
        scope.handle_children()

    def visitClass(self, node, parent):
        # The class name and its base expressions belong to the
        # enclosing scope.
        parent.add_def(node.name)
        for base in node.bases:
            self.visit(base, parent)
        class_scope = ClassScope(node.name, self.module)
        self._register_scope(node, class_scope, parent)
        # While the body is visited, new function and lambda scopes
        # pick up this class name for private-name mangling.
        enclosing_klass = self.klass
        self.klass = node.name
        self.visit(node.code, class_scope)
        self.klass = enclosing_klass
        self.handle_free_vars(class_scope, parent)

    # name can be a def or a use

    # XXX a few calls and nodes expect a third "assign" arg that is
    # true if the name is being used as an assignment.  only
    # expressions contained within statements may have the assign arg.

    def visitName(self, node, scope, assign=0):
        if not assign:
            scope.add_use(node.name)
        else:
            scope.add_def(node.name)

    # operations that bind new names

    def visitFor(self, node, scope):
        self.visit(node.assign, scope, 1)
        self.visit(node.list, scope)
        self.visit(node.body, scope)
        if node.else_:
            self.visit(node.else_, scope)

    def visitFrom(self, node, scope):
        for name, asname in node.names:
            # "from m import *" binds no name that is known here
            if name != "*":
                scope.add_def(asname or name)

    def visitImport(self, node, scope):
        for name, asname in node.names:
            # without an "as" clause, "import a.b" binds only "a"
            top_level = name.split(".", 1)[0]
            scope.add_def(asname or top_level)

    def visitAssName(self, node, scope, assign=1):
        scope.add_def(node.name)

    def visitAugAssign(self, node, scope):
        # basically, the node is referenced and defined by the same expr
        target = node.node
        self.visit(target, scope)
        self.visit(target, scope, 1)
        self.visit(node.expr, scope)

    def visitAssign(self, node, scope):
        for target in node.nodes:
            self.visit(target, scope, 1)
        self.visit(node.expr, scope)

    def visitGlobal(self, node, scope):
        for name in node.names:
            scope.add_global(name)

    # prune if statements if tests are false

    _const_types = types.StringType, types.IntType, types.FloatType

    def visitIf(self, node, scope):
        for test, body in node.tests:
            # Skip a branch whose test is a false string, int or float
            # constant: neither the test nor the body is visited.
            if (isinstance(test, ast.Const)
                    and type(test.value) in self._const_types
                    and not test.value):
                continue
            self.visit(test, scope)
            self.visit(body, scope)
        if node.else_:
            self.visit(node.else_, scope)
330
def sort(l):
    """Return a sorted copy of the list l, leaving l itself untouched."""
    ordered = l[:]
    ordered.sort()
    return ordered
335
def list_eq(l1, l2):
    """Return true if l1 and l2 hold the same items, ignoring order."""
    left = sort(l1)
    right = sort(l2)
    return left == right
338
if __name__ == "__main__":
    # Self-test: for every file named on the command line, compare the
    # names found by SymbolVisitor with those reported by the builtin
    # symtable module, and exit with -1 on the first mismatch.
    import sys
    from compiler import parseFile, walk
    import symtable

    def get_names(syms):
        # Symbol names of a symtable entry, minus those starting with
        # '_[' or '.'.
        all_names = [sym.get_name() for sym in syms.get_symbols()]
        return [name for name in all_names
                if not (name.startswith('_[') or name.startswith('.'))]

    for path in sys.argv[1:]:
        print(path)
        f = open(path)
        try:
            buf = f.read()
        finally:
            # close the file even if the read fails
            f.close()
        syms = symtable.symtable(buf, path, "exec")
        mod_names = get_names(syms)
        tree = parseFile(path)
        visitor = SymbolVisitor()
        walk(tree, visitor)

        # compare module-level symbols
        names2 = visitor.scopes[tree].get_names()

        if not list_eq(mod_names, names2):
            print("")
            print("oops %s" % path)
            print(sort(mod_names))
            print(sort(names2))
            sys.exit(-1)

        # every scope except the module's own
        d = {}
        d.update(visitor.scopes)
        del d[tree]
        scopes = d.values()
        del d

        for sym in syms.get_symbols():
            if not sym.is_namespace():
                continue
            matches = [sc for sc in scopes
                       if sc.name == sym.get_name()]
            # Only an unambiguous match can be compared.  Zero matches
            # (for instance a def inside a pruned "if 0:" branch) used
            # to crash with IndexError on matches[0].
            if len(matches) != 1:
                print("skipping %s" % sym.get_name())
                continue
            expected = get_names(sym.get_namespace())
            if not list_eq(expected, matches[0].get_names()):
                print(sym.get_name())
                print(sort(expected))
                print(sort(matches[0].get_names()))
                sys.exit(-1)