1 """Module symbol-table generator"""
3 from compiler
import ast
4 from compiler
.consts
import SC_LOCAL
, SC_GLOBAL
, SC_FREE
, SC_CELL
, SC_UNKNOWN
5 from compiler
.misc
import mangle
14 # XXX how much information do I need about each name?
15 def __init__(self
, name
, module
, klass
=None):
25 # nested is true if the class could contain free variables,
26 # i.e. if it is nested within another function.
31 for i
in range(len(klass
)):
33 self
.klass
= klass
[i
:]
37 return "<%s: %s>" % (self
.__class
__.__name
__, self
.name
)
39 def mangle(self
, name
):
40 if self
.klass
is None:
42 return mangle(name
, self
.klass
)
def add_def(self, name):
    """Record *name* as defined (bound) in this scope.

    The name is first passed through ``self.mangle``; the result is
    stored as a key of the ``self.defs`` table with the value 1.
    """
    mangled = self.mangle(name)
    self.defs[mangled] = 1
def add_use(self, name):
    """Record *name* as used (referenced) in this scope.

    The name is first passed through ``self.mangle``; the result is
    stored as a key of the ``self.uses`` table with the value 1.
    """
    mangled = self.mangle(name)
    self.uses[mangled] = 1
def add_global(self, name):
    """Record *name* as declared global in this scope.

    The name is mangled with ``self.mangle``, entered into
    ``self.globals``, and also registered as a definition on the
    owning module scope via ``self.module.add_def``.

    Raises:
        SyntaxError: if the mangled name is already one of this
            scope's parameters (a key of ``self.params``).
    """
    name = self.mangle(name)
    # Membership tests use ``in`` rather than ``dict.has_key`` so the
    # method works on any Python that supports ``in`` for dicts.
    if name in self.uses or name in self.defs:
        pass  # XXX warn about global following def/use
    if name in self.params:
        # Call-style raise is valid on both Python 2 and Python 3.
        raise SyntaxError("%s in %s is global and parameter" %
                          (name, self.name))
    self.globals[name] = 1
    self.module.add_def(name)
60 def add_param(self
, name
):
61 name
= self
.mangle(name
)
69 d
.update(self
.globals)
def add_child(self, child):
    """Append *child* to this scope's ``children`` list."""
    nested_scopes = self.children
    nested_scopes.append(child)
75 def get_children(self
):
79 print >> sys
.stderr
, self
.name
, self
.nested
and "nested" or ""
80 print >> sys
.stderr
, "\tglobals: ", self
.globals
81 print >> sys
.stderr
, "\tcells: ", self
.cells
82 print >> sys
.stderr
, "\tdefs: ", self
.defs
83 print >> sys
.stderr
, "\tuses: ", self
.uses
84 print >> sys
.stderr
, "\tfrees:", self
.frees
86 def check_name(self
, name
):
87 """Return scope of name.
89 The scope of a name could be LOCAL, GLOBAL, FREE, or CELL.
91 if self
.globals.has_key(name
):
93 if self
.cells
.has_key(name
):
95 if self
.defs
.has_key(name
):
97 if self
.nested
and (self
.frees
.has_key(name
) or
98 self
.uses
.has_key(name
)):
105 def get_free_vars(self
):
109 free
.update(self
.frees
)
110 for name
in self
.uses
.keys():
111 if not (self
.defs
.has_key(name
) or
112 self
.globals.has_key(name
)):
116 def handle_children(self
):
117 for child
in self
.children
:
118 frees
= child
.get_free_vars()
119 globals = self
.add_frees(frees
)
121 child
.force_global(name
)
123 def force_global(self
, name
):
124 """Force name to be global in scope.
126 Some child of the current node had a free reference to name.
127 When the child was processed, it was labelled a free
128 variable. Now that all its enclosing scope have been
129 processed, the name is known to be a global or builtin. So
130 walk back down the child chain and set the name to be global
133 Be careful to stop if a child does not think the name is
136 self
.globals[name
] = 1
137 if self
.frees
.has_key(name
):
139 for child
in self
.children
:
140 if child
.check_name(name
) == SC_FREE
:
141 child
.force_global(name
)
143 def add_frees(self
, names
):
144 """Process list of free vars from nested scope.
146 Returns a list of names that are either 1) declared global in the
147 parent or 2) undefined in a top-level parent. In either case,
148 the nested scope should treat them as globals.
152 sc
= self
.check_name(name
)
154 if sc
== SC_UNKNOWN
or sc
== SC_FREE \
155 or isinstance(self
, ClassScope
):
157 elif sc
== SC_GLOBAL
:
158 child_globals
.append(name
)
159 elif isinstance(self
, FunctionScope
) and sc
== SC_LOCAL
:
162 child_globals
.append(name
)
167 child_globals
.append(name
)
def get_cell_vars(self):
    """Return the keys of this scope's ``cells`` table."""
    cell_table = self.cells
    return cell_table.keys()
173 class ModuleScope(Scope
):
174 __super_init
= Scope
.__init
__
177 self
.__super
_init
("global", self
)
179 class FunctionScope(Scope
):
182 class LambdaScope(FunctionScope
):
183 __super_init
= Scope
.__init
__
187 def __init__(self
, module
, klass
=None):
190 self
.__super
_init
("lambda.%d" % i
, module
, klass
)
class ClassScope(Scope):
    """Scope object for a class body.

    The class name is handed to ``Scope.__init__`` twice: once as the
    scope's name and once as its ``klass`` argument.
    """

    # Private alias for the base-class initializer.
    __super_init = Scope.__init__

    def __init__(self, name, module):
        self.__super_init(name, module, klass=name)
# nodes that define new scopes
def visitModule(self, node):
    """Create the module-level scope and visit the module body in it.

    A new ``ModuleScope`` is stored as ``self.module`` and registered
    in ``self.scopes`` under *node*; ``node.node`` is then visited
    with that scope.
    """
    top_scope = ModuleScope()
    self.module = top_scope
    self.scopes[node] = top_scope
    self.visit(node.node, top_scope)

# Expression nodes are handled exactly like Module nodes.
visitExpression = visitModule
211 def visitFunction(self
, node
, parent
):
212 parent
.add_def(node
.name
)
213 for n
in node
.defaults
:
214 self
.visit(n
, parent
)
215 scope
= FunctionScope(node
.name
, self
.module
, self
.klass
)
216 if parent
.nested
or isinstance(parent
, FunctionScope
):
218 self
.scopes
[node
] = scope
219 self
._do
_args
(scope
, node
.argnames
)
220 self
.visit(node
.code
, scope
)
221 self
.handle_free_vars(scope
, parent
)
223 def visitLambda(self
, node
, parent
):
224 for n
in node
.defaults
:
225 self
.visit(n
, parent
)
226 scope
= LambdaScope(self
.module
, self
.klass
)
227 if parent
.nested
or isinstance(parent
, FunctionScope
):
229 self
.scopes
[node
] = scope
230 self
._do
_args
(scope
, node
.argnames
)
231 self
.visit(node
.code
, scope
)
232 self
.handle_free_vars(scope
, parent
)
234 def _do_args(self
, scope
, args
):
236 if type(name
) == types
.TupleType
:
237 self
._do
_args
(scope
, name
)
239 scope
.add_param(name
)
def handle_free_vars(self, scope, parent):
    """Attach *scope* to *parent*, then let *scope* process its children.

    *scope* is registered with ``parent.add_child`` first; afterwards
    ``scope.handle_children()`` is invoked.
    """
    register = parent.add_child
    register(scope)
    scope.handle_children()
245 def visitClass(self
, node
, parent
):
246 parent
.add_def(node
.name
)
248 self
.visit(n
, parent
)
249 scope
= ClassScope(node
.name
, self
.module
)
250 if parent
.nested
or isinstance(parent
, FunctionScope
):
252 if node
.doc
is not None:
253 scope
.add_def('__doc__')
254 self
.scopes
[node
] = scope
256 self
.klass
= node
.name
257 self
.visit(node
.code
, scope
)
259 self
.handle_free_vars(scope
, parent
)
261 # name can be a def or a use
263 # XXX a few calls and nodes expect a third "assign" arg that is
264 # true if the name is being used as an assignment. only
265 # expressions contained within statements may have the assign arg.
267 def visitName(self
, node
, scope
, assign
=0):
269 scope
.add_def(node
.name
)
271 scope
.add_use(node
.name
)
273 # operations that bind new names
275 def visitFor(self
, node
, scope
):
276 self
.visit(node
.assign
, scope
, 1)
277 self
.visit(node
.list, scope
)
278 self
.visit(node
.body
, scope
)
280 self
.visit(node
.else_
, scope
)
282 def visitFrom(self
, node
, scope
):
283 for name
, asname
in node
.names
:
286 scope
.add_def(asname
or name
)
288 def visitImport(self
, node
, scope
):
289 for name
, asname
in node
.names
:
293 scope
.add_def(asname
or name
)
def visitGlobal(self, node, scope):
    """Declare every name listed in *node*.names as global in *scope*.

    Each name is passed, in order, to ``scope.add_global``.
    """
    for global_name in node.names:
        scope.add_global(global_name)
299 def visitAssign(self
, node
, scope
):
300 """Propagate assignment flag down to child nodes.
302 The Assign node doesn't itself contains the variables being
303 assigned to. Instead, the children in node.nodes are visited
304 with the assign flag set to true. When the names occur in
305 those nodes, they are marked as defs.
307 Some names that occur in an assignment target are not bound by
308 the assignment, e.g. a name occurring inside a slice. The
309 visitor handles these nodes specially; they do not propagate
310 the assign flag to their children.
313 self
.visit(n
, scope
, 1)
314 self
.visit(node
.expr
, scope
)
def visitAssName(self, node, scope, assign=1):
    """Record the assigned name ``node.name`` as a definition in *scope*.

    The *assign* flag is accepted but not consulted; the name is
    always passed to ``scope.add_def``.
    """
    bound_name = node.name
    scope.add_def(bound_name)
def visitAssAttr(self, node, scope, assign=0):
    """Visit the object expression of an attribute-assignment node.

    ``node.expr`` is visited with an assign flag of 0 regardless of
    the *assign* value this method receives.
    """
    owner_expr = node.expr
    self.visit(owner_expr, scope, 0)
322 def visitSubscript(self
, node
, scope
, assign
=0):
323 self
.visit(node
.expr
, scope
, 0)
325 self
.visit(n
, scope
, 0)
327 def visitSlice(self
, node
, scope
, assign
=0):
328 self
.visit(node
.expr
, scope
, 0)
330 self
.visit(node
.lower
, scope
, 0)
332 self
.visit(node
.upper
, scope
, 0)
def visitAugAssign(self, node, scope):
    """Visit both sides of an augmented assignment.

    The target ``node.node`` is always visited once without an assign
    flag. When the target is an ``ast.Name`` it is visited a second
    time with the flag set to 1. ``node.expr`` is visited last.
    """
    target = node.node
    # If the LHS is a name, then this counts as assignment.
    # Otherwise, it's just use.
    self.visit(target, scope)
    target_is_name = isinstance(target, ast.Name)
    if target_is_name:
        self.visit(target, scope, 1) # XXX worry about this
    self.visit(node.expr, scope)
342 # prune if statements if tests are false
344 _const_types
= types
.StringType
, types
.IntType
, types
.FloatType
346 def visitIf(self
, node
, scope
):
347 for test
, body
in node
.tests
:
348 if isinstance(test
, ast
.Const
):
349 if type(test
.value
) in self
._const
_types
:
352 self
.visit(test
, scope
)
353 self
.visit(body
, scope
)
355 self
.visit(node
.else_
, scope
)
357 # a yield statement signals a generator
359 def visitYield(self
, node
, scope
):
361 self
.visit(node
.value
, scope
)
369 return sort(l1
) == sort(l2
)
371 if __name__
== "__main__":
373 from compiler
import parseFile
, walk
377 return [s
for s
in [s
.get_name() for s
in syms
.get_symbols()]
378 if not (s
.startswith('_[') or s
.startswith('.'))]
380 for file in sys
.argv
[1:]:
385 syms
= symtable
.symtable(buf
, file, "exec")
386 mod_names
= get_names(syms
)
387 tree
= parseFile(file)
391 # compare module-level symbols
392 names2
= s
.scopes
[tree
].get_names()
394 if not list_eq(mod_names
, names2
):
397 print sort(mod_names
)
407 for s
in syms
.get_symbols():
409 l
= [sc
for sc
in scopes
410 if sc
.name
== s
.get_name()]
412 print "skipping", s
.get_name()
414 if not list_eq(get_names(s
.get_namespace()),
417 print sort(get_names(s
.get_namespace()))
418 print sort(l
[0].get_names())