1 """Module symbol-table generator""" 2 3 from compiler import ast 4 from compiler.consts import SC_LOCAL, SC_GLOBAL_IMPLICIT, SC_GLOBAL_EXPLICIT, \ 5 SC_FREE, SC_CELL, SC_UNKNOWN 6 from compiler.misc import mangle 7 import types 8 9 10 import sys 11 12 MANGLE_LEN = 256 13 14 class Scope: 15 # XXX how much information do I need about each name? 16 def __init__(self, name, module, klass=None): 17 self.name = name 18 self.module = module 19 self.defs = {} 20 self.uses = {} 21 self.globals = {} 22 self.params = {} 23 self.frees = {} 24 self.cells = {} 25 self.children = [] 26 # nested is true if the class could contain free variables, 27 # i.e. if it is nested within another function. 28 self.nested = None 29 self.generator = None 30 self.klass = None 31 if klass is not None: 32 for i in range(len(klass)): 33 if klass[i] != '_': 34 self.klass = klass[i:] 35 break 36 37 def __repr__(self): 38 return "<%s: %s>" % (self.__class__.__name__, self.name) 39 40 def mangle(self, name): 41 if self.klass is None: 42 return name 43 return mangle(name, self.klass) 44 45 def add_def(self, name): 46 self.defs[self.mangle(name)] = 1 47 48 def add_use(self, name): 49 self.uses[self.mangle(name)] = 1 50 51 def add_global(self, name): 52 name = self.mangle(name) 53 if name in self.uses or name in self.defs: 54 pass # XXX warn about global following def/use 55 if name in self.params: 56 raise SyntaxError, "%s in %s is global and parameter" % \ 57 (name, self.name) 58 self.globals[name] = 1 59 self.module.add_def(name) 60 61 def add_param(self, name): 62 name = self.mangle(name) 63 self.defs[name] = 1 64 self.params[name] = 1 65 66 def get_names(self): 67 d = {} 68 d.update(self.defs) 69 d.update(self.uses) 70 d.update(self.globals) 71 return d.keys() 72 73 def add_child(self, child): 74 self.children.append(child) 75 76 def get_children(self): 77 return self.children 78 79 def DEBUG(self): 80 print >> sys.stderr, self.name, self.nested and "nested" or "" 81 print >> sys.stderr, "\tglobals: ", self.globals 82 print >> sys.stderr, "\tcells: ", self.cells 83 print >> sys.stderr, "\tdefs: ", self.defs 84 print >> sys.stderr, "\tuses: ", self.uses 85 print >> sys.stderr, "\tfrees:", self.frees 86 87 def check_name(self, name): 88 """Return scope of name. 89 90 The scope of a name could be LOCAL, GLOBAL, FREE, or CELL. 91 """ 92 if name in self.globals: 93 return SC_GLOBAL_EXPLICIT 94 if name in self.cells: 95 return SC_CELL 96 if name in self.defs: 97 return SC_LOCAL 98 if self.nested and (name in self.frees or name in self.uses): 99 return SC_FREE 100 if self.nested: 101 return SC_UNKNOWN 102 else: 103 return SC_GLOBAL_IMPLICIT 104 105 def get_free_vars(self): 106 if not self.nested: 107 return () 108 free = {} 109 free.update(self.frees) 110 for name in self.uses.keys(): 111 if name not in self.defs and name not in self.globals: 112 free[name] = 1 113 return free.keys() 114 115 def handle_children(self): 116 for child in self.children: 117 frees = child.get_free_vars() 118 globals = self.add_frees(frees) 119 for name in globals: 120 child.force_global(name) 121 122 def force_global(self, name): 123 """Force name to be global in scope. 124 125 Some child of the current node had a free reference to name. 126 When the child was processed, it was labelled a free 127 variable. Now that all its enclosing scope have been 128 processed, the name is known to be a global or builtin. So 129 walk back down the child chain and set the name to be global 130 rather than free. 131 132 Be careful to stop if a child does not think the name is 133 free. 134 """ 135 self.globals[name] = 1 136 if name in self.frees: 137 del self.frees[name] 138 for child in self.children: 139 if child.check_name(name) == SC_FREE: 140 child.force_global(name) 141 142 def add_frees(self, names): 143 """Process list of free vars from nested scope. 144 145 Returns a list of names that are either 1) declared global in the 146 parent or 2) undefined in a top-level parent. In either case, 147 the nested scope should treat them as globals. 148 """ 149 child_globals = [] 150 for name in names: 151 sc = self.check_name(name) 152 if self.nested: 153 if sc == SC_UNKNOWN or sc == SC_FREE \ 154 or isinstance(self, ClassScope): 155 self.frees[name] = 1 156 elif sc == SC_GLOBAL_IMPLICIT: 157 child_globals.append(name) 158 elif isinstance(self, FunctionScope) and sc == SC_LOCAL: 159 self.cells[name] = 1 160 elif sc != SC_CELL: 161 child_globals.append(name) 162 else: 163 if sc == SC_LOCAL: 164 self.cells[name] = 1 165 elif sc != SC_CELL: 166 child_globals.append(name) 167 return child_globals 168 169 def get_cell_vars(self): 170 return self.cells.keys() 171 172 class ModuleScope(Scope): 173 __super_init = Scope.__init__ 174 175 def __init__(self): 176 self.__super_init("global", self) 177 178 class FunctionScope(Scope): 179 pass 180 181 class GenExprScope(Scope): 182 __super_init = Scope.__init__ 183 184 __counter = 1 185 186 def __init__(self, module, klass=None): 187 i = self.__counter 188 self.__counter += 1 189 self.__super_init("generator expression<%d>"%i, module, klass) 190 self.add_param('.0') 191 192 def get_names(self): 193 keys = Scope.get_names(self) 194 return keys 195 196 class LambdaScope(FunctionScope): 197 __super_init = Scope.__init__ 198 199 __counter = 1 200 201 def __init__(self, module, klass=None): 202 i = self.__counter 203 self.__counter += 1 204 self.__super_init("lambda.%d" % i, module, klass) 205 206 class ClassScope(Scope): 207 __super_init = Scope.__init__ 208 209 def __init__(self, name, module): 210 self.__super_init(name, module, name) 211 212 class SymbolVisitor: 213 def __init__(self): 214 self.scopes = {} 215 self.klass = None 216 217 # node that define new scopes 218 219 def visitModule(self, node): 220 scope = self.module = self.scopes[node] = ModuleScope() 221 self.visit(node.node, scope) 222 223 visitExpression = visitModule 224 225 def visitFunction(self, node, parent): 226 if node.decorators: 227 self.visit(node.decorators, parent) 228 parent.add_def(node.name) 229 for n in node.defaults: 230 self.visit(n, parent) 231 scope = FunctionScope(node.name, self.module, self.klass) 232 if parent.nested or isinstance(parent, FunctionScope): 233 scope.nested = 1 234 self.scopes[node] = scope 235 self._do_args(scope, node.argnames) 236 self.visit(node.code, scope) 237 self.handle_free_vars(scope, parent) 238 239 def visitGenExpr(self, node, parent): 240 scope = GenExprScope(self.module, self.klass); 241 if parent.nested or isinstance(parent, FunctionScope) \ 242 or isinstance(parent, GenExprScope): 243 scope.nested = 1 244 245 self.scopes[node] = scope 246 self.visit(node.code, scope) 247 248 self.handle_free_vars(scope, parent) 249 250 def visitGenExprInner(self, node, scope): 251 for genfor in node.quals: 252 self.visit(genfor, scope) 253 254 self.visit(node.expr, scope) 255 256 def visitGenExprFor(self, node, scope): 257 self.visit(node.assign, scope, 1) 258 self.visit(node.iter, scope) 259 for if_ in node.ifs: 260 self.visit(if_, scope) 261 262 def visitGenExprIf(self, node, scope): 263 self.visit(node.test, scope) 264 265 def visitLambda(self, node, parent, assign=0): 266 # Lambda is an expression, so it could appear in an expression 267 # context where assign is passed. The transformer should catch 268 # any code that has a lambda on the left-hand side. 269 assert not assign 270 271 for n in node.defaults: 272 self.visit(n, parent) 273 scope = LambdaScope(self.module, self.klass) 274 if parent.nested or isinstance(parent, FunctionScope): 275 scope.nested = 1 276 self.scopes[node] = scope 277 self._do_args(scope, node.argnames) 278 self.visit(node.code, scope) 279 self.handle_free_vars(scope, parent) 280 281 def _do_args(self, scope, args): 282 for name in args: 283 if type(name) == types.TupleType: 284 self._do_args(scope, name) 285 else: 286 scope.add_param(name) 287 288 def handle_free_vars(self, scope, parent): 289 parent.add_child(scope) 290 scope.handle_children() 291 292 def visitClass(self, node, parent): 293 parent.add_def(node.name) 294 for n in node.bases: 295 self.visit(n, parent) 296 scope = ClassScope(node.name, self.module) 297 if parent.nested or isinstance(parent, FunctionScope): 298 scope.nested = 1 299 if node.doc is not None: 300 scope.add_def('__doc__') 301 scope.add_def('__module__') 302 self.scopes[node] = scope 303 prev = self.klass 304 self.klass = node.name 305 self.visit(node.code, scope) 306 self.klass = prev 307 self.handle_free_vars(scope, parent) 308 309 # name can be a def or a use 310 311 # XXX a few calls and nodes expect a third "assign" arg that is 312 # true if the name is being used as an assignment. only 313 # expressions contained within statements may have the assign arg. 314 315 def visitName(self, node, scope, assign=0): 316 if assign: 317 scope.add_def(node.name) 318 else: 319 scope.add_use(node.name) 320 321 # operations that bind new names 322 323 def visitFor(self, node, scope): 324 self.visit(node.assign, scope, 1) 325 self.visit(node.list, scope) 326 self.visit(node.body, scope) 327 if node.else_: 328 self.visit(node.else_, scope) 329 330 def visitFrom(self, node, scope): 331 for name, asname in node.names: 332 if name == "*": 333 continue 334 scope.add_def(asname or name) 335 336 def visitImport(self, node, scope): 337 for name, asname in node.names: 338 i = name.find(".") 339 if i > -1: 340 name = name[:i] 341 scope.add_def(asname or name) 342 343 def visitGlobal(self, node, scope): 344 for name in node.names: 345 scope.add_global(name) 346 347 def visitAssign(self, node, scope): 348 """Propagate assignment flag down to child nodes. 349 350 The Assign node doesn't itself contains the variables being 351 assigned to. Instead, the children in node.nodes are visited 352 with the assign flag set to true. When the names occur in 353 those nodes, they are marked as defs. 354 355 Some names that occur in an assignment target are not bound by 356 the assignment, e.g. a name occurring inside a slice. The 357 visitor handles these nodes specially; they do not propagate 358 the assign flag to their children. 359 """ 360 for n in node.nodes: 361 self.visit(n, scope, 1) 362 self.visit(node.expr, scope) 363 364 def visitAssName(self, node, scope, assign=1): 365 scope.add_def(node.name) 366 367 def visitAssAttr(self, node, scope, assign=0): 368 self.visit(node.expr, scope, 0) 369 370 def visitSubscript(self, node, scope, assign=0): 371 self.visit(node.expr, scope, 0) 372 for n in node.subs: 373 self.visit(n, scope, 0) 374 375 def visitSlice(self, node, scope, assign=0): 376 self.visit(node.expr, scope, 0) 377 if node.lower: 378 self.visit(node.lower, scope, 0) 379 if node.upper: 380 self.visit(node.upper, scope, 0) 381 382 def visitAugAssign(self, node, scope): 383 # If the LHS is a name, then this counts as assignment. 384 # Otherwise, it's just use. 385 self.visit(node.node, scope) 386 if isinstance(node.node, ast.Name): 387 self.visit(node.node, scope, 1) # XXX worry about this 388 self.visit(node.expr, scope) 389 390 # prune if statements if tests are false 391 392 _const_types = types.StringType, types.IntType, types.FloatType 393 394 def visitIf(self, node, scope): 395 for test, body in node.tests: 396 if isinstance(test, ast.Const): 397 if type(test.value) in self._const_types: 398 if not test.value: 399 continue 400 self.visit(test, scope) 401 self.visit(body, scope) 402 if node.else_: 403 self.visit(node.else_, scope) 404 405 # a yield statement signals a generator 406 407 def visitYield(self, node, scope): 408 scope.generator = 1 409 self.visit(node.value, scope) 410 411 def list_eq(l1, l2): 412 return sorted(l1) == sorted(l2) 413 414 if __name__ == "__main__": 415 import sys 416 from compiler import parseFile, walk 417 import symtable 418 419 def get_names(syms): 420 return [s for s in [s.get_name() for s in syms.get_symbols()] 421 if not (s.startswith('_[') or s.startswith('.'))] 422 423 for file in sys.argv[1:]: 424 print file 425 f = open(file) 426 buf = f.read() 427 f.close() 428 syms = symtable.symtable(buf, file, "exec") 429 mod_names = get_names(syms) 430 tree = parseFile(file) 431 s = SymbolVisitor() 432 walk(tree, s) 433 434 # compare module-level symbols 435 names2 = s.scopes[tree].get_names() 436 437 if not list_eq(mod_names, names2): 438 print 439 print "oops", file 440 print sorted(mod_names) 441 print sorted(names2) 442 sys.exit(-1) 443 444 d = {} 445 d.update(s.scopes) 446 del d[tree] 447 scopes = d.values() 448 del d 449 450 for s in syms.get_symbols(): 451 if s.is_namespace(): 452 l = [sc for sc in scopes 453 if sc.name == s.get_name()] 454 if len(l) > 1: 455 print "skipping", s.get_name() 456 else: 457 if not list_eq(get_names(s.get_namespace()), 458 l[0].get_names()): 459 print s.get_name() 460 print sorted(get_names(s.get_namespace())) 461 print sorted(l[0].get_names()) 462 sys.exit(-1) 463