1 # -*- coding: utf-8 -*- 2 """ 3 ast 4 ~~~ 5 6 The `ast` module helps Python applications to process trees of the Python 7 abstract syntax grammar. The abstract syntax itself might change with 8 each Python release; this module helps to find out programmatically what 9 the current grammar looks like and allows modifications of it. 10 11 An abstract syntax tree can be generated by passing `ast.PyCF_ONLY_AST` as 12 a flag to the `compile()` builtin function or by using the `parse()` 13 function from this module. The result will be a tree of objects whose 14 classes all inherit from `ast.AST`. 15 16 A modified abstract syntax tree can be compiled into a Python code object 17 using the built-in `compile()` function. 18 19 Additionally various helper functions are provided that make working with 20 the trees simpler. The main intention of the helper functions and this 21 module in general is to provide an easy to use interface for libraries 22 that work tightly with the python syntax (template engines for example). 23 24 25 :copyright: Copyright 2008 by Armin Ronacher. 26 :license: Python License. 27 """ 28 from _ast import * 29 from _ast import __version__ 30 31 32 def parse(source, filename='<unknown>', mode='exec'): 33 """ 34 Parse the source into an AST node. 35 Equivalent to compile(source, filename, mode, PyCF_ONLY_AST). 36 """ 37 return compile(source, filename, mode, PyCF_ONLY_AST) 38 39 40 def literal_eval(node_or_string): 41 """ 42 Safely evaluate an expression node or a string containing a Python 43 expression. The string or node provided may only consist of the following 44 Python literal structures: strings, numbers, tuples, lists, dicts, booleans, 45 and None. 46 """ 47 _safe_names = {'None': None, 'True': True, 'False': False} 48 if isinstance(node_or_string, basestring): 49 node_or_string = parse(node_or_string, mode='eval') 50 if isinstance(node_or_string, Expression): 51 node_or_string = node_or_string.body 52 def _convert(node): 53 if isinstance(node, Str): 54 return node.s 55 elif isinstance(node, Num): 56 return node.n 57 elif isinstance(node, Tuple): 58 return tuple(map(_convert, node.elts)) 59 elif isinstance(node, List): 60 return list(map(_convert, node.elts)) 61 elif isinstance(node, Dict): 62 return dict((_convert(k), _convert(v)) for k, v 63 in zip(node.keys, node.values)) 64 elif isinstance(node, Name): 65 if node.id in _safe_names: 66 return _safe_names[node.id] 67 elif isinstance(node, BinOp) and \ 68 isinstance(node.op, (Add, Sub)) and \ 69 isinstance(node.right, Num) and \ 70 isinstance(node.right.n, complex) and \ 71 isinstance(node.left, Num) and \ 72 isinstance(node.left.n, (int, long, float)): 73 left = node.left.n 74 right = node.right.n 75 if isinstance(node.op, Add): 76 return left + right 77 else: 78 return left - right 79 raise ValueError('malformed string') 80 return _convert(node_or_string) 81 82 83 def dump(node, annotate_fields=True, include_attributes=False): 84 """ 85 Return a formatted dump of the tree in *node*. This is mainly useful for 86 debugging purposes. The returned string will show the names and the values 87 for fields. This makes the code impossible to evaluate, so if evaluation is 88 wanted *annotate_fields* must be set to False. Attributes such as line 89 numbers and column offsets are not dumped by default. If this is wanted, 90 *include_attributes* can be set to True. 91 """ 92 def _format(node): 93 if isinstance(node, AST): 94 fields = [(a, _format(b)) for a, b in iter_fields(node)] 95 rv = '%s(%s' % (node.__class__.__name__, ', '.join( 96 ('%s=%s' % field for field in fields) 97 if annotate_fields else 98 (b for a, b in fields) 99 )) 100 if include_attributes and node._attributes: 101 rv += fields and ', ' or ' ' 102 rv += ', '.join('%s=%s' % (a, _format(getattr(node, a))) 103 for a in node._attributes) 104 return rv + ')' 105 elif isinstance(node, list): 106 return '[%s]' % ', '.join(_format(x) for x in node) 107 return repr(node) 108 if not isinstance(node, AST): 109 raise TypeError('expected AST, got %r' % node.__class__.__name__) 110 return _format(node) 111 112 113 def copy_location(new_node, old_node): 114 """ 115 Copy source location (`lineno` and `col_offset` attributes) from 116 *old_node* to *new_node* if possible, and return *new_node*. 117 """ 118 for attr in 'lineno', 'col_offset': 119 if attr in old_node._attributes and attr in new_node._attributes \ 120 and hasattr(old_node, attr): 121 setattr(new_node, attr, getattr(old_node, attr)) 122 return new_node 123 124 125 def fix_missing_locations(node): 126 """ 127 When you compile a node tree with compile(), the compiler expects lineno and 128 col_offset attributes for every node that supports them. This is rather 129 tedious to fill in for generated nodes, so this helper adds these attributes 130 recursively where not already set, by setting them to the values of the 131 parent node. It works recursively starting at *node*. 132 """ 133 def _fix(node, lineno, col_offset): 134 if 'lineno' in node._attributes: 135 if not hasattr(node, 'lineno'): 136 node.lineno = lineno 137 else: 138 lineno = node.lineno 139 if 'col_offset' in node._attributes: 140 if not hasattr(node, 'col_offset'): 141 node.col_offset = col_offset 142 else: 143 col_offset = node.col_offset 144 for child in iter_child_nodes(node): 145 _fix(child, lineno, col_offset) 146 _fix(node, 1, 0) 147 return node 148 149 150 def increment_lineno(node, n=1): 151 """ 152 Increment the line number of each node in the tree starting at *node* by *n*. 153 This is useful to "move code" to a different location in a file. 154 """ 155 for child in walk(node): 156 if 'lineno' in child._attributes: 157 child.lineno = getattr(child, 'lineno', 0) + n 158 return node 159 160 161 def iter_fields(node): 162 """ 163 Yield a tuple of ``(fieldname, value)`` for each field in ``node._fields`` 164 that is present on *node*. 165 """ 166 for field in node._fields: 167 try: 168 yield field, getattr(node, field) 169 except AttributeError: 170 pass 171 172 173 def iter_child_nodes(node): 174 """ 175 Yield all direct child nodes of *node*, that is, all fields that are nodes 176 and all items of fields that are lists of nodes. 177 """ 178 for name, field in iter_fields(node): 179 if isinstance(field, AST): 180 yield field 181 elif isinstance(field, list): 182 for item in field: 183 if isinstance(item, AST): 184 yield item 185 186 187 def get_docstring(node, clean=True): 188 """ 189 Return the docstring for the given node or None if no docstring can 190 be found. If the node provided does not have docstrings a TypeError 191 will be raised. 192 """ 193 if not isinstance(node, (FunctionDef, ClassDef, Module)): 194 raise TypeError("%r can't have docstrings" % node.__class__.__name__) 195 if node.body and isinstance(node.body[0], Expr) and \ 196 isinstance(node.body[0].value, Str): 197 if clean: 198 import inspect 199 return inspect.cleandoc(node.body[0].value.s) 200 return node.body[0].value.s 201 202 203 def walk(node): 204 """ 205 Recursively yield all descendant nodes in the tree starting at *node* 206 (including *node* itself), in no specified order. This is useful if you 207 only want to modify nodes in place and don't care about the context. 208 """ 209 from collections import deque 210 todo = deque([node]) 211 while todo: 212 node = todo.popleft() 213 todo.extend(iter_child_nodes(node)) 214 yield node 215 216 217 class NodeVisitor(object): 218 """ 219 A node visitor base class that walks the abstract syntax tree and calls a 220 visitor function for every node found. This function may return a value 221 which is forwarded by the `visit` method. 222 223 This class is meant to be subclassed, with the subclass adding visitor 224 methods. 225 226 Per default the visitor functions for the nodes are ``'visit_'`` + 227 class name of the node. So a `TryFinally` node visit function would 228 be `visit_TryFinally`. This behavior can be changed by overriding 229 the `visit` method. If no visitor function exists for a node 230 (return value `None`) the `generic_visit` visitor is used instead. 231 232 Don't use the `NodeVisitor` if you want to apply changes to nodes during 233 traversing. For this a special visitor exists (`NodeTransformer`) that 234 allows modifications. 235 """ 236 237 def visit(self, node): 238 """Visit a node.""" 239 method = 'visit_' + node.__class__.__name__ 240 visitor = getattr(self, method, self.generic_visit) 241 return visitor(node) 242 243 def generic_visit(self, node): 244 """Called if no explicit visitor function exists for a node.""" 245 for field, value in iter_fields(node): 246 if isinstance(value, list): 247 for item in value: 248 if isinstance(item, AST): 249 self.visit(item) 250 elif isinstance(value, AST): 251 self.visit(value) 252 253 254 class NodeTransformer(NodeVisitor): 255 """ 256 A :class:`NodeVisitor` subclass that walks the abstract syntax tree and 257 allows modification of nodes. 258 259 The `NodeTransformer` will walk the AST and use the return value of the 260 visitor methods to replace or remove the old node. If the return value of 261 the visitor method is ``None``, the node will be removed from its location, 262 otherwise it is replaced with the return value. The return value may be the 263 original node in which case no replacement takes place. 264 265 Here is an example transformer that rewrites all occurrences of name lookups 266 (``foo``) to ``data['foo']``:: 267 268 class RewriteName(NodeTransformer): 269 270 def visit_Name(self, node): 271 return copy_location(Subscript( 272 value=Name(id='data', ctx=Load()), 273 slice=Index(value=Str(s=node.id)), 274 ctx=node.ctx 275 ), node) 276 277 Keep in mind that if the node you're operating on has child nodes you must 278 either transform the child nodes yourself or call the :meth:`generic_visit` 279 method for the node first. 280 281 For nodes that were part of a collection of statements (that applies to all 282 statement nodes), the visitor may also return a list of nodes rather than 283 just a single node. 284 285 Usually you use the transformer like this:: 286 287 node = YourTransformer().visit(node) 288 """ 289 290 def generic_visit(self, node): 291 for field, old_value in iter_fields(node): 292 old_value = getattr(node, field, None) 293 if isinstance(old_value, list): 294 new_values = [] 295 for value in old_value: 296 if isinstance(value, AST): 297 value = self.visit(value) 298 if value is None: 299 continue 300 elif not isinstance(value, AST): 301 new_values.extend(value) 302 continue 303 new_values.append(value) 304 old_value[:] = new_values 305 elif isinstance(old_value, AST): 306 new_node = self.visit(old_value) 307 if new_node is None: 308 delattr(node, field) 309 else: 310 setattr(node, field, new_node) 311 return node 312