blob: c876b452d6453f569a2a8378171c162077a79d11 [file] [log] [blame]
# -*- coding: utf-8 -*-
"""
    ast
    ~~~

    The `ast` module helps Python applications to process trees of the Python
    abstract syntax grammar.  The abstract syntax itself might change with
    each Python release; this module helps to find out programmatically what
    the current grammar looks like and allows modifications of it.

    An abstract syntax tree can be generated by passing `ast.PyCF_ONLY_AST` as
    a flag to the `compile()` builtin function or by using the `parse()`
    function from this module.  The result will be a tree of objects whose
    classes all inherit from `ast.AST`.

    A modified abstract syntax tree can be compiled into a Python code object
    using the built-in `compile()` function.

    Additionally various helper functions are provided that make working with
    the trees simpler.  The main intention of the helper functions and this
    module in general is to provide an easy to use interface for libraries
    that work tightly with the Python syntax (template engines for example).


    :copyright: Copyright 2008 by Armin Ronacher.
    :license: Python License.
"""
28from _ast import *
29from _ast import __version__
30
31
def parse( source, filename='<unknown>', mode='exec' ):
    """
    Parse the source into an AST node.
    Equivalent to compile(source, filename, mode, PyCF_ONLY_AST).

    :param source: the source handed to `compile()`.
    :param filename: file name handed to `compile()`; defaults to
        ``'<unknown>'``.
    :param mode: compile mode handed to `compile()`; defaults to ``'exec'``.
    :return: the result of `compile()` called with the `PyCF_ONLY_AST` flag.
    """
    return compile( source, filename, mode, PyCF_ONLY_AST )
adminbae64d82013-08-01 10:50:15 -070038
39
def literal_eval( node_or_string ):
    """
    Safely evaluate an expression node or a string containing a Python
    expression.  The string or node provided may only consist of the following
    Python literal structures: strings, numbers, tuples, lists, dicts, booleans,
    and None.

    :param node_or_string: a string (parsed with ``mode='eval'``), an
        `Expression` node (its ``body`` is used), or an expression node.
    :return: the Python value the literal structure denotes.
    :raises ValueError: with the message ``'malformed string'`` when a node
        that is not one of the accepted literal forms is encountered.
    """
    # The only bare names that are accepted; any other Name is rejected.
    _safe_names = { 'None': None, 'True': True, 'False': False }
    if isinstance( node_or_string, basestring ):
        node_or_string = parse( node_or_string, mode='eval' )
    if isinstance( node_or_string, Expression ):
        node_or_string = node_or_string.body

    def _convert( node ):
        # Recursively turn a literal node into the value it denotes.
        if isinstance( node, Str ):
            return node.s
        elif isinstance( node, Num ):
            return node.n
        elif isinstance( node, Tuple ):
            return tuple( map( _convert, node.elts ) )
        elif isinstance( node, List ):
            return list( map( _convert, node.elts ) )
        elif isinstance( node, Dict ):
            return dict( ( _convert( k ), _convert( v ) )
                         for k, v in zip( node.keys, node.values ) )
        elif isinstance( node, Name ):
            if node.id in _safe_names:
                return _safe_names[ node.id ]
            # Unknown names fall through to the ValueError below.
        elif isinstance( node, BinOp ) and \
                isinstance( node.op, ( Add, Sub ) ) and \
                isinstance( node.right, Num ) and \
                isinstance( node.right.n, complex ) and \
                isinstance( node.left, Num ) and \
                isinstance( node.left.n, ( int, long, float ) ):
            # <real number> +/- <complex number>, e.g. ``1+2j``: the only
            # binary operation that is accepted.
            left = node.left.n
            right = node.right.n
            if isinstance( node.op, Add ):
                return left + right
            else:
                return left - right
        raise ValueError( 'malformed string' )
    return _convert( node_or_string )
adminbae64d82013-08-01 10:50:15 -070081
82
def dump( node, annotate_fields=True, include_attributes=False ):
    """
    Return a formatted dump of the tree in *node*.  This is mainly useful for
    debugging purposes.  The returned string will show the names and the values
    for fields.  This makes the code impossible to evaluate, so if evaluation is
    wanted *annotate_fields* must be set to False.  Attributes such as line
    numbers and column offsets are not dumped by default.  If this is wanted,
    *include_attributes* can be set to True.

    :param node: the `AST` node to dump.
    :param annotate_fields: when true, render fields as ``name=value``;
        otherwise render only the values.
    :param include_attributes: when true, also render every name listed in
        ``node._attributes``.
    :return: the formatted string.
    :raises TypeError: if *node* is not an `AST` instance.
    """
    def _format( node ):
        if isinstance( node, AST ):
            fields = [ ( a, _format( b ) ) for a, b in iter_fields( node ) ]
            rv = '%s(%s' % ( node.__class__.__name__, ', '.join(
                ( '%s=%s' % field for field in fields )
                if annotate_fields else
                ( b for a, b in fields )
            ) )
            if include_attributes and node._attributes:
                # Separate attributes from preceding fields with a comma;
                # with no fields a single space is emitted instead.
                rv += ', ' if fields else ' '
                rv += ', '.join( '%s=%s' % ( a, _format( getattr( node, a ) ) )
                                 for a in node._attributes )
            return rv + ')'
        elif isinstance( node, list ):
            return '[%s]' % ', '.join( _format( x ) for x in node )
        # Anything that is neither a node nor a list is shown via repr().
        return repr( node )
    if not isinstance( node, AST ):
        raise TypeError( 'expected AST, got %r' % node.__class__.__name__ )
    return _format( node )
adminbae64d82013-08-01 10:50:15 -0700110
111
def copy_location( new_node, old_node ):
    """
    Copy source location (`lineno` and `col_offset` attributes) from
    *old_node* to *new_node* if possible, and return *new_node*.

    An attribute is copied only when both nodes list it in ``_attributes``
    and *old_node* actually has it set.

    :param new_node: node that receives the location attributes.
    :param old_node: node the location attributes are read from.
    :return: *new_node*.
    """
    for attr in 'lineno', 'col_offset':
        if attr in old_node._attributes and attr in new_node._attributes \
                and hasattr( old_node, attr ):
            setattr( new_node, attr, getattr( old_node, attr ) )
    return new_node
122
123
def fix_missing_locations( node ):
    """
    When you compile a node tree with compile(), the compiler expects lineno and
    col_offset attributes for every node that supports them.  This is rather
    tedious to fill in for generated nodes, so this helper adds these attributes
    recursively where not already set, by setting them to the values of the
    parent node.  It works recursively starting at *node*.

    :param node: root of the tree to fix; modified in place.
    :return: *node*.
    """
    def _fix( node, lineno, col_offset ):
        # For each supported attribute: fill it in from the inherited value
        # when missing, otherwise let the node's own value become the value
        # inherited by its children.
        if 'lineno' in node._attributes:
            if not hasattr( node, 'lineno' ):
                node.lineno = lineno
            else:
                lineno = node.lineno
        if 'col_offset' in node._attributes:
            if not hasattr( node, 'col_offset' ):
                node.col_offset = col_offset
            else:
                col_offset = node.col_offset
        for child in iter_child_nodes( node ):
            _fix( child, lineno, col_offset )
    # The root inherits line 1, column 0.
    _fix( node, 1, 0 )
    return node
147
148
def increment_lineno( node, n=1 ):
    """
    Increment the line number of each node in the tree starting at *node* by *n*.
    This is useful to "move code" to a different location in a file.

    :param node: root of the tree; modified in place.
    :param n: amount added to each line number; defaults to 1.
    :return: *node*.
    """
    for child in walk( node ):
        if 'lineno' in child._attributes:
            # A node that supports `lineno` but has none set counts as 0.
            child.lineno = getattr( child, 'lineno', 0 ) + n
    return node
158
159
def iter_fields( node ):
    """
    Yield a tuple of ``(fieldname, value)`` for each field in ``node._fields``
    that is present on *node*.

    :param node: object exposing a ``_fields`` sequence of attribute names.
    :return: generator of ``(fieldname, value)`` tuples; fields whose
        attribute lookup raises `AttributeError` are skipped.
    """
    for field in node._fields:
        # Only the attribute lookup is guarded, so an AttributeError thrown
        # into the generator at the yield is not silently swallowed.
        try:
            value = getattr( node, field )
        except AttributeError:
            continue
        yield field, value
170
171
def iter_child_nodes( node ):
    """
    Yield all direct child nodes of *node*, that is, all fields that are nodes
    and all items of fields that are lists of nodes.

    :param node: the node whose fields are inspected.
    :return: generator of `AST` instances; non-`AST` field values and
        non-`AST` list items are skipped.
    """
    for name, field in iter_fields( node ):
        if isinstance( field, AST ):
            yield field
        elif isinstance( field, list ):
            for item in field:
                if isinstance( item, AST ):
                    yield item
184
185
def get_docstring( node, clean=True ):
    """
    Return the docstring for the given node or None if no docstring can
    be found.  If the node provided does not have docstrings a TypeError
    will be raised.

    :param node: a `FunctionDef`, `ClassDef` or `Module` node.
    :param clean: when true, the docstring is passed through
        `inspect.cleandoc()` before being returned.
    :return: the docstring, or None when the first statement of the body is
        not a string expression (or the body is empty).
    :raises TypeError: if *node* is not one of the accepted node types.
    """
    if not isinstance( node, ( FunctionDef, ClassDef, Module ) ):
        raise TypeError( "%r can't have docstrings" % node.__class__.__name__ )
    if node.body and isinstance( node.body[ 0 ], Expr ) and \
            isinstance( node.body[ 0 ].value, Str ):
        if clean:
            import inspect
            return inspect.cleandoc( node.body[ 0 ].value.s )
        return node.body[ 0 ].value.s
    return None
adminbae64d82013-08-01 10:50:15 -0700200
201
def walk( node ):
    """
    Recursively yield all descendant nodes in the tree starting at *node*
    (including *node* itself), in no specified order.  This is useful if you
    only want to modify nodes in place and don't care about the context.

    :param node: root of the tree to traverse.
    :return: generator over *node* and every node reachable from it through
        `iter_child_nodes()`.
    """
    from collections import deque
    todo = deque( [ node ] )
    while todo:
        node = todo.popleft()
        # Children are queued before the node is handed out.
        todo.extend( iter_child_nodes( node ) )
        yield node
214
215
class NodeVisitor( object ):
    """
    A node visitor base class that walks the abstract syntax tree and calls a
    visitor function for every node found.  This function may return a value
    which is forwarded by the `visit` method.

    This class is meant to be subclassed, with the subclass adding visitor
    methods.

    Per default the visitor functions for the nodes are ``'visit_'`` +
    class name of the node.  So a `TryFinally` node visit function would
    be `visit_TryFinally`.  This behavior can be changed by overriding
    the `visit` method.  If no visitor function exists for a node
    (return value `None`) the `generic_visit` visitor is used instead.

    Don't use the `NodeVisitor` if you want to apply changes to nodes during
    traversing.  For this a special visitor exists (`NodeTransformer`) that
    allows modifications.
    """

    def visit( self, node ):
        """
        Visit a node.

        Looks up ``visit_<ClassName>`` on this visitor, falls back to
        `generic_visit` when no such attribute exists, and returns whatever
        the chosen visitor returns.
        """
        method = 'visit_' + node.__class__.__name__
        visitor = getattr( self, method, self.generic_visit )
        return visitor( node )

    def generic_visit( self, node ):
        """
        Called if no explicit visitor function exists for a node.

        Visits every `AST` value found directly in a field of *node* or
        inside a list-valued field.  Return values of those visits are
        discarded and nothing is returned.
        """
        for field, value in iter_fields( node ):
            if isinstance( value, list ):
                for item in value:
                    if isinstance( item, AST ):
                        self.visit( item )
            elif isinstance( value, AST ):
                self.visit( value )
adminbae64d82013-08-01 10:50:15 -0700251
252
class NodeTransformer( NodeVisitor ):
    """
    A :class:`NodeVisitor` subclass that walks the abstract syntax tree and
    allows modification of nodes.

    The `NodeTransformer` will walk the AST and use the return value of the
    visitor methods to replace or remove the old node.  If the return value of
    the visitor method is ``None``, the node will be removed from its location,
    otherwise it is replaced with the return value.  The return value may be the
    original node in which case no replacement takes place.

    Here is an example transformer that rewrites all occurrences of name lookups
    (``foo``) to ``data['foo']``::

       class RewriteName(NodeTransformer):

           def visit_Name(self, node):
               return copy_location(Subscript(
                   value=Name(id='data', ctx=Load()),
                   slice=Index(value=Str(s=node.id)),
                   ctx=node.ctx
               ), node)

    Keep in mind that if the node you're operating on has child nodes you must
    either transform the child nodes yourself or call the :meth:`generic_visit`
    method for the node first.

    For nodes that were part of a collection of statements (that applies to all
    statement nodes), the visitor may also return a list of nodes rather than
    just a single node.

    Usually you use the transformer like this::

       node = YourTransformer().visit(node)
    """

    def generic_visit( self, node ):
        """
        Visit every child of *node*, applying the visitors' return values.

        List-valued fields are rewritten in place: a visited item is dropped
        when its visitor returns None, spliced in when the visitor returns a
        non-`AST` value (treated as an iterable of replacements), and
        replaced otherwise.  Non-`AST` list items are kept unchanged.  A
        single `AST` field is deleted when its visitor returns None and
        reassigned otherwise.

        :return: *node*.
        """
        for field, old_value in iter_fields( node ):
            if isinstance( old_value, list ):
                new_values = []
                for value in old_value:
                    if isinstance( value, AST ):
                        value = self.visit( value )
                        if value is None:
                            # Visitor asked for the node to be removed.
                            continue
                        elif not isinstance( value, AST ):
                            # Visitor returned several replacement nodes.
                            new_values.extend( value )
                            continue
                    new_values.append( value )
                # Slice assignment keeps the identity of the field's list.
                old_value[ : ] = new_values
            elif isinstance( old_value, AST ):
                new_node = self.visit( old_value )
                if new_node is None:
                    delattr( node, field )
                else:
                    setattr( node, field, new_node )
        return node
adminbae64d82013-08-01 10:50:15 -0700310 return node