1 """Utility functions, node construction macros, etc."""
2 # Author: Collin Winter
5 from .pgen2
import token
6 from .pytree
import Leaf
, Node
7 from .pygram
import python_symbols
as syms
11 ###########################################################
12 ### Common node-construction "macros"
13 ###########################################################
15 def KeywordArg(keyword
, value
):
16 return Node(syms
.argument
,
17 [keyword
, Leaf(token
.EQUAL
, u
'='), value
])
20 return Leaf(token
.LPAR
, u
"(")
23 return Leaf(token
.RPAR
, u
")")
25 def Assign(target
, source
):
26 """Build an assignment statement"""
27 if not isinstance(target
, list):
29 if not isinstance(source
, list):
33 return Node(syms
.atom
,
34 target
+ [Leaf(token
.EQUAL
, u
"=", prefix
=u
" ")] + source
)
36 def Name(name
, prefix
=None):
37 """Return a NAME leaf"""
38 return Leaf(token
.NAME
, name
, prefix
=prefix
)
41 """A node tuple for obj.attr"""
42 return [obj
, Node(syms
.trailer
, [Dot(), attr
])]
46 return Leaf(token
.COMMA
, u
",")
49 """A period (.) leaf"""
50 return Leaf(token
.DOT
, u
".")
52 def ArgList(args
, lparen
=LParen(), rparen
=RParen()):
53 """A parenthesised argument list, used by Call()"""
54 node
= Node(syms
.trailer
, [lparen
.clone(), rparen
.clone()])
56 node
.insert_child(1, Node(syms
.arglist
, args
))
59 def Call(func_name
, args
=None, prefix
=None):
61 node
= Node(syms
.power
, [func_name
, ArgList(args
)])
62 if prefix
is not None:
67 """A newline literal"""
68 return Leaf(token
.NEWLINE
, u
"\n")
72 return Leaf(token
.NEWLINE
, u
"")
74 def Number(n
, prefix
=None):
75 return Leaf(token
.NUMBER
, n
, prefix
=prefix
)
77 def Subscript(index_node
):
78 """A numeric or string subscript"""
79 return Node(syms
.trailer
, [Leaf(token
.LBRACE
, u
'['),
81 Leaf(token
.RBRACE
, u
']')])
83 def String(string
, prefix
=None):
85 return Leaf(token
.STRING
, string
, prefix
=prefix
)
87 def ListComp(xp
, fp
, it
, test
=None):
88 """A list comprehension of the form [xp for fp in it if test].
90 If test is None, the "if test" part is omitted.
95 for_leaf
= Leaf(token
.NAME
, u
"for")
96 for_leaf
.prefix
= u
" "
97 in_leaf
= Leaf(token
.NAME
, u
"in")
99 inner_args
= [for_leaf
, fp
, in_leaf
, it
]
102 if_leaf
= Leaf(token
.NAME
, u
"if")
103 if_leaf
.prefix
= u
" "
104 inner_args
.append(Node(syms
.comp_if
, [if_leaf
, test
]))
105 inner
= Node(syms
.listmaker
, [xp
, Node(syms
.comp_for
, inner_args
)])
106 return Node(syms
.atom
,
107 [Leaf(token
.LBRACE
, u
"["),
109 Leaf(token
.RBRACE
, u
"]")])
111 def FromImport(package_name
, name_leafs
):
112 """ Return an import statement in the form:
113 from package import name_leafs"""
114 # XXX: May not handle dotted imports properly (eg, package_name='foo.bar')
115 #assert package_name == '.' or '.' not in package_name, "FromImport has "\
116 # "not been tested with dotted package names -- use at your own "\
119 for leaf
in name_leafs
:
120 # Pull the leaves out of their old tree
123 children
= [Leaf(token
.NAME
, u
'from'),
124 Leaf(token
.NAME
, package_name
, prefix
=u
" "),
125 Leaf(token
.NAME
, u
'import', prefix
=u
" "),
126 Node(syms
.import_as_names
, name_leafs
)]
127 imp
= Node(syms
.import_from
, children
)
131 ###########################################################
132 ### Determine whether a node represents a given literal
133 ###########################################################
136 """Does the node represent a tuple literal?"""
137 if isinstance(node
, Node
) and node
.children
== [LParen(), RParen()]:
139 return (isinstance(node
, Node
)
140 and len(node
.children
) == 3
141 and isinstance(node
.children
[0], Leaf
)
142 and isinstance(node
.children
[1], Node
)
143 and isinstance(node
.children
[2], Leaf
)
144 and node
.children
[0].value
== u
"("
145 and node
.children
[2].value
== u
")")
148 """Does the node represent a list literal?"""
149 return (isinstance(node
, Node
)
150 and len(node
.children
) > 1
151 and isinstance(node
.children
[0], Leaf
)
152 and isinstance(node
.children
[-1], Leaf
)
153 and node
.children
[0].value
== u
"["
154 and node
.children
[-1].value
== u
"]")
157 ###########################################################
159 ###########################################################
161 def parenthesize(node
):
162 return Node(syms
.atom
, [LParen(), node
, RParen()])
165 consuming_calls
= set(["sorted", "list", "set", "any", "all", "tuple", "sum",
168 def attr_chain(obj
, attr
):
169 """Follow an attribute chain.
171 If you have a chain of objects where a.foo -> b, b.foo-> c, etc,
172 use this to iterate over all objects in the chain. Iteration is
173 terminated by getattr(x, attr) is None.
176 obj: the starting object
177 attr: the name of the chaining attribute
180 Each successive object in the chain.
182 next
= getattr(obj
, attr
)
185 next
= getattr(next
, attr
)
187 p0
= """for_stmt< 'for' any 'in' node=any ':' any* >
188 | comp_for< 'for' any 'in' node=any any* >
192 ( 'iter' | 'list' | 'tuple' | 'sorted' | 'set' | 'sum' |
193 'any' | 'all' | (any* trailer< '.' 'join' >) )
194 trailer< '(' node=any ')' >
201 trailer< '(' arglist<node=any any*> ')' >
206 def in_special_context(node
):
207 """ Returns true if node is in an environment where all that is required
208 of it is being itterable (ie, it doesn't matter if it returns a list
210 See test_map_nochange in test_fixers.py for some examples and tests.
212 global p0
, p1
, p2
, pats_built
214 p1
= patcomp
.compile_pattern(p1
)
215 p0
= patcomp
.compile_pattern(p0
)
216 p2
= patcomp
.compile_pattern(p2
)
218 patterns
= [p0
, p1
, p2
]
219 for pattern
, parent
in zip(patterns
, attr_chain(node
, "parent")):
221 if pattern
.match(parent
, results
) and results
["node"] is node
:
225 def is_probably_builtin(node
):
227 Check that something isn't an attribute or function name etc.
229 prev
= node
.prev_sibling
230 if prev
is not None and prev
.type == token
.DOT
:
234 if parent
.type in (syms
.funcdef
, syms
.classdef
):
236 if parent
.type == syms
.expr_stmt
and parent
.children
[0] is node
:
239 if parent
.type == syms
.parameters
or \
240 (parent
.type == syms
.typedargslist
and (
241 (prev
is not None and prev
.type == token
.COMMA
) or
242 parent
.children
[0] is node
244 # The name of an argument.
248 ###########################################################
249 ### The following functions are to find bindings in a suite
250 ###########################################################
252 def make_suite(node
):
253 if node
.type == syms
.suite
:
256 parent
, node
.parent
= node
.parent
, None
257 suite
= Node(syms
.suite
, [node
])
258 suite
.parent
= parent
262 """Find the top level namespace."""
263 # Scamper up to the top level namespace
264 while node
.type != syms
.file_input
:
265 assert node
.parent
, "Tree is insane! root found before "\
266 "file_input node was found."
270 def does_tree_import(package
, name
, node
):
271 """ Returns true if name is imported from package at the
272 top level of the tree which node belongs to.
273 To cover the case of an import like 'import foo', use
274 None for the package and 'foo' for the name. """
275 binding
= find_binding(name
, find_root(node
), package
)
279 """Returns true if the node is an import statement."""
280 return node
.type in (syms
.import_name
, syms
.import_from
)
282 def touch_import(package
, name
, node
):
283 """ Works like `does_tree_import` but adds an import statement
284 if it was not imported. """
285 def is_import_stmt(node
):
286 return node
.type == syms
.simple_stmt
and node
.children
and \
287 is_import(node
.children
[0])
289 root
= find_root(node
)
291 if does_tree_import(package
, name
, root
):
294 add_newline_before
= False
296 # figure out where to insert the new import. First try to find
297 # the first import and then skip to the last one.
298 insert_pos
= offset
= 0
299 for idx
, node
in enumerate(root
.children
):
300 if not is_import_stmt(node
):
302 for offset
, node2
in enumerate(root
.children
[idx
:]):
303 if not is_import_stmt(node2
):
305 insert_pos
= idx
+ offset
308 # if there are no imports where we can insert, find the docstring.
309 # if that also fails, we stick to the beginning of the file
311 for idx
, node
in enumerate(root
.children
):
312 if node
.type == syms
.simple_stmt
and node
.children
and \
313 node
.children
[0].type == token
.STRING
:
319 import_
= Node(syms
.import_name
, [
320 Leaf(token
.NAME
, u
'import'),
321 Leaf(token
.NAME
, name
, prefix
=u
' ')
324 import_
= FromImport(package
, [Leaf(token
.NAME
, name
, prefix
=u
' ')])
326 children
= [import_
, Newline()]
327 if add_newline_before
:
328 children
.insert(0, Newline())
329 root
.insert_child(insert_pos
, Node(syms
.simple_stmt
, children
))
332 _def_syms
= set([syms
.classdef
, syms
.funcdef
])
333 def find_binding(name
, node
, package
=None):
334 """ Returns the node which binds variable name, otherwise None.
335 If optional argument package is supplied, only imports will
337 See test cases for examples."""
338 for child
in node
.children
:
340 if child
.type == syms
.for_stmt
:
341 if _find(name
, child
.children
[1]):
343 n
= find_binding(name
, make_suite(child
.children
[-1]), package
)
345 elif child
.type in (syms
.if_stmt
, syms
.while_stmt
):
346 n
= find_binding(name
, make_suite(child
.children
[-1]), package
)
348 elif child
.type == syms
.try_stmt
:
349 n
= find_binding(name
, make_suite(child
.children
[2]), package
)
353 for i
, kid
in enumerate(child
.children
[3:]):
354 if kid
.type == token
.COLON
and kid
.value
== ":":
355 # i+3 is the colon, i+4 is the suite
356 n
= find_binding(name
, make_suite(child
.children
[i
+4]), package
)
358 elif child
.type in _def_syms
and child
.children
[1].value
== name
:
360 elif _is_import_binding(child
, name
, package
):
362 elif child
.type == syms
.simple_stmt
:
363 ret
= find_binding(name
, child
, package
)
364 elif child
.type == syms
.expr_stmt
:
365 if _find(name
, child
.children
[0]):
375 _block_syms
= set([syms
.funcdef
, syms
.classdef
, syms
.trailer
])
376 def _find(name
, node
):
380 if node
.type > 256 and node
.type not in _block_syms
:
381 nodes
.extend(node
.children
)
382 elif node
.type == token
.NAME
and node
.value
== name
:
386 def _is_import_binding(node
, name
, package
=None):
387 """ Will reuturn node if node will import name, or node
388 will import * from package. None is returned otherwise.
389 See test cases for examples. """
391 if node
.type == syms
.import_name
and not package
:
392 imp
= node
.children
[1]
393 if imp
.type == syms
.dotted_as_names
:
394 for child
in imp
.children
:
395 if child
.type == syms
.dotted_as_name
:
396 if child
.children
[2].value
== name
:
398 elif child
.type == token
.NAME
and child
.value
== name
:
400 elif imp
.type == syms
.dotted_as_name
:
401 last
= imp
.children
[-1]
402 if last
.type == token
.NAME
and last
.value
== name
:
404 elif imp
.type == token
.NAME
and imp
.value
== name
:
406 elif node
.type == syms
.import_from
:
407 # unicode(...) is used to make life easier here, because
408 # from a.b import parses to ['import', ['a', '.', 'b'], ...]
409 if package
and unicode(node
.children
[1]).strip() != package
:
412 if package
and _find(u
'as', n
):
413 # See test_from_import_as for explanation
415 elif n
.type == syms
.import_as_names
and _find(name
, n
):
417 elif n
.type == syms
.import_as_name
:
418 child
= n
.children
[2]
419 if child
.type == token
.NAME
and child
.value
== name
:
421 elif n
.type == token
.NAME
and n
.value
== name
:
423 elif package
and n
.type == token
.STAR
: