Coverage for /pythoncovmergedfiles/medio/medio/usr/local/lib/python3.11/site-packages/black/linegen.py: 11%
Shortcuts on this page
r m x toggle line displays
j k next/prev highlighted chunk
0 (zero) top of page
1 (one) first highlighted chunk
Shortcuts on this page
r m x toggle line displays
j k next/prev highlighted chunk
0 (zero) top of page
1 (one) first highlighted chunk
1"""
2Generating lines of code.
3"""
5import re
6import sys
7from collections.abc import Collection, Iterator
8from dataclasses import replace
9from enum import Enum, auto
10from functools import partial, wraps
11from typing import Optional, Union, cast
13from black.brackets import (
14 COMMA_PRIORITY,
15 DOT_PRIORITY,
16 STRING_PRIORITY,
17 get_leaves_inside_matching_brackets,
18 max_delimiter_priority_in_atom,
19)
20from black.comments import FMT_OFF, generate_comments, list_comments
21from black.lines import (
22 Line,
23 RHSResult,
24 append_leaves,
25 can_be_split,
26 can_omit_invisible_parens,
27 is_line_short_enough,
28 line_to_string,
29)
30from black.mode import Feature, Mode, Preview
31from black.nodes import (
32 ASSIGNMENTS,
33 BRACKETS,
34 CLOSING_BRACKETS,
35 OPENING_BRACKETS,
36 STANDALONE_COMMENT,
37 STATEMENT,
38 WHITESPACE,
39 Visitor,
40 ensure_visible,
41 fstring_to_string,
42 get_annotation_type,
43 has_sibling_with_type,
44 is_arith_like,
45 is_async_stmt_or_funcdef,
46 is_atom_with_invisible_parens,
47 is_docstring,
48 is_empty_tuple,
49 is_generator,
50 is_lpar_token,
51 is_multiline_string,
52 is_name_token,
53 is_one_sequence_between,
54 is_one_tuple,
55 is_parent_function_or_class,
56 is_part_of_annotation,
57 is_rpar_token,
58 is_stub_body,
59 is_stub_suite,
60 is_tuple,
61 is_tuple_containing_star,
62 is_tuple_containing_walrus,
63 is_type_ignore_comment_string,
64 is_vararg,
65 is_walrus_assignment,
66 is_yield,
67 syms,
68 wrap_in_parentheses,
69)
70from black.numerics import normalize_numeric_literal
71from black.strings import (
72 fix_multiline_docstring,
73 get_string_prefix,
74 normalize_string_prefix,
75 normalize_string_quotes,
76 normalize_unicode_escape_sequences,
77)
78from black.trans import (
79 CannotTransform,
80 StringMerger,
81 StringParenStripper,
82 StringParenWrapper,
83 StringSplitter,
84 Transformer,
85 hug_power_op,
86)
87from blib2to3.pgen2 import token
88from blib2to3.pytree import Leaf, Node
90# types
91LeafID = int
92LN = Union[Leaf, Node]
95class CannotSplit(CannotTransform):
96 """A readable split that fits the allotted line length is impossible."""
99# This isn't a dataclass because @dataclass + Generic breaks mypyc.
100# See also https://github.com/mypyc/mypyc/issues/827.
101class LineGenerator(Visitor[Line]):
102 """Generates reformatted Line objects. Empty lines are not emitted.
104 Note: destroys the tree it's visiting by mutating prefixes of its leaves
105 in ways that will no longer stringify to valid Python code on the tree.
106 """
108 def __init__(self, mode: Mode, features: Collection[Feature]) -> None:
109 self.mode = mode
110 self.features = features
111 self.current_line: Line
112 self.__post_init__()
114 def line(self, indent: int = 0) -> Iterator[Line]:
115 """Generate a line.
117 If the line is empty, only emit if it makes sense.
118 If the line is too long, split it first and then generate.
120 If any lines were generated, set up a new current_line.
121 """
122 if not self.current_line:
123 self.current_line.depth += indent
124 return # Line is empty, don't emit. Creating a new one unnecessary.
126 if len(self.current_line.leaves) == 1 and is_async_stmt_or_funcdef(
127 self.current_line.leaves[0]
128 ):
129 # Special case for async def/for/with statements. `visit_async_stmt`
130 # adds an `ASYNC` leaf then visits the child def/for/with statement
131 # nodes. Line yields from those nodes shouldn't treat the former
132 # `ASYNC` leaf as a complete line.
133 return
135 complete_line = self.current_line
136 self.current_line = Line(mode=self.mode, depth=complete_line.depth + indent)
137 yield complete_line
139 def visit_default(self, node: LN) -> Iterator[Line]:
140 """Default `visit_*()` implementation. Recurses to children of `node`."""
141 if isinstance(node, Leaf):
142 any_open_brackets = self.current_line.bracket_tracker.any_open_brackets()
143 for comment in generate_comments(node):
144 if any_open_brackets:
145 # any comment within brackets is subject to splitting
146 self.current_line.append(comment)
147 elif comment.type == token.COMMENT:
148 # regular trailing comment
149 self.current_line.append(comment)
150 yield from self.line()
152 else:
153 # regular standalone comment
154 yield from self.line()
156 self.current_line.append(comment)
157 yield from self.line()
159 if any_open_brackets:
160 node.prefix = ""
161 if node.type not in WHITESPACE:
162 self.current_line.append(node)
163 yield from super().visit_default(node)
165 def visit_test(self, node: Node) -> Iterator[Line]:
166 """Visit an `x if y else z` test"""
168 already_parenthesized = (
169 node.prev_sibling and node.prev_sibling.type == token.LPAR
170 )
172 if not already_parenthesized:
173 # Similar to logic in wrap_in_parentheses
174 lpar = Leaf(token.LPAR, "")
175 rpar = Leaf(token.RPAR, "")
176 prefix = node.prefix
177 node.prefix = ""
178 lpar.prefix = prefix
179 node.insert_child(0, lpar)
180 node.append_child(rpar)
182 yield from self.visit_default(node)
184 def visit_INDENT(self, node: Leaf) -> Iterator[Line]:
185 """Increase indentation level, maybe yield a line."""
186 # In blib2to3 INDENT never holds comments.
187 yield from self.line(+1)
188 yield from self.visit_default(node)
190 def visit_DEDENT(self, node: Leaf) -> Iterator[Line]:
191 """Decrease indentation level, maybe yield a line."""
192 # The current line might still wait for trailing comments. At DEDENT time
193 # there won't be any (they would be prefixes on the preceding NEWLINE).
194 # Emit the line then.
195 yield from self.line()
197 # While DEDENT has no value, its prefix may contain standalone comments
198 # that belong to the current indentation level. Get 'em.
199 yield from self.visit_default(node)
201 # Finally, emit the dedent.
202 yield from self.line(-1)
204 def visit_stmt(
205 self, node: Node, keywords: set[str], parens: set[str]
206 ) -> Iterator[Line]:
207 """Visit a statement.
209 This implementation is shared for `if`, `while`, `for`, `try`, `except`,
210 `def`, `with`, `class`, `assert`, and assignments.
212 The relevant Python language `keywords` for a given statement will be
213 NAME leaves within it. This methods puts those on a separate line.
215 `parens` holds a set of string leaf values immediately after which
216 invisible parens should be put.
217 """
218 normalize_invisible_parens(
219 node, parens_after=parens, mode=self.mode, features=self.features
220 )
221 for child in node.children:
222 if is_name_token(child) and child.value in keywords:
223 yield from self.line()
225 yield from self.visit(child)
227 def visit_typeparams(self, node: Node) -> Iterator[Line]:
228 yield from self.visit_default(node)
229 node.children[0].prefix = ""
231 def visit_typevartuple(self, node: Node) -> Iterator[Line]:
232 yield from self.visit_default(node)
233 node.children[1].prefix = ""
235 def visit_paramspec(self, node: Node) -> Iterator[Line]:
236 yield from self.visit_default(node)
237 node.children[1].prefix = ""
239 def visit_dictsetmaker(self, node: Node) -> Iterator[Line]:
240 if Preview.wrap_long_dict_values_in_parens in self.mode:
241 for i, child in enumerate(node.children):
242 if i == 0:
243 continue
244 if node.children[i - 1].type == token.COLON:
245 if (
246 child.type == syms.atom
247 and child.children[0].type in OPENING_BRACKETS
248 and not is_walrus_assignment(child)
249 ):
250 maybe_make_parens_invisible_in_atom(
251 child,
252 parent=node,
253 remove_brackets_around_comma=False,
254 )
255 else:
256 wrap_in_parentheses(node, child, visible=False)
257 yield from self.visit_default(node)
259 def visit_funcdef(self, node: Node) -> Iterator[Line]:
260 """Visit function definition."""
261 yield from self.line()
263 # Remove redundant brackets around return type annotation.
264 is_return_annotation = False
265 for child in node.children:
266 if child.type == token.RARROW:
267 is_return_annotation = True
268 elif is_return_annotation:
269 if child.type == syms.atom and child.children[0].type == token.LPAR:
270 if maybe_make_parens_invisible_in_atom(
271 child,
272 parent=node,
273 remove_brackets_around_comma=False,
274 ):
275 wrap_in_parentheses(node, child, visible=False)
276 else:
277 wrap_in_parentheses(node, child, visible=False)
278 is_return_annotation = False
280 for child in node.children:
281 yield from self.visit(child)
283 def visit_match_case(self, node: Node) -> Iterator[Line]:
284 """Visit either a match or case statement."""
285 normalize_invisible_parens(
286 node, parens_after=set(), mode=self.mode, features=self.features
287 )
289 yield from self.line()
290 for child in node.children:
291 yield from self.visit(child)
293 def visit_suite(self, node: Node) -> Iterator[Line]:
294 """Visit a suite."""
295 if is_stub_suite(node):
296 yield from self.visit(node.children[2])
297 else:
298 yield from self.visit_default(node)
300 def visit_simple_stmt(self, node: Node) -> Iterator[Line]:
301 """Visit a statement without nested statements."""
302 prev_type: Optional[int] = None
303 for child in node.children:
304 if (prev_type is None or prev_type == token.SEMI) and is_arith_like(child):
305 wrap_in_parentheses(node, child, visible=False)
306 prev_type = child.type
308 if node.parent and node.parent.type in STATEMENT:
309 if is_parent_function_or_class(node) and is_stub_body(node):
310 yield from self.visit_default(node)
311 else:
312 yield from self.line(+1)
313 yield from self.visit_default(node)
314 yield from self.line(-1)
316 else:
317 if node.parent and is_stub_suite(node.parent):
318 node.prefix = ""
319 yield from self.visit_default(node)
320 return
321 yield from self.line()
322 yield from self.visit_default(node)
324 def visit_async_stmt(self, node: Node) -> Iterator[Line]:
325 """Visit `async def`, `async for`, `async with`."""
326 yield from self.line()
328 children = iter(node.children)
329 for child in children:
330 yield from self.visit(child)
332 if child.type == token.ASYNC or child.type == STANDALONE_COMMENT:
333 # STANDALONE_COMMENT happens when `# fmt: skip` is applied on the async
334 # line.
335 break
337 internal_stmt = next(children)
338 yield from self.visit(internal_stmt)
340 def visit_decorators(self, node: Node) -> Iterator[Line]:
341 """Visit decorators."""
342 for child in node.children:
343 yield from self.line()
344 yield from self.visit(child)
346 def visit_power(self, node: Node) -> Iterator[Line]:
347 for idx, leaf in enumerate(node.children[:-1]):
348 next_leaf = node.children[idx + 1]
350 if not isinstance(leaf, Leaf):
351 continue
353 value = leaf.value.lower()
354 if (
355 leaf.type == token.NUMBER
356 and next_leaf.type == syms.trailer
357 # Ensure that we are in an attribute trailer
358 and next_leaf.children[0].type == token.DOT
359 # It shouldn't wrap hexadecimal, binary and octal literals
360 and not value.startswith(("0x", "0b", "0o"))
361 # It shouldn't wrap complex literals
362 and "j" not in value
363 ):
364 wrap_in_parentheses(node, leaf)
366 remove_await_parens(node)
368 yield from self.visit_default(node)
370 def visit_SEMI(self, leaf: Leaf) -> Iterator[Line]:
371 """Remove a semicolon and put the other statement on a separate line."""
372 yield from self.line()
374 def visit_ENDMARKER(self, leaf: Leaf) -> Iterator[Line]:
375 """End of file. Process outstanding comments and end with a newline."""
376 yield from self.visit_default(leaf)
377 yield from self.line()
379 def visit_STANDALONE_COMMENT(self, leaf: Leaf) -> Iterator[Line]:
380 if not self.current_line.bracket_tracker.any_open_brackets():
381 yield from self.line()
382 yield from self.visit_default(leaf)
384 def visit_factor(self, node: Node) -> Iterator[Line]:
385 """Force parentheses between a unary op and a binary power:
387 -2 ** 8 -> -(2 ** 8)
388 """
389 _operator, operand = node.children
390 if (
391 operand.type == syms.power
392 and len(operand.children) == 3
393 and operand.children[1].type == token.DOUBLESTAR
394 ):
395 lpar = Leaf(token.LPAR, "(")
396 rpar = Leaf(token.RPAR, ")")
397 index = operand.remove() or 0
398 node.insert_child(index, Node(syms.atom, [lpar, operand, rpar]))
399 yield from self.visit_default(node)
401 def visit_tname(self, node: Node) -> Iterator[Line]:
402 """
403 Add potential parentheses around types in function parameter lists to be made
404 into real parentheses in case the type hint is too long to fit on a line
405 Examples:
406 def foo(a: int, b: float = 7): ...
408 ->
410 def foo(a: (int), b: (float) = 7): ...
411 """
412 assert len(node.children) == 3
413 if maybe_make_parens_invisible_in_atom(node.children[2], parent=node):
414 wrap_in_parentheses(node, node.children[2], visible=False)
416 yield from self.visit_default(node)
418 def visit_STRING(self, leaf: Leaf) -> Iterator[Line]:
419 normalize_unicode_escape_sequences(leaf)
421 if is_docstring(leaf) and not re.search(r"\\\s*\n", leaf.value):
422 # We're ignoring docstrings with backslash newline escapes because changing
423 # indentation of those changes the AST representation of the code.
424 if self.mode.string_normalization:
425 docstring = normalize_string_prefix(leaf.value)
426 # We handle string normalization at the end of this method, but since
427 # what we do right now acts differently depending on quote style (ex.
428 # see padding logic below), there's a possibility for unstable
429 # formatting. To avoid a situation where this function formats a
430 # docstring differently on the second pass, normalize it early.
431 docstring = normalize_string_quotes(docstring)
432 else:
433 docstring = leaf.value
434 prefix = get_string_prefix(docstring)
435 docstring = docstring[len(prefix) :] # Remove the prefix
436 quote_char = docstring[0]
437 # A natural way to remove the outer quotes is to do:
438 # docstring = docstring.strip(quote_char)
439 # but that breaks on """""x""" (which is '""x').
440 # So we actually need to remove the first character and the next two
441 # characters but only if they are the same as the first.
442 quote_len = 1 if docstring[1] != quote_char else 3
443 docstring = docstring[quote_len:-quote_len]
444 docstring_started_empty = not docstring
445 indent = " " * 4 * self.current_line.depth
447 if is_multiline_string(leaf):
448 docstring = fix_multiline_docstring(docstring, indent)
449 else:
450 docstring = docstring.strip()
452 has_trailing_backslash = False
453 if docstring:
454 # Add some padding if the docstring starts / ends with a quote mark.
455 if docstring[0] == quote_char:
456 docstring = " " + docstring
457 if docstring[-1] == quote_char:
458 docstring += " "
459 if docstring[-1] == "\\":
460 backslash_count = len(docstring) - len(docstring.rstrip("\\"))
461 if backslash_count % 2:
462 # Odd number of tailing backslashes, add some padding to
463 # avoid escaping the closing string quote.
464 docstring += " "
465 has_trailing_backslash = True
466 elif not docstring_started_empty:
467 docstring = " "
469 # We could enforce triple quotes at this point.
470 quote = quote_char * quote_len
472 # It's invalid to put closing single-character quotes on a new line.
473 if quote_len == 3:
474 # We need to find the length of the last line of the docstring
475 # to find if we can add the closing quotes to the line without
476 # exceeding the maximum line length.
477 # If docstring is one line, we don't put the closing quotes on a
478 # separate line because it looks ugly (#3320).
479 lines = docstring.splitlines()
480 last_line_length = len(lines[-1]) if docstring else 0
482 # If adding closing quotes would cause the last line to exceed
483 # the maximum line length, and the closing quote is not
484 # prefixed by a newline then put a line break before
485 # the closing quotes
486 if (
487 len(lines) > 1
488 and last_line_length + quote_len > self.mode.line_length
489 and len(indent) + quote_len <= self.mode.line_length
490 and not has_trailing_backslash
491 ):
492 if leaf.value[-1 - quote_len] == "\n":
493 leaf.value = prefix + quote + docstring + quote
494 else:
495 leaf.value = prefix + quote + docstring + "\n" + indent + quote
496 else:
497 leaf.value = prefix + quote + docstring + quote
498 else:
499 leaf.value = prefix + quote + docstring + quote
501 if self.mode.string_normalization and leaf.type == token.STRING:
502 leaf.value = normalize_string_prefix(leaf.value)
503 leaf.value = normalize_string_quotes(leaf.value)
504 yield from self.visit_default(leaf)
506 def visit_NUMBER(self, leaf: Leaf) -> Iterator[Line]:
507 normalize_numeric_literal(leaf)
508 yield from self.visit_default(leaf)
510 def visit_atom(self, node: Node) -> Iterator[Line]:
511 """Visit any atom"""
512 if len(node.children) == 3:
513 first = node.children[0]
514 last = node.children[-1]
515 if (first.type == token.LSQB and last.type == token.RSQB) or (
516 first.type == token.LBRACE and last.type == token.RBRACE
517 ):
518 # Lists or sets of one item
519 maybe_make_parens_invisible_in_atom(node.children[1], parent=node)
521 yield from self.visit_default(node)
523 def visit_fstring(self, node: Node) -> Iterator[Line]:
524 # currently we don't want to format and split f-strings at all.
525 string_leaf = fstring_to_string(node)
526 node.replace(string_leaf)
527 if "\\" in string_leaf.value and any(
528 "\\" in str(child)
529 for child in node.children
530 if child.type == syms.fstring_replacement_field
531 ):
532 # string normalization doesn't account for nested quotes,
533 # causing breakages. skip normalization when nested quotes exist
534 yield from self.visit_default(string_leaf)
535 return
536 yield from self.visit_STRING(string_leaf)
538 # TODO: Uncomment Implementation to format f-string children
539 # fstring_start = node.children[0]
540 # fstring_end = node.children[-1]
541 # assert isinstance(fstring_start, Leaf)
542 # assert isinstance(fstring_end, Leaf)
544 # quote_char = fstring_end.value[0]
545 # quote_idx = fstring_start.value.index(quote_char)
546 # prefix, quote = (
547 # fstring_start.value[:quote_idx],
548 # fstring_start.value[quote_idx:]
549 # )
551 # if not is_docstring(node, self.mode):
552 # prefix = normalize_string_prefix(prefix)
554 # assert quote == fstring_end.value
556 # is_raw_fstring = "r" in prefix or "R" in prefix
557 # middles = [
558 # leaf
559 # for leaf in node.leaves()
560 # if leaf.type == token.FSTRING_MIDDLE
561 # ]
563 # if self.mode.string_normalization:
564 # middles, quote = normalize_fstring_quotes(quote, middles, is_raw_fstring)
566 # fstring_start.value = prefix + quote
567 # fstring_end.value = quote
569 # yield from self.visit_default(node)
571 def __post_init__(self) -> None:
572 """You are in a twisty little maze of passages."""
573 self.current_line = Line(mode=self.mode)
575 v = self.visit_stmt
576 Ø: set[str] = set()
577 self.visit_assert_stmt = partial(v, keywords={"assert"}, parens={"assert", ","})
578 self.visit_if_stmt = partial(
579 v, keywords={"if", "else", "elif"}, parens={"if", "elif"}
580 )
581 self.visit_while_stmt = partial(v, keywords={"while", "else"}, parens={"while"})
582 self.visit_for_stmt = partial(v, keywords={"for", "else"}, parens={"for", "in"})
583 self.visit_try_stmt = partial(
584 v, keywords={"try", "except", "else", "finally"}, parens=Ø
585 )
586 self.visit_except_clause = partial(v, keywords={"except"}, parens={"except"})
587 self.visit_with_stmt = partial(v, keywords={"with"}, parens={"with"})
588 self.visit_classdef = partial(v, keywords={"class"}, parens=Ø)
590 self.visit_expr_stmt = partial(v, keywords=Ø, parens=ASSIGNMENTS)
591 self.visit_return_stmt = partial(v, keywords={"return"}, parens={"return"})
592 self.visit_import_from = partial(v, keywords=Ø, parens={"import"})
593 self.visit_del_stmt = partial(v, keywords=Ø, parens={"del"})
594 self.visit_async_funcdef = self.visit_async_stmt
595 self.visit_decorated = self.visit_decorators
597 # PEP 634
598 self.visit_match_stmt = self.visit_match_case
599 self.visit_case_block = self.visit_match_case
600 self.visit_guard = partial(v, keywords=Ø, parens={"if"})
603def _hugging_power_ops_line_to_string(
604 line: Line,
605 features: Collection[Feature],
606 mode: Mode,
607) -> Optional[str]:
608 try:
609 return line_to_string(next(hug_power_op(line, features, mode)))
610 except CannotTransform:
611 return None
614def transform_line(
615 line: Line, mode: Mode, features: Collection[Feature] = ()
616) -> Iterator[Line]:
617 """Transform a `line`, potentially splitting it into many lines.
619 They should fit in the allotted `line_length` but might not be able to.
621 `features` are syntactical features that may be used in the output.
622 """
623 if line.is_comment:
624 yield line
625 return
627 line_str = line_to_string(line)
629 # We need the line string when power operators are hugging to determine if we should
630 # split the line. Default to line_str, if no power operator are present on the line.
631 line_str_hugging_power_ops = (
632 _hugging_power_ops_line_to_string(line, features, mode) or line_str
633 )
635 ll = mode.line_length
636 sn = mode.string_normalization
637 string_merge = StringMerger(ll, sn)
638 string_paren_strip = StringParenStripper(ll, sn)
639 string_split = StringSplitter(ll, sn)
640 string_paren_wrap = StringParenWrapper(ll, sn)
642 transformers: list[Transformer]
643 if (
644 not line.contains_uncollapsable_type_comments()
645 and not line.should_split_rhs
646 and not line.magic_trailing_comma
647 and (
648 is_line_short_enough(line, mode=mode, line_str=line_str_hugging_power_ops)
649 or line.contains_unsplittable_type_ignore()
650 )
651 and not (line.inside_brackets and line.contains_standalone_comments())
652 and not line.contains_implicit_multiline_string_with_comments()
653 ):
654 # Only apply basic string preprocessing, since lines shouldn't be split here.
655 if Preview.string_processing in mode:
656 transformers = [string_merge, string_paren_strip]
657 else:
658 transformers = []
659 elif line.is_def and not should_split_funcdef_with_rhs(line, mode):
660 transformers = [left_hand_split]
661 else:
663 def _rhs(
664 self: object, line: Line, features: Collection[Feature], mode: Mode
665 ) -> Iterator[Line]:
666 """Wraps calls to `right_hand_split`.
668 The calls increasingly `omit` right-hand trailers (bracket pairs with
669 content), meaning the trailers get glued together to split on another
670 bracket pair instead.
671 """
672 for omit in generate_trailers_to_omit(line, mode.line_length):
673 lines = list(right_hand_split(line, mode, features, omit=omit))
674 # Note: this check is only able to figure out if the first line of the
675 # *current* transformation fits in the line length. This is true only
676 # for simple cases. All others require running more transforms via
677 # `transform_line()`. This check doesn't know if those would succeed.
678 if is_line_short_enough(lines[0], mode=mode):
679 yield from lines
680 return
682 # All splits failed, best effort split with no omits.
683 # This mostly happens to multiline strings that are by definition
684 # reported as not fitting a single line, as well as lines that contain
685 # trailing commas (those have to be exploded).
686 yield from right_hand_split(line, mode, features=features)
688 # HACK: nested functions (like _rhs) compiled by mypyc don't retain their
689 # __name__ attribute which is needed in `run_transformer` further down.
690 # Unfortunately a nested class breaks mypyc too. So a class must be created
691 # via type ... https://github.com/mypyc/mypyc/issues/884
692 rhs = type("rhs", (), {"__call__": _rhs})()
694 if Preview.string_processing in mode:
695 if line.inside_brackets:
696 transformers = [
697 string_merge,
698 string_paren_strip,
699 string_split,
700 delimiter_split,
701 standalone_comment_split,
702 string_paren_wrap,
703 rhs,
704 ]
705 else:
706 transformers = [
707 string_merge,
708 string_paren_strip,
709 string_split,
710 string_paren_wrap,
711 rhs,
712 ]
713 else:
714 if line.inside_brackets:
715 transformers = [delimiter_split, standalone_comment_split, rhs]
716 else:
717 transformers = [rhs]
718 # It's always safe to attempt hugging of power operations and pretty much every line
719 # could match.
720 transformers.append(hug_power_op)
722 for transform in transformers:
723 # We are accumulating lines in `result` because we might want to abort
724 # mission and return the original line in the end, or attempt a different
725 # split altogether.
726 try:
727 result = run_transformer(line, transform, mode, features, line_str=line_str)
728 except CannotTransform:
729 continue
730 else:
731 yield from result
732 break
734 else:
735 yield line
738def should_split_funcdef_with_rhs(line: Line, mode: Mode) -> bool:
739 """If a funcdef has a magic trailing comma in the return type, then we should first
740 split the line with rhs to respect the comma.
741 """
742 return_type_leaves: list[Leaf] = []
743 in_return_type = False
745 for leaf in line.leaves:
746 if leaf.type == token.COLON:
747 in_return_type = False
748 if in_return_type:
749 return_type_leaves.append(leaf)
750 if leaf.type == token.RARROW:
751 in_return_type = True
753 # using `bracket_split_build_line` will mess with whitespace, so we duplicate a
754 # couple lines from it.
755 result = Line(mode=line.mode, depth=line.depth)
756 leaves_to_track = get_leaves_inside_matching_brackets(return_type_leaves)
757 for leaf in return_type_leaves:
758 result.append(
759 leaf,
760 preformatted=True,
761 track_bracket=id(leaf) in leaves_to_track,
762 )
764 # we could also return true if the line is too long, and the return type is longer
765 # than the param list. Or if `should_split_rhs` returns True.
766 return result.magic_trailing_comma is not None
769class _BracketSplitComponent(Enum):
770 head = auto()
771 body = auto()
772 tail = auto()
775def left_hand_split(
776 line: Line, _features: Collection[Feature], mode: Mode
777) -> Iterator[Line]:
778 """Split line into many lines, starting with the first matching bracket pair.
780 Note: this usually looks weird, only use this for function definitions.
781 Prefer RHS otherwise. This is why this function is not symmetrical with
782 :func:`right_hand_split` which also handles optional parentheses.
783 """
784 for leaf_type in [token.LPAR, token.LSQB]:
785 tail_leaves: list[Leaf] = []
786 body_leaves: list[Leaf] = []
787 head_leaves: list[Leaf] = []
788 current_leaves = head_leaves
789 matching_bracket: Optional[Leaf] = None
790 depth = 0
791 for index, leaf in enumerate(line.leaves):
792 if index == 2 and leaf.type == token.LSQB:
793 # A [ at index 2 means this is a type param, so start
794 # tracking the depth
795 depth += 1
796 elif depth > 0:
797 if leaf.type == token.LSQB:
798 depth += 1
799 elif leaf.type == token.RSQB:
800 depth -= 1
801 if (
802 current_leaves is body_leaves
803 and leaf.type in CLOSING_BRACKETS
804 and leaf.opening_bracket is matching_bracket
805 and isinstance(matching_bracket, Leaf)
806 # If the code is still on LPAR and we are inside a type
807 # param, ignore the match since this is searching
808 # for the function arguments
809 and not (leaf_type == token.LPAR and depth > 0)
810 ):
811 ensure_visible(leaf)
812 ensure_visible(matching_bracket)
813 current_leaves = tail_leaves if body_leaves else head_leaves
814 current_leaves.append(leaf)
815 if current_leaves is head_leaves:
816 if leaf.type == leaf_type:
817 matching_bracket = leaf
818 current_leaves = body_leaves
819 if matching_bracket and tail_leaves:
820 break
821 if not matching_bracket or not tail_leaves:
822 raise CannotSplit("No brackets found")
824 head = bracket_split_build_line(
825 head_leaves, line, matching_bracket, component=_BracketSplitComponent.head
826 )
827 body = bracket_split_build_line(
828 body_leaves, line, matching_bracket, component=_BracketSplitComponent.body
829 )
830 tail = bracket_split_build_line(
831 tail_leaves, line, matching_bracket, component=_BracketSplitComponent.tail
832 )
833 bracket_split_succeeded_or_raise(head, body, tail)
834 for result in (head, body, tail):
835 if result:
836 yield result
839def right_hand_split(
840 line: Line,
841 mode: Mode,
842 features: Collection[Feature] = (),
843 omit: Collection[LeafID] = (),
844) -> Iterator[Line]:
845 """Split line into many lines, starting with the last matching bracket pair.
847 If the split was by optional parentheses, attempt splitting without them, too.
848 `omit` is a collection of closing bracket IDs that shouldn't be considered for
849 this split.
851 Note: running this function modifies `bracket_depth` on the leaves of `line`.
852 """
853 rhs_result = _first_right_hand_split(line, omit=omit)
854 yield from _maybe_split_omitting_optional_parens(
855 rhs_result, line, mode, features=features, omit=omit
856 )
859def _first_right_hand_split(
860 line: Line,
861 omit: Collection[LeafID] = (),
862) -> RHSResult:
863 """Split the line into head, body, tail starting with the last bracket pair.
865 Note: this function should not have side effects. It's relied upon by
866 _maybe_split_omitting_optional_parens to get an opinion whether to prefer
867 splitting on the right side of an assignment statement.
868 """
869 tail_leaves: list[Leaf] = []
870 body_leaves: list[Leaf] = []
871 head_leaves: list[Leaf] = []
872 current_leaves = tail_leaves
873 opening_bracket: Optional[Leaf] = None
874 closing_bracket: Optional[Leaf] = None
875 for leaf in reversed(line.leaves):
876 if current_leaves is body_leaves:
877 if leaf is opening_bracket:
878 current_leaves = head_leaves if body_leaves else tail_leaves
879 current_leaves.append(leaf)
880 if current_leaves is tail_leaves:
881 if leaf.type in CLOSING_BRACKETS and id(leaf) not in omit:
882 opening_bracket = leaf.opening_bracket
883 closing_bracket = leaf
884 current_leaves = body_leaves
885 if not (opening_bracket and closing_bracket and head_leaves):
886 # If there is no opening or closing_bracket that means the split failed and
887 # all content is in the tail. Otherwise, if `head_leaves` are empty, it means
888 # the matching `opening_bracket` wasn't available on `line` anymore.
889 raise CannotSplit("No brackets found")
891 tail_leaves.reverse()
892 body_leaves.reverse()
893 head_leaves.reverse()
895 body: Optional[Line] = None
896 if (
897 Preview.hug_parens_with_braces_and_square_brackets in line.mode
898 and tail_leaves[0].value
899 and tail_leaves[0].opening_bracket is head_leaves[-1]
900 ):
901 inner_body_leaves = list(body_leaves)
902 hugged_opening_leaves: list[Leaf] = []
903 hugged_closing_leaves: list[Leaf] = []
904 is_unpacking = body_leaves[0].type in [token.STAR, token.DOUBLESTAR]
905 unpacking_offset: int = 1 if is_unpacking else 0
906 while (
907 len(inner_body_leaves) >= 2 + unpacking_offset
908 and inner_body_leaves[-1].type in CLOSING_BRACKETS
909 and inner_body_leaves[-1].opening_bracket
910 is inner_body_leaves[unpacking_offset]
911 ):
912 if unpacking_offset:
913 hugged_opening_leaves.append(inner_body_leaves.pop(0))
914 unpacking_offset = 0
915 hugged_opening_leaves.append(inner_body_leaves.pop(0))
916 hugged_closing_leaves.insert(0, inner_body_leaves.pop())
918 if hugged_opening_leaves and inner_body_leaves:
919 inner_body = bracket_split_build_line(
920 inner_body_leaves,
921 line,
922 hugged_opening_leaves[-1],
923 component=_BracketSplitComponent.body,
924 )
925 if (
926 line.mode.magic_trailing_comma
927 and inner_body_leaves[-1].type == token.COMMA
928 ):
929 should_hug = True
930 else:
931 line_length = line.mode.line_length - sum(
932 len(str(leaf))
933 for leaf in hugged_opening_leaves + hugged_closing_leaves
934 )
935 if is_line_short_enough(
936 inner_body, mode=replace(line.mode, line_length=line_length)
937 ):
938 # Do not hug if it fits on a single line.
939 should_hug = False
940 else:
941 should_hug = True
942 if should_hug:
943 body_leaves = inner_body_leaves
944 head_leaves.extend(hugged_opening_leaves)
945 tail_leaves = hugged_closing_leaves + tail_leaves
946 body = inner_body # No need to re-calculate the body again later.
948 head = bracket_split_build_line(
949 head_leaves, line, opening_bracket, component=_BracketSplitComponent.head
950 )
951 if body is None:
952 body = bracket_split_build_line(
953 body_leaves, line, opening_bracket, component=_BracketSplitComponent.body
954 )
955 tail = bracket_split_build_line(
956 tail_leaves, line, opening_bracket, component=_BracketSplitComponent.tail
957 )
958 bracket_split_succeeded_or_raise(head, body, tail)
959 return RHSResult(head, body, tail, opening_bracket, closing_bracket)
962def _maybe_split_omitting_optional_parens(
963 rhs: RHSResult,
964 line: Line,
965 mode: Mode,
966 features: Collection[Feature] = (),
967 omit: Collection[LeafID] = (),
968) -> Iterator[Line]:
969 if (
970 Feature.FORCE_OPTIONAL_PARENTHESES not in features
971 # the opening bracket is an optional paren
972 and rhs.opening_bracket.type == token.LPAR
973 and not rhs.opening_bracket.value
974 # the closing bracket is an optional paren
975 and rhs.closing_bracket.type == token.RPAR
976 and not rhs.closing_bracket.value
977 # it's not an import (optional parens are the only thing we can split on
978 # in this case; attempting a split without them is a waste of time)
979 and not line.is_import
980 # and we can actually remove the parens
981 and can_omit_invisible_parens(rhs, mode.line_length)
982 ):
983 omit = {id(rhs.closing_bracket), *omit}
984 try:
985 # The RHSResult Omitting Optional Parens.
986 rhs_oop = _first_right_hand_split(line, omit=omit)
987 if _prefer_split_rhs_oop_over_rhs(rhs_oop, rhs, mode):
988 yield from _maybe_split_omitting_optional_parens(
989 rhs_oop, line, mode, features=features, omit=omit
990 )
991 return
993 except CannotSplit as e:
994 # For chained assignments we want to use the previous successful split
995 if line.is_chained_assignment:
996 pass
998 elif (
999 not can_be_split(rhs.body)
1000 and not is_line_short_enough(rhs.body, mode=mode)
1001 and not (
1002 Preview.wrap_long_dict_values_in_parens
1003 and rhs.opening_bracket.parent
1004 and rhs.opening_bracket.parent.parent
1005 and rhs.opening_bracket.parent.parent.type == syms.dictsetmaker
1006 )
1007 ):
1008 raise CannotSplit(
1009 "Splitting failed, body is still too long and can't be split."
1010 ) from e
1012 elif (
1013 rhs.head.contains_multiline_strings()
1014 or rhs.tail.contains_multiline_strings()
1015 ):
1016 raise CannotSplit(
1017 "The current optional pair of parentheses is bound to fail to"
1018 " satisfy the splitting algorithm because the head or the tail"
1019 " contains multiline strings which by definition never fit one"
1020 " line."
1021 ) from e
1023 ensure_visible(rhs.opening_bracket)
1024 ensure_visible(rhs.closing_bracket)
1025 for result in (rhs.head, rhs.body, rhs.tail):
1026 if result:
1027 yield result
1030def _prefer_split_rhs_oop_over_rhs(
1031 rhs_oop: RHSResult, rhs: RHSResult, mode: Mode
1032) -> bool:
1033 """
1034 Returns whether we should prefer the result from a split omitting optional parens
1035 (rhs_oop) over the original (rhs).
1036 """
1037 # contains unsplittable type ignore
1038 if (
1039 rhs_oop.head.contains_unsplittable_type_ignore()
1040 or rhs_oop.body.contains_unsplittable_type_ignore()
1041 or rhs_oop.tail.contains_unsplittable_type_ignore()
1042 ):
1043 return True
1045 # Retain optional parens around dictionary values
1046 if (
1047 Preview.wrap_long_dict_values_in_parens
1048 and rhs.opening_bracket.parent
1049 and rhs.opening_bracket.parent.parent
1050 and rhs.opening_bracket.parent.parent.type == syms.dictsetmaker
1051 and rhs.body.bracket_tracker.delimiters
1052 ):
1053 # Unless the split is inside the key
1054 return any(leaf.type == token.COLON for leaf in rhs_oop.tail.leaves)
1056 # the split is right after `=`
1057 if not (len(rhs.head.leaves) >= 2 and rhs.head.leaves[-2].type == token.EQUAL):
1058 return True
1060 # the left side of assignment contains brackets
1061 if not any(leaf.type in BRACKETS for leaf in rhs.head.leaves[:-1]):
1062 return True
1064 # the left side of assignment is short enough (the -1 is for the ending optional
1065 # paren)
1066 if not is_line_short_enough(
1067 rhs.head, mode=replace(mode, line_length=mode.line_length - 1)
1068 ):
1069 return True
1071 # the left side of assignment won't explode further because of magic trailing comma
1072 if rhs.head.magic_trailing_comma is not None:
1073 return True
1075 # If we have multiple targets, we prefer more `=`s on the head vs pushing them to
1076 # the body
1077 rhs_head_equal_count = [leaf.type for leaf in rhs.head.leaves].count(token.EQUAL)
1078 rhs_oop_head_equal_count = [leaf.type for leaf in rhs_oop.head.leaves].count(
1079 token.EQUAL
1080 )
1081 if rhs_head_equal_count > 1 and rhs_head_equal_count > rhs_oop_head_equal_count:
1082 return False
1084 has_closing_bracket_after_assign = False
1085 for leaf in reversed(rhs_oop.head.leaves):
1086 if leaf.type == token.EQUAL:
1087 break
1088 if leaf.type in CLOSING_BRACKETS:
1089 has_closing_bracket_after_assign = True
1090 break
1091 return (
1092 # contains matching brackets after the `=` (done by checking there is a
1093 # closing bracket)
1094 has_closing_bracket_after_assign
1095 or (
1096 # the split is actually from inside the optional parens (done by checking
1097 # the first line still contains the `=`)
1098 any(leaf.type == token.EQUAL for leaf in rhs_oop.head.leaves)
1099 # the first line is short enough
1100 and is_line_short_enough(rhs_oop.head, mode=mode)
1101 )
1102 )
1105def bracket_split_succeeded_or_raise(head: Line, body: Line, tail: Line) -> None:
1106 """Raise :exc:`CannotSplit` if the last left- or right-hand split failed.
1108 Do nothing otherwise.
1110 A left- or right-hand split is based on a pair of brackets. Content before
1111 (and including) the opening bracket is left on one line, content inside the
1112 brackets is put on a separate line, and finally content starting with and
1113 following the closing bracket is put on a separate line.
1115 Those are called `head`, `body`, and `tail`, respectively. If the split
1116 produced the same line (all content in `head`) or ended up with an empty `body`
1117 and the `tail` is just the closing bracket, then it's considered failed.
1118 """
1119 tail_len = len(str(tail).strip())
1120 if not body:
1121 if tail_len == 0:
1122 raise CannotSplit("Splitting brackets produced the same line")
1124 elif tail_len < 3:
1125 raise CannotSplit(
1126 f"Splitting brackets on an empty body to save {tail_len} characters is"
1127 " not worth it"
1128 )
1131def _ensure_trailing_comma(
1132 leaves: list[Leaf], original: Line, opening_bracket: Leaf
1133) -> bool:
1134 if not leaves:
1135 return False
1136 # Ensure a trailing comma for imports
1137 if original.is_import:
1138 return True
1139 # ...and standalone function arguments
1140 if not original.is_def:
1141 return False
1142 if opening_bracket.value != "(":
1143 return False
1144 # Don't add commas if we already have any commas
1145 if any(
1146 leaf.type == token.COMMA and not is_part_of_annotation(leaf) for leaf in leaves
1147 ):
1148 return False
1150 # Find a leaf with a parent (comments don't have parents)
1151 leaf_with_parent = next((leaf for leaf in leaves if leaf.parent), None)
1152 if leaf_with_parent is None:
1153 return True
1154 # Don't add commas inside parenthesized return annotations
1155 if get_annotation_type(leaf_with_parent) == "return":
1156 return False
1157 # Don't add commas inside PEP 604 unions
1158 if (
1159 leaf_with_parent.parent
1160 and leaf_with_parent.parent.next_sibling
1161 and leaf_with_parent.parent.next_sibling.type == token.VBAR
1162 ):
1163 return False
1164 return True
1167def bracket_split_build_line(
1168 leaves: list[Leaf],
1169 original: Line,
1170 opening_bracket: Leaf,
1171 *,
1172 component: _BracketSplitComponent,
1173) -> Line:
1174 """Return a new line with given `leaves` and respective comments from `original`.
1176 If it's the head component, brackets will be tracked so trailing commas are
1177 respected.
1179 If it's the body component, the result line is one-indented inside brackets and as
1180 such has its first leaf's prefix normalized and a trailing comma added when
1181 expected.
1182 """
1183 result = Line(mode=original.mode, depth=original.depth)
1184 if component is _BracketSplitComponent.body:
1185 result.inside_brackets = True
1186 result.depth += 1
1187 if _ensure_trailing_comma(leaves, original, opening_bracket):
1188 for i in range(len(leaves) - 1, -1, -1):
1189 if leaves[i].type == STANDALONE_COMMENT:
1190 continue
1192 if leaves[i].type != token.COMMA:
1193 new_comma = Leaf(token.COMMA, ",")
1194 leaves.insert(i + 1, new_comma)
1195 break
1197 leaves_to_track: set[LeafID] = set()
1198 if component is _BracketSplitComponent.head:
1199 leaves_to_track = get_leaves_inside_matching_brackets(leaves)
1200 # Populate the line
1201 for leaf in leaves:
1202 result.append(
1203 leaf,
1204 preformatted=True,
1205 track_bracket=id(leaf) in leaves_to_track,
1206 )
1207 for comment_after in original.comments_after(leaf):
1208 result.append(comment_after, preformatted=True)
1209 if component is _BracketSplitComponent.body and should_split_line(
1210 result, opening_bracket
1211 ):
1212 result.should_split_rhs = True
1213 return result
1216def dont_increase_indentation(split_func: Transformer) -> Transformer:
1217 """Normalize prefix of the first leaf in every line returned by `split_func`.
1219 This is a decorator over relevant split functions.
1220 """
1222 @wraps(split_func)
1223 def split_wrapper(
1224 line: Line, features: Collection[Feature], mode: Mode
1225 ) -> Iterator[Line]:
1226 for split_line in split_func(line, features, mode):
1227 split_line.leaves[0].prefix = ""
1228 yield split_line
1230 return split_wrapper
1233def _get_last_non_comment_leaf(line: Line) -> Optional[int]:
1234 for leaf_idx in range(len(line.leaves) - 1, 0, -1):
1235 if line.leaves[leaf_idx].type != STANDALONE_COMMENT:
1236 return leaf_idx
1237 return None
1240def _can_add_trailing_comma(leaf: Leaf, features: Collection[Feature]) -> bool:
1241 if is_vararg(leaf, within={syms.typedargslist}):
1242 return Feature.TRAILING_COMMA_IN_DEF in features
1243 if is_vararg(leaf, within={syms.arglist, syms.argument}):
1244 return Feature.TRAILING_COMMA_IN_CALL in features
1245 return True
1248def _safe_add_trailing_comma(safe: bool, delimiter_priority: int, line: Line) -> Line:
1249 if (
1250 safe
1251 and delimiter_priority == COMMA_PRIORITY
1252 and line.leaves[-1].type != token.COMMA
1253 and line.leaves[-1].type != STANDALONE_COMMENT
1254 ):
1255 new_comma = Leaf(token.COMMA, ",")
1256 line.append(new_comma)
1257 return line
1260MIGRATE_COMMENT_DELIMITERS = {STRING_PRIORITY, COMMA_PRIORITY}
1263@dont_increase_indentation
1264def delimiter_split(
1265 line: Line, features: Collection[Feature], mode: Mode
1266) -> Iterator[Line]:
1267 """Split according to delimiters of the highest priority.
1269 If the appropriate Features are given, the split will add trailing commas
1270 also in function signatures and calls that contain `*` and `**`.
1271 """
1272 if len(line.leaves) == 0:
1273 raise CannotSplit("Line empty") from None
1274 last_leaf = line.leaves[-1]
1276 bt = line.bracket_tracker
1277 try:
1278 delimiter_priority = bt.max_delimiter_priority(exclude={id(last_leaf)})
1279 except ValueError:
1280 raise CannotSplit("No delimiters found") from None
1282 if (
1283 delimiter_priority == DOT_PRIORITY
1284 and bt.delimiter_count_with_priority(delimiter_priority) == 1
1285 ):
1286 raise CannotSplit("Splitting a single attribute from its owner looks wrong")
1288 current_line = Line(
1289 mode=line.mode, depth=line.depth, inside_brackets=line.inside_brackets
1290 )
1291 lowest_depth = sys.maxsize
1292 trailing_comma_safe = True
1294 def append_to_line(leaf: Leaf) -> Iterator[Line]:
1295 """Append `leaf` to current line or to new line if appending impossible."""
1296 nonlocal current_line
1297 try:
1298 current_line.append_safe(leaf, preformatted=True)
1299 except ValueError:
1300 yield current_line
1302 current_line = Line(
1303 mode=line.mode, depth=line.depth, inside_brackets=line.inside_brackets
1304 )
1305 current_line.append(leaf)
1307 def append_comments(leaf: Leaf) -> Iterator[Line]:
1308 for comment_after in line.comments_after(leaf):
1309 yield from append_to_line(comment_after)
1311 last_non_comment_leaf = _get_last_non_comment_leaf(line)
1312 for leaf_idx, leaf in enumerate(line.leaves):
1313 yield from append_to_line(leaf)
1315 previous_priority = leaf_idx > 0 and bt.delimiters.get(
1316 id(line.leaves[leaf_idx - 1])
1317 )
1318 if (
1319 previous_priority != delimiter_priority
1320 or delimiter_priority in MIGRATE_COMMENT_DELIMITERS
1321 ):
1322 yield from append_comments(leaf)
1324 lowest_depth = min(lowest_depth, leaf.bracket_depth)
1325 if trailing_comma_safe and leaf.bracket_depth == lowest_depth:
1326 trailing_comma_safe = _can_add_trailing_comma(leaf, features)
1328 if last_leaf.type == STANDALONE_COMMENT and leaf_idx == last_non_comment_leaf:
1329 current_line = _safe_add_trailing_comma(
1330 trailing_comma_safe, delimiter_priority, current_line
1331 )
1333 leaf_priority = bt.delimiters.get(id(leaf))
1334 if leaf_priority == delimiter_priority:
1335 if (
1336 leaf_idx + 1 < len(line.leaves)
1337 and delimiter_priority not in MIGRATE_COMMENT_DELIMITERS
1338 ):
1339 yield from append_comments(line.leaves[leaf_idx + 1])
1341 yield current_line
1342 current_line = Line(
1343 mode=line.mode, depth=line.depth, inside_brackets=line.inside_brackets
1344 )
1346 if current_line:
1347 current_line = _safe_add_trailing_comma(
1348 trailing_comma_safe, delimiter_priority, current_line
1349 )
1350 yield current_line
1353@dont_increase_indentation
1354def standalone_comment_split(
1355 line: Line, features: Collection[Feature], mode: Mode
1356) -> Iterator[Line]:
1357 """Split standalone comments from the rest of the line."""
1358 if not line.contains_standalone_comments():
1359 raise CannotSplit("Line does not have any standalone comments")
1361 current_line = Line(
1362 mode=line.mode, depth=line.depth, inside_brackets=line.inside_brackets
1363 )
1365 def append_to_line(leaf: Leaf) -> Iterator[Line]:
1366 """Append `leaf` to current line or to new line if appending impossible."""
1367 nonlocal current_line
1368 try:
1369 current_line.append_safe(leaf, preformatted=True)
1370 except ValueError:
1371 yield current_line
1373 current_line = Line(
1374 line.mode, depth=line.depth, inside_brackets=line.inside_brackets
1375 )
1376 current_line.append(leaf)
1378 for leaf in line.leaves:
1379 yield from append_to_line(leaf)
1381 for comment_after in line.comments_after(leaf):
1382 yield from append_to_line(comment_after)
1384 if current_line:
1385 yield current_line
1388def normalize_invisible_parens( # noqa: C901
1389 node: Node, parens_after: set[str], *, mode: Mode, features: Collection[Feature]
1390) -> None:
1391 """Make existing optional parentheses invisible or create new ones.
1393 `parens_after` is a set of string leaf values immediately after which parens
1394 should be put.
1396 Standardizes on visible parentheses for single-element tuples, and keeps
1397 existing visible parentheses for other tuples and generator expressions.
1398 """
1399 for pc in list_comments(node.prefix, is_endmarker=False):
1400 if pc.value in FMT_OFF:
1401 # This `node` has a prefix with `# fmt: off`, don't mess with parens.
1402 return
1404 # The multiple context managers grammar has a different pattern, thus this is
1405 # separate from the for-loop below. This possibly wraps them in invisible parens,
1406 # and later will be removed in remove_with_parens when needed.
1407 if node.type == syms.with_stmt:
1408 _maybe_wrap_cms_in_parens(node, mode, features)
1410 check_lpar = False
1411 for index, child in enumerate(list(node.children)):
1412 # Fixes a bug where invisible parens are not properly stripped from
1413 # assignment statements that contain type annotations.
1414 if isinstance(child, Node) and child.type == syms.annassign:
1415 normalize_invisible_parens(
1416 child, parens_after=parens_after, mode=mode, features=features
1417 )
1419 # Fixes a bug where invisible parens are not properly wrapped around
1420 # case blocks.
1421 if isinstance(child, Node) and child.type == syms.case_block:
1422 normalize_invisible_parens(
1423 child, parens_after={"case"}, mode=mode, features=features
1424 )
1426 # Add parentheses around if guards in case blocks
1427 if isinstance(child, Node) and child.type == syms.guard:
1428 normalize_invisible_parens(
1429 child, parens_after={"if"}, mode=mode, features=features
1430 )
1432 # Add parentheses around long tuple unpacking in assignments.
1433 if (
1434 index == 0
1435 and isinstance(child, Node)
1436 and child.type == syms.testlist_star_expr
1437 ):
1438 check_lpar = True
1440 if check_lpar:
1441 if (
1442 child.type == syms.atom
1443 and node.type == syms.for_stmt
1444 and isinstance(child.prev_sibling, Leaf)
1445 and child.prev_sibling.type == token.NAME
1446 and child.prev_sibling.value == "for"
1447 ):
1448 if maybe_make_parens_invisible_in_atom(
1449 child,
1450 parent=node,
1451 remove_brackets_around_comma=True,
1452 ):
1453 wrap_in_parentheses(node, child, visible=False)
1454 elif isinstance(child, Node) and node.type == syms.with_stmt:
1455 remove_with_parens(child, node)
1456 elif child.type == syms.atom:
1457 if maybe_make_parens_invisible_in_atom(
1458 child,
1459 parent=node,
1460 ):
1461 wrap_in_parentheses(node, child, visible=False)
1462 elif is_one_tuple(child):
1463 wrap_in_parentheses(node, child, visible=True)
1464 elif node.type == syms.import_from:
1465 _normalize_import_from(node, child, index)
1466 break
1467 elif (
1468 index == 1
1469 and child.type == token.STAR
1470 and node.type == syms.except_clause
1471 ):
1472 # In except* (PEP 654), the star is actually part of
1473 # of the keyword. So we need to skip the insertion of
1474 # invisible parentheses to work more precisely.
1475 continue
1477 elif (
1478 isinstance(child, Leaf)
1479 and child.next_sibling is not None
1480 and child.next_sibling.type == token.COLON
1481 and child.value == "case"
1482 ):
1483 # A special patch for "case case:" scenario, the second occurrence
1484 # of case will be not parsed as a Python keyword.
1485 break
1487 elif not is_multiline_string(child):
1488 wrap_in_parentheses(node, child, visible=False)
1490 comma_check = child.type == token.COMMA
1492 check_lpar = isinstance(child, Leaf) and (
1493 child.value in parens_after or comma_check
1494 )
1497def _normalize_import_from(parent: Node, child: LN, index: int) -> None:
1498 # "import from" nodes store parentheses directly as part of
1499 # the statement
1500 if is_lpar_token(child):
1501 assert is_rpar_token(parent.children[-1])
1502 # make parentheses invisible
1503 child.value = ""
1504 parent.children[-1].value = ""
1505 elif child.type != token.STAR:
1506 # insert invisible parentheses
1507 parent.insert_child(index, Leaf(token.LPAR, ""))
1508 parent.append_child(Leaf(token.RPAR, ""))
1511def remove_await_parens(node: Node) -> None:
1512 if node.children[0].type == token.AWAIT and len(node.children) > 1:
1513 if (
1514 node.children[1].type == syms.atom
1515 and node.children[1].children[0].type == token.LPAR
1516 ):
1517 if maybe_make_parens_invisible_in_atom(
1518 node.children[1],
1519 parent=node,
1520 remove_brackets_around_comma=True,
1521 ):
1522 wrap_in_parentheses(node, node.children[1], visible=False)
1524 # Since await is an expression we shouldn't remove
1525 # brackets in cases where this would change
1526 # the AST due to operator precedence.
1527 # Therefore we only aim to remove brackets around
1528 # power nodes that aren't also await expressions themselves.
1529 # https://peps.python.org/pep-0492/#updated-operator-precedence-table
1530 # N.B. We've still removed any redundant nested brackets though :)
1531 opening_bracket = cast(Leaf, node.children[1].children[0])
1532 closing_bracket = cast(Leaf, node.children[1].children[-1])
1533 bracket_contents = node.children[1].children[1]
1534 if isinstance(bracket_contents, Node) and (
1535 bracket_contents.type != syms.power
1536 or bracket_contents.children[0].type == token.AWAIT
1537 or any(
1538 isinstance(child, Leaf) and child.type == token.DOUBLESTAR
1539 for child in bracket_contents.children
1540 )
1541 ):
1542 ensure_visible(opening_bracket)
1543 ensure_visible(closing_bracket)
1546def _maybe_wrap_cms_in_parens(
1547 node: Node, mode: Mode, features: Collection[Feature]
1548) -> None:
1549 """When enabled and safe, wrap the multiple context managers in invisible parens.
1551 It is only safe when `features` contain Feature.PARENTHESIZED_CONTEXT_MANAGERS.
1552 """
1553 if (
1554 Feature.PARENTHESIZED_CONTEXT_MANAGERS not in features
1555 or len(node.children) <= 2
1556 # If it's an atom, it's already wrapped in parens.
1557 or node.children[1].type == syms.atom
1558 ):
1559 return
1560 colon_index: Optional[int] = None
1561 for i in range(2, len(node.children)):
1562 if node.children[i].type == token.COLON:
1563 colon_index = i
1564 break
1565 if colon_index is not None:
1566 lpar = Leaf(token.LPAR, "")
1567 rpar = Leaf(token.RPAR, "")
1568 context_managers = node.children[1:colon_index]
1569 for child in context_managers:
1570 child.remove()
1571 # After wrapping, the with_stmt will look like this:
1572 # with_stmt
1573 # NAME 'with'
1574 # atom
1575 # LPAR ''
1576 # testlist_gexp
1577 # ... <-- context_managers
1578 # /testlist_gexp
1579 # RPAR ''
1580 # /atom
1581 # COLON ':'
1582 new_child = Node(
1583 syms.atom, [lpar, Node(syms.testlist_gexp, context_managers), rpar]
1584 )
1585 node.insert_child(1, new_child)
1588def remove_with_parens(node: Node, parent: Node) -> None:
1589 """Recursively hide optional parens in `with` statements."""
1590 # Removing all unnecessary parentheses in with statements in one pass is a tad
1591 # complex as different variations of bracketed statements result in pretty
1592 # different parse trees:
1593 #
1594 # with (open("file")) as f: # this is an asexpr_test
1595 # ...
1596 #
1597 # with (open("file") as f): # this is an atom containing an
1598 # ... # asexpr_test
1599 #
1600 # with (open("file")) as f, (open("file")) as f: # this is asexpr_test, COMMA,
1601 # ... # asexpr_test
1602 #
1603 # with (open("file") as f, open("file") as f): # an atom containing a
1604 # ... # testlist_gexp which then
1605 # # contains multiple asexpr_test(s)
1606 if node.type == syms.atom:
1607 if maybe_make_parens_invisible_in_atom(
1608 node,
1609 parent=parent,
1610 remove_brackets_around_comma=True,
1611 ):
1612 wrap_in_parentheses(parent, node, visible=False)
1613 if isinstance(node.children[1], Node):
1614 remove_with_parens(node.children[1], node)
1615 elif node.type == syms.testlist_gexp:
1616 for child in node.children:
1617 if isinstance(child, Node):
1618 remove_with_parens(child, node)
1619 elif node.type == syms.asexpr_test and not any(
1620 leaf.type == token.COLONEQUAL for leaf in node.leaves()
1621 ):
1622 if maybe_make_parens_invisible_in_atom(
1623 node.children[0],
1624 parent=node,
1625 remove_brackets_around_comma=True,
1626 ):
1627 wrap_in_parentheses(node, node.children[0], visible=False)
1630def maybe_make_parens_invisible_in_atom(
1631 node: LN,
1632 parent: LN,
1633 remove_brackets_around_comma: bool = False,
1634) -> bool:
1635 """If it's safe, make the parens in the atom `node` invisible, recursively.
1636 Additionally, remove repeated, adjacent invisible parens from the atom `node`
1637 as they are redundant.
1639 Returns whether the node should itself be wrapped in invisible parentheses.
1640 """
1641 if (
1642 node.type not in (syms.atom, syms.expr)
1643 or is_empty_tuple(node)
1644 or is_one_tuple(node)
1645 or (is_tuple(node) and parent.type == syms.asexpr_test)
1646 or (
1647 is_tuple(node)
1648 and parent.type == syms.with_stmt
1649 and has_sibling_with_type(node, token.COMMA)
1650 )
1651 or (is_yield(node) and parent.type != syms.expr_stmt)
1652 or (
1653 # This condition tries to prevent removing non-optional brackets
1654 # around a tuple, however, can be a bit overzealous so we provide
1655 # and option to skip this check for `for` and `with` statements.
1656 not remove_brackets_around_comma
1657 and max_delimiter_priority_in_atom(node) >= COMMA_PRIORITY
1658 )
1659 or is_tuple_containing_walrus(node)
1660 or is_tuple_containing_star(node)
1661 or is_generator(node)
1662 ):
1663 return False
1665 if is_walrus_assignment(node):
1666 if parent.type in [
1667 syms.annassign,
1668 syms.expr_stmt,
1669 syms.assert_stmt,
1670 syms.return_stmt,
1671 syms.except_clause,
1672 syms.funcdef,
1673 syms.with_stmt,
1674 syms.testlist_gexp,
1675 syms.tname,
1676 # these ones aren't useful to end users, but they do please fuzzers
1677 syms.for_stmt,
1678 syms.del_stmt,
1679 syms.for_stmt,
1680 ]:
1681 return False
1683 first = node.children[0]
1684 last = node.children[-1]
1685 if is_lpar_token(first) and is_rpar_token(last):
1686 middle = node.children[1]
1687 # make parentheses invisible
1688 if (
1689 # If the prefix of `middle` includes a type comment with
1690 # ignore annotation, then we do not remove the parentheses
1691 not is_type_ignore_comment_string(middle.prefix.strip())
1692 ):
1693 first.value = ""
1694 last.value = ""
1695 maybe_make_parens_invisible_in_atom(
1696 middle,
1697 parent=parent,
1698 remove_brackets_around_comma=remove_brackets_around_comma,
1699 )
1701 if is_atom_with_invisible_parens(middle):
1702 # Strip the invisible parens from `middle` by replacing
1703 # it with the child in-between the invisible parens
1704 middle.replace(middle.children[1])
1706 if middle.children[0].prefix.strip():
1707 # Preserve comments before first paren
1708 middle.children[1].prefix = (
1709 middle.children[0].prefix + middle.children[1].prefix
1710 )
1712 if middle.children[-1].prefix.strip():
1713 # Preserve comments before last paren
1714 last.prefix = middle.children[-1].prefix + last.prefix
1716 return False
1718 return True
1721def should_split_line(line: Line, opening_bracket: Leaf) -> bool:
1722 """Should `line` be immediately split with `delimiter_split()` after RHS?"""
1724 if not (opening_bracket.parent and opening_bracket.value in "[{("):
1725 return False
1727 # We're essentially checking if the body is delimited by commas and there's more
1728 # than one of them (we're excluding the trailing comma and if the delimiter priority
1729 # is still commas, that means there's more).
1730 exclude = set()
1731 trailing_comma = False
1732 try:
1733 last_leaf = line.leaves[-1]
1734 if last_leaf.type == token.COMMA:
1735 trailing_comma = True
1736 exclude.add(id(last_leaf))
1737 max_priority = line.bracket_tracker.max_delimiter_priority(exclude=exclude)
1738 except (IndexError, ValueError):
1739 return False
1741 return max_priority == COMMA_PRIORITY and (
1742 (line.mode.magic_trailing_comma and trailing_comma)
1743 # always explode imports
1744 or opening_bracket.parent.type in {syms.atom, syms.import_from}
1745 )
1748def generate_trailers_to_omit(line: Line, line_length: int) -> Iterator[set[LeafID]]:
1749 """Generate sets of closing bracket IDs that should be omitted in a RHS.
1751 Brackets can be omitted if the entire trailer up to and including
1752 a preceding closing bracket fits in one line.
1754 Yielded sets are cumulative (contain results of previous yields, too). First
1755 set is empty, unless the line should explode, in which case bracket pairs until
1756 the one that needs to explode are omitted.
1757 """
1759 omit: set[LeafID] = set()
1760 if not line.magic_trailing_comma:
1761 yield omit
1763 length = 4 * line.depth
1764 opening_bracket: Optional[Leaf] = None
1765 closing_bracket: Optional[Leaf] = None
1766 inner_brackets: set[LeafID] = set()
1767 for index, leaf, leaf_length in line.enumerate_with_length(is_reversed=True):
1768 length += leaf_length
1769 if length > line_length:
1770 break
1772 has_inline_comment = leaf_length > len(leaf.value) + len(leaf.prefix)
1773 if leaf.type == STANDALONE_COMMENT or has_inline_comment:
1774 break
1776 if opening_bracket:
1777 if leaf is opening_bracket:
1778 opening_bracket = None
1779 elif leaf.type in CLOSING_BRACKETS:
1780 prev = line.leaves[index - 1] if index > 0 else None
1781 if (
1782 prev
1783 and prev.type == token.COMMA
1784 and leaf.opening_bracket is not None
1785 and not is_one_sequence_between(
1786 leaf.opening_bracket, leaf, line.leaves
1787 )
1788 ):
1789 # Never omit bracket pairs with trailing commas.
1790 # We need to explode on those.
1791 break
1793 inner_brackets.add(id(leaf))
1794 elif leaf.type in CLOSING_BRACKETS:
1795 prev = line.leaves[index - 1] if index > 0 else None
1796 if prev and prev.type in OPENING_BRACKETS:
1797 # Empty brackets would fail a split so treat them as "inner"
1798 # brackets (e.g. only add them to the `omit` set if another
1799 # pair of brackets was good enough.
1800 inner_brackets.add(id(leaf))
1801 continue
1803 if closing_bracket:
1804 omit.add(id(closing_bracket))
1805 omit.update(inner_brackets)
1806 inner_brackets.clear()
1807 yield omit
1809 if (
1810 prev
1811 and prev.type == token.COMMA
1812 and leaf.opening_bracket is not None
1813 and not is_one_sequence_between(leaf.opening_bracket, leaf, line.leaves)
1814 ):
1815 # Never omit bracket pairs with trailing commas.
1816 # We need to explode on those.
1817 break
1819 if leaf.value:
1820 opening_bracket = leaf.opening_bracket
1821 closing_bracket = leaf
1824def run_transformer(
1825 line: Line,
1826 transform: Transformer,
1827 mode: Mode,
1828 features: Collection[Feature],
1829 *,
1830 line_str: str = "",
1831) -> list[Line]:
1832 if not line_str:
1833 line_str = line_to_string(line)
1834 result: list[Line] = []
1835 for transformed_line in transform(line, features, mode):
1836 if str(transformed_line).strip("\n") == line_str:
1837 raise CannotTransform("Line transformer returned an unchanged result")
1839 result.extend(transform_line(transformed_line, mode=mode, features=features))
1841 features_set = set(features)
1842 if (
1843 Feature.FORCE_OPTIONAL_PARENTHESES in features_set
1844 or transform.__class__.__name__ != "rhs"
1845 or not line.bracket_tracker.invisible
1846 or any(bracket.value for bracket in line.bracket_tracker.invisible)
1847 or line.contains_multiline_strings()
1848 or result[0].contains_uncollapsable_type_comments()
1849 or result[0].contains_unsplittable_type_ignore()
1850 or is_line_short_enough(result[0], mode=mode)
1851 # If any leaves have no parents (which _can_ occur since
1852 # `transform(line)` potentially destroys the line's underlying node
1853 # structure), then we can't proceed. Doing so would cause the below
1854 # call to `append_leaves()` to fail.
1855 or any(leaf.parent is None for leaf in line.leaves)
1856 ):
1857 return result
1859 line_copy = line.clone()
1860 append_leaves(line_copy, line, line.leaves)
1861 features_fop = features_set | {Feature.FORCE_OPTIONAL_PARENTHESES}
1862 second_opinion = run_transformer(
1863 line_copy, transform, mode, features_fop, line_str=line_str
1864 )
1865 if all(is_line_short_enough(ln, mode=mode) for ln in second_opinion):
1866 result = second_opinion
1867 return result