Remove Python version in the_basics.md (#3528)

[etc/vim.git] / src / black / linegen.py
diff --git a/src/black/linegen.py b/src/black/linegen.py

index 644824a3c861c34d45ce7befc73a783ea7d6dc2b..bfc28ca006ccc44d72185a2cd355c7e958d31de6 100644 (file)
--- a/src/black/linegen.py
+++ b/src/black/linegen.py
@@ -2,6 +2,7 @@
  Generating lines of code.
  """
  import sys
+from dataclasses import dataclass
  from enum import Enum, auto
  from functools import partial, wraps
  from typing import Collection, Iterator, List, Optional, Set, Union, cast
@@ -24,6 +25,7 @@ from black.lines import (
  from black.mode import Feature, Mode, Preview
  from black.nodes import (
      ASSIGNMENTS,
+    BRACKETS,
      CLOSING_BRACKETS,
      OPENING_BRACKETS,
      RARROW,
@@ -44,6 +46,7 @@ from black.nodes import (
      is_rpar_token,
      is_stub_body,
      is_stub_suite,
+    is_tuple_containing_walrus,
      is_vararg,
      is_walrus_assignment,
      is_yield,
@@ -56,6 +59,7 @@ from black.strings import (
      get_string_prefix,
      normalize_string_prefix,
      normalize_string_quotes,
+    normalize_unicode_escape_sequences,
  )
  from black.trans import (
      CannotTransform,
@@ -87,8 +91,9 @@ class LineGenerator(Visitor[Line]):
      in ways that will no longer stringify to valid Python code on the tree.
      """
  
-    def __init__(self, mode: Mode) -> None:
+    def __init__(self, mode: Mode, features: Collection[Feature]) -> None:
          self.mode = mode
+        self.features = features
          self.current_line: Line
          self.__post_init__()
  
@@ -138,6 +143,22 @@ class LineGenerator(Visitor[Line]):
                  self.current_line.append(node)
          yield from super().visit_default(node)
  
+    def visit_test(self, node: Node) -> Iterator[Line]:
+        """Visit an `x if y else z` test"""
+
+        if Preview.parenthesize_conditional_expressions in self.mode:
+            already_parenthesized = (
+                node.prev_sibling and node.prev_sibling.type == token.LPAR
+            )
+
+            if not already_parenthesized:
+                lpar = Leaf(token.LPAR, "")
+                rpar = Leaf(token.RPAR, "")
+                node.insert_child(0, lpar)
+                node.append_child(rpar)
+
+        yield from self.visit_default(node)
+
      def visit_INDENT(self, node: Leaf) -> Iterator[Line]:
          """Increase indentation level, maybe yield a line."""
          # In blib2to3 INDENT never holds comments.
@@ -172,13 +193,32 @@ class LineGenerator(Visitor[Line]):
          `parens` holds a set of string leaf values immediately after which
          invisible parens should be put.
          """
-        normalize_invisible_parens(node, parens_after=parens, preview=self.mode.preview)
+        normalize_invisible_parens(
+            node, parens_after=parens, mode=self.mode, features=self.features
+        )
          for child in node.children:
              if is_name_token(child) and child.value in keywords:
                  yield from self.line()
  
              yield from self.visit(child)
  
+    def visit_dictsetmaker(self, node: Node) -> Iterator[Line]:
+        if Preview.wrap_long_dict_values_in_parens in self.mode:
+            for i, child in enumerate(node.children):
+                if i == 0:
+                    continue
+                if node.children[i - 1].type == token.COLON:
+                    if child.type == syms.atom and child.children[0].type == token.LPAR:
+                        if maybe_make_parens_invisible_in_atom(
+                            child,
+                            parent=node,
+                            remove_brackets_around_comma=False,
+                        ):
+                            wrap_in_parentheses(node, child, visible=False)
+                    else:
+                        wrap_in_parentheses(node, child, visible=False)
+        yield from self.visit_default(node)
+
      def visit_funcdef(self, node: Node) -> Iterator[Line]:
          """Visit function definition."""
          if Preview.annotation_parens not in self.mode:
@@ -208,7 +248,9 @@ class LineGenerator(Visitor[Line]):
  
      def visit_match_case(self, node: Node) -> Iterator[Line]:
          """Visit either a match or case statement."""
-        normalize_invisible_parens(node, parens_after=set(), preview=self.mode.preview)
+        normalize_invisible_parens(
+            node, parens_after=set(), mode=self.mode, features=self.features
+        )
  
          yield from self.line()
          for child in node.children:
@@ -327,6 +369,9 @@ class LineGenerator(Visitor[Line]):
          yield from self.visit_default(node)
  
      def visit_STRING(self, leaf: Leaf) -> Iterator[Line]:
+        if Preview.hex_codes_in_unicode_sequences in self.mode:
+            normalize_unicode_escape_sequences(leaf)
+
          if is_docstring(leaf) and "\\\n" not in leaf.value:
              # We're ignoring docstrings with backslash newline escapes because changing
              # indentation of those changes the AST representation of the code.
@@ -366,6 +411,7 @@ class LineGenerator(Visitor[Line]):
              else:
                  docstring = docstring.strip()
  
+            has_trailing_backslash = False
              if docstring:
                  # Add some padding if the docstring starts / ends with a quote mark.
                  if docstring[0] == quote_char:
@@ -378,6 +424,7 @@ class LineGenerator(Visitor[Line]):
                          # Odd number of tailing backslashes, add some padding to
                          # avoid escaping the closing string quote.
                          docstring += " "
+                        has_trailing_backslash = True
              elif not docstring_started_empty:
                  docstring = " "
  
@@ -400,6 +447,8 @@ class LineGenerator(Visitor[Line]):
                  if (
                      len(lines) > 1
                      and last_line_length + quote_len > self.mode.line_length
+                    and len(indent) + quote_len <= self.mode.line_length
+                    and not has_trailing_backslash
                  ):
                      leaf.value = prefix + quote + docstring + "\n" + indent + quote
                  else:
@@ -617,6 +666,17 @@ def left_hand_split(line: Line, _features: Collection[Feature] = ()) -> Iterator
              yield result
  
  
+@dataclass
+class _RHSResult:
+    """Intermediate split result from a right hand split."""
+
+    head: Line
+    body: Line
+    tail: Line
+    opening_bracket: Leaf
+    closing_bracket: Leaf
+
+
  def right_hand_split(
      line: Line,
      line_length: int,
@@ -631,6 +691,22 @@ def right_hand_split(
  
      Note: running this function modifies `bracket_depth` on the leaves of `line`.
      """
+    rhs_result = _first_right_hand_split(line, omit=omit)
+    yield from _maybe_split_omitting_optional_parens(
+        rhs_result, line, line_length, features=features, omit=omit
+    )
+
+
+def _first_right_hand_split(
+    line: Line,
+    omit: Collection[LeafID] = (),
+) -> _RHSResult:
+    """Split the line into head, body, tail starting with the last bracket pair.
+
+    Note: this function should not have side effects. It's relied upon by
+    _maybe_split_omitting_optional_parens to get an opinion whether to prefer
+    splitting on the right side of an assignment statement.
+    """
      tail_leaves: List[Leaf] = []
      body_leaves: List[Leaf] = []
      head_leaves: List[Leaf] = []
@@ -666,37 +742,71 @@ def right_hand_split(
          tail_leaves, line, opening_bracket, component=_BracketSplitComponent.tail
      )
      bracket_split_succeeded_or_raise(head, body, tail)
+    return _RHSResult(head, body, tail, opening_bracket, closing_bracket)
+
+
+def _maybe_split_omitting_optional_parens(
+    rhs: _RHSResult,
+    line: Line,
+    line_length: int,
+    features: Collection[Feature] = (),
+    omit: Collection[LeafID] = (),
+) -> Iterator[Line]:
      if (
          Feature.FORCE_OPTIONAL_PARENTHESES not in features
          # the opening bracket is an optional paren
-        and opening_bracket.type == token.LPAR
-        and not opening_bracket.value
+        and rhs.opening_bracket.type == token.LPAR
+        and not rhs.opening_bracket.value
          # the closing bracket is an optional paren
-        and closing_bracket.type == token.RPAR
-        and not closing_bracket.value
+        and rhs.closing_bracket.type == token.RPAR
+        and not rhs.closing_bracket.value
          # it's not an import (optional parens are the only thing we can split on
          # in this case; attempting a split without them is a waste of time)
          and not line.is_import
          # there are no standalone comments in the body
-        and not body.contains_standalone_comments(0)
+        and not rhs.body.contains_standalone_comments(0)
          # and we can actually remove the parens
-        and can_omit_invisible_parens(body, line_length)
+        and can_omit_invisible_parens(rhs.body, line_length)
      ):
-        omit = {id(closing_bracket), *omit}
+        omit = {id(rhs.closing_bracket), *omit}
          try:
-            yield from right_hand_split(line, line_length, features=features, omit=omit)
-            return
+            # The _RHSResult Omitting Optional Parens.
+            rhs_oop = _first_right_hand_split(line, omit=omit)
+            if not (
+                Preview.prefer_splitting_right_hand_side_of_assignments in line.mode
+                # the split is right after `=`
+                and len(rhs.head.leaves) >= 2
+                and rhs.head.leaves[-2].type == token.EQUAL
+                # the left side of assignement contains brackets
+                and any(leaf.type in BRACKETS for leaf in rhs.head.leaves[:-1])
+                # the left side of assignment is short enough (the -1 is for the ending
+                # optional paren)
+                and is_line_short_enough(rhs.head, line_length=line_length - 1)
+                # the left side of assignment won't explode further because of magic
+                # trailing comma
+                and rhs.head.magic_trailing_comma is None
+                # the split by omitting optional parens isn't preferred by some other
+                # reason
+                and not _prefer_split_rhs_oop(rhs_oop, line_length=line_length)
+            ):
+                yield from _maybe_split_omitting_optional_parens(
+                    rhs_oop, line, line_length, features=features, omit=omit
+                )
+                return
  
          except CannotSplit as e:
              if not (
-                can_be_split(body)
-                or is_line_short_enough(body, line_length=line_length)
+                can_be_split(rhs.body)
+                or is_line_short_enough(rhs.body, line_length=line_length)
              ):
                  raise CannotSplit(
                      "Splitting failed, body is still too long and can't be split."
                  ) from e
  
-            elif head.contains_multiline_strings() or tail.contains_multiline_strings():
+            elif (
+                rhs.head.contains_multiline_strings()
+                or rhs.tail.contains_multiline_strings()
+            ):
                  raise CannotSplit(
                      "The current optional pair of parentheses is bound to fail to"
                      " satisfy the splitting algorithm because the head or the tail"
@@ -704,13 +814,42 @@ def right_hand_split(
                      " line."
                  ) from e
  
-    ensure_visible(opening_bracket)
-    ensure_visible(closing_bracket)
-    for result in (head, body, tail):
+    ensure_visible(rhs.opening_bracket)
+    ensure_visible(rhs.closing_bracket)
+    for result in (rhs.head, rhs.body, rhs.tail):
          if result:
              yield result
  
  
+def _prefer_split_rhs_oop(rhs_oop: _RHSResult, line_length: int) -> bool:
+    """
+    Returns whether we should prefer the result from a split omitting optional parens.
+    """
+    has_closing_bracket_after_assign = False
+    for leaf in reversed(rhs_oop.head.leaves):
+        if leaf.type == token.EQUAL:
+            break
+        if leaf.type in CLOSING_BRACKETS:
+            has_closing_bracket_after_assign = True
+            break
+    return (
+        # contains matching brackets after the `=` (done by checking there is a
+        # closing bracket)
+        has_closing_bracket_after_assign
+        or (
+            # the split is actually from inside the optional parens (done by checking
+            # the first line still contains the `=`)
+            any(leaf.type == token.EQUAL for leaf in rhs_oop.head.leaves)
+            # the first line is short enough
+            and is_line_short_enough(rhs_oop.head, line_length=line_length)
+        )
+        # contains unsplittable type ignore
+        or rhs_oop.head.contains_unsplittable_type_ignore()
+        or rhs_oop.body.contains_unsplittable_type_ignore()
+        or rhs_oop.tail.contains_unsplittable_type_ignore()
+    )
+
+
  def bracket_split_succeeded_or_raise(head: Line, body: Line, tail: Line) -> None:
      """Raise :exc:`CannotSplit` if the last left- or right-hand split failed.
  
@@ -960,7 +1099,7 @@ def normalize_prefix(leaf: Leaf, *, inside_brackets: bool) -> None:
  
  
  def normalize_invisible_parens(
-    node: Node, parens_after: Set[str], *, preview: bool
+    node: Node, parens_after: Set[str], *, mode: Mode, features: Collection[Feature]
  ) -> None:
      """Make existing optional parentheses invisible or create new ones.
  
@@ -970,17 +1109,24 @@ def normalize_invisible_parens(
      Standardizes on visible parentheses for single-element tuples, and keeps
      existing visible parentheses for other tuples and generator expressions.
      """
-    for pc in list_comments(node.prefix, is_endmarker=False, preview=preview):
+    for pc in list_comments(node.prefix, is_endmarker=False, preview=mode.preview):
          if pc.value in FMT_OFF:
              # This `node` has a prefix with `# fmt: off`, don't mess with parens.
              return
+
+    # The multiple context managers grammar has a different pattern, thus this is
+    # separate from the for-loop below. This possibly wraps them in invisible parens,
+    # and later will be removed in remove_with_parens when needed.
+    if node.type == syms.with_stmt:
+        _maybe_wrap_cms_in_parens(node, mode, features)
+
      check_lpar = False
      for index, child in enumerate(list(node.children)):
          # Fixes a bug where invisible parens are not properly stripped from
          # assignment statements that contain type annotations.
          if isinstance(child, Node) and child.type == syms.annassign:
              normalize_invisible_parens(
-                child, parens_after=parens_after, preview=preview
+                child, parens_after=parens_after, mode=mode, features=features
              )
  
          # Add parentheses around long tuple unpacking in assignments.
@@ -993,7 +1139,7 @@ def normalize_invisible_parens(
  
          if check_lpar:
              if (
-                preview
+                mode.preview
                  and child.type == syms.atom
                  and node.type == syms.for_stmt
                  and isinstance(child.prev_sibling, Leaf)
@@ -1006,7 +1152,9 @@ def normalize_invisible_parens(
                      remove_brackets_around_comma=True,
                  ):
                      wrap_in_parentheses(node, child, visible=False)
-            elif preview and isinstance(child, Node) and node.type == syms.with_stmt:
+            elif (
+                mode.preview and isinstance(child, Node) and node.type == syms.with_stmt
+            ):
                  remove_with_parens(child, node)
              elif child.type == syms.atom:
                  if maybe_make_parens_invisible_in_atom(
@@ -1017,17 +1165,7 @@ def normalize_invisible_parens(
              elif is_one_tuple(child):
                  wrap_in_parentheses(node, child, visible=True)
              elif node.type == syms.import_from:
-                # "import from" nodes store parentheses directly as part of
-                # the statement
-                if is_lpar_token(child):
-                    assert is_rpar_token(node.children[-1])
-                    # make parentheses invisible
-                    child.value = ""
-                    node.children[-1].value = ""
-                elif child.type != token.STAR:
-                    # insert invisible parentheses
-                    node.insert_child(index, Leaf(token.LPAR, ""))
-                    node.append_child(Leaf(token.RPAR, ""))
+                _normalize_import_from(node, child, index)
                  break
              elif (
                  index == 1
@@ -1042,13 +1180,27 @@ def normalize_invisible_parens(
              elif not (isinstance(child, Leaf) and is_multiline_string(child)):
                  wrap_in_parentheses(node, child, visible=False)
  
-        comma_check = child.type == token.COMMA if preview else False
+        comma_check = child.type == token.COMMA if mode.preview else False
  
          check_lpar = isinstance(child, Leaf) and (
              child.value in parens_after or comma_check
          )
  
  
+def _normalize_import_from(parent: Node, child: LN, index: int) -> None:
+    # "import from" nodes store parentheses directly as part of
+    # the statement
+    if is_lpar_token(child):
+        assert is_rpar_token(parent.children[-1])
+        # make parentheses invisible
+        child.value = ""
+        parent.children[-1].value = ""
+    elif child.type != token.STAR:
+        # insert invisible parentheses
+        parent.insert_child(index, Leaf(token.LPAR, ""))
+        parent.append_child(Leaf(token.RPAR, ""))
+
+
  def remove_await_parens(node: Node) -> None:
      if node.children[0].type == token.AWAIT and len(node.children) > 1:
          if (
@@ -1085,6 +1237,49 @@ def remove_await_parens(node: Node) -> None:
                  remove_await_parens(bracket_contents)
  
  
+def _maybe_wrap_cms_in_parens(
+    node: Node, mode: Mode, features: Collection[Feature]
+) -> None:
+    """When enabled and safe, wrap the multiple context managers in invisible parens.
+
+    It is only safe when `features` contain Feature.PARENTHESIZED_CONTEXT_MANAGERS.
+    """
+    if (
+        Feature.PARENTHESIZED_CONTEXT_MANAGERS not in features
+        or Preview.wrap_multiple_context_managers_in_parens not in mode
+        or len(node.children) <= 2
+        # If it's an atom, it's already wrapped in parens.
+        or node.children[1].type == syms.atom
+    ):
+        return
+    colon_index: Optional[int] = None
+    for i in range(2, len(node.children)):
+        if node.children[i].type == token.COLON:
+            colon_index = i
+            break
+    if colon_index is not None:
+        lpar = Leaf(token.LPAR, "")
+        rpar = Leaf(token.RPAR, "")
+        context_managers = node.children[1:colon_index]
+        for child in context_managers:
+            child.remove()
+        # After wrapping, the with_stmt will look like this:
+        #   with_stmt
+        #     NAME 'with'
+        #     atom
+        #       LPAR ''
+        #       testlist_gexp
+        #         ... <-- context_managers
+        #       /testlist_gexp
+        #       RPAR ''
+        #     /atom
+        #     COLON ':'
+        new_child = Node(
+            syms.atom, [lpar, Node(syms.testlist_gexp, context_managers), rpar]
+        )
+        node.insert_child(1, new_child)
+
+
  def remove_with_parens(node: Node, parent: Node) -> None:
      """Recursively hide optional parens in `with` statements."""
      # Removing all unnecessary parentheses in with statements in one pass is a tad
@@ -1150,6 +1345,7 @@ def maybe_make_parens_invisible_in_atom(
              not remove_brackets_around_comma
              and max_delimiter_priority_in_atom(node) >= COMMA_PRIORITY
          )
+        or is_tuple_containing_walrus(node)
      ):
          return False
  
@@ -1159,9 +1355,13 @@ def maybe_make_parens_invisible_in_atom(
              syms.expr_stmt,
              syms.assert_stmt,
              syms.return_stmt,
+            syms.except_clause,
+            syms.funcdef,
+            syms.with_stmt,
              # these ones aren't useful to end users, but they do please fuzzers
              syms.for_stmt,
              syms.del_stmt,
+            syms.for_stmt,
          ]:
              return False
  
@@ -1308,8 +1508,10 @@ def run_transformer(
  
          result.extend(transform_line(transformed_line, mode=mode, features=features))
  
+    features_set = set(features)
      if (
-        transform.__class__.__name__ != "rhs"
+        Feature.FORCE_OPTIONAL_PARENTHESES in features_set
+        or transform.__class__.__name__ != "rhs"
          or not line.bracket_tracker.invisible
          or any(bracket.value for bracket in line.bracket_tracker.invisible)
          or line.contains_multiline_strings()
@@ -1326,7 +1528,7 @@ def run_transformer(
  
      line_copy = line.clone()
      append_leaves(line_copy, line, line.leaves)
-    features_fop = set(features) | {Feature.FORCE_OPTIONAL_PARENTHESES}
+    features_fop = features_set | {Feature.FORCE_OPTIONAL_PARENTHESES}
      second_opinion = run_transformer(
          line_copy, transform, mode, features_fop, line_str=line_str
      )