use STARS instead of STAR | DOUBLESTAR

[etc/vim.git] / black.py
diff --git a/black.py b/black.py

index 537ba599807ffea932a223884a40488d22c8ab45..0323f67c257c1cca2a8ac3655171f3b7d74ddecd 100644 (file)
--- a/black.py
+++ b/black.py
@@ -24,6 +24,7 @@ from typing import (
      Iterator,
      List,
      Optional,
+    Pattern,
      Set,
      Tuple,
      Type,
@@ -40,7 +41,7 @@ from blib2to3 import pygram, pytree
  from blib2to3.pgen2 import driver, token
  from blib2to3.pgen2.parse import ParseError
  
-__version__ = "18.4a1"
+__version__ = "18.4a2"
  DEFAULT_LINE_LENGTH = 88
  # types
  syms = pygram.python_symbols
@@ -521,7 +522,20 @@ MATH_OPERATORS = {
      token.DOUBLESTAR,
      token.DOUBLESLASH,
  }
-VARARGS = {token.STAR, token.DOUBLESTAR}
+STARS = {token.STAR, token.DOUBLESTAR}
+VARARGS_PARENTS = {
+    syms.arglist,
+    syms.argument,  # double star in arglist
+    syms.trailer,  # single argument to call
+    syms.typedargslist,
+    syms.varargslist,  # lambdas
+}
+UNPACKING_PARENTS = {
+    syms.atom,  # single element of a list or set literal
+    syms.dictsetmaker,
+    syms.listmaker,
+    syms.testlist_gexp,
+}
  COMPREHENSION_PRIORITY = 20
  COMMA_PRIORITY = 10
  LOGIC_PRIORITY = 5
@@ -1254,18 +1268,8 @@ def whitespace(leaf: Leaf) -> str:  # noqa C901
                      # that, too.
                      return prevp.prefix
  
-        elif prevp.type == token.DOUBLESTAR:
-            if (
-                prevp.parent
-                and prevp.parent.type in {
-                    syms.arglist,
-                    syms.argument,
-                    syms.dictsetmaker,
-                    syms.parameters,
-                    syms.typedargslist,
-                    syms.varargslist,
-                }
-            ):
+        elif prevp.type in STARS:
+            if is_vararg(prevp, within=VARARGS_PARENTS | UNPACKING_PARENTS):
                  return NO
  
          elif prevp.type == token.COLON:
@@ -1274,7 +1278,7 @@ def whitespace(leaf: Leaf) -> str:  # noqa C901
  
          elif (
              prevp.parent
-            and prevp.parent.type in {syms.factor, syms.star_expr}
+            and prevp.parent.type == syms.factor
              and prevp.type in MATH_OPERATORS
          ):
              return NO
@@ -1360,7 +1364,7 @@ def whitespace(leaf: Leaf) -> str:  # noqa C901
              if not prevp or prevp.type == token.LPAR:
                  return NO
  
-        elif prev.type == token.EQUAL or prev.type == token.DOUBLESTAR:
+        elif prev.type in {token.EQUAL} | STARS:
              return NO
  
      elif p.type == syms.decorator:
@@ -1495,11 +1499,7 @@ def is_split_before_delimiter(leaf: Leaf, previous: Leaf = None) -> int:
  
      Higher numbers are higher priority.
      """
-    if (
-        leaf.type in VARARGS
-        and leaf.parent
-        and leaf.parent.type in {syms.argument, syms.typedargslist, syms.dictsetmaker}
-    ):
+    if is_vararg(leaf, within=VARARGS_PARENTS | UNPACKING_PARENTS):
          # * and ** might also be MATH_OPERATORS but in this case they are not.
          # Don't treat them as a delimiter.
          return 0
@@ -1877,8 +1877,7 @@ def delimiter_split(line: Line, py36: bool = False) -> Iterator[Line]:
          lowest_depth = min(lowest_depth, leaf.bracket_depth)
          if (
              leaf.bracket_depth == lowest_depth
-            and leaf.type == token.STAR
-            or leaf.type == token.DOUBLESTAR
+            and is_vararg(leaf, within=VARARGS_PARENTS)
          ):
              trailing_comma_safe = trailing_comma_safe and py36
          leaf_priority = delimiters.get(id(leaf))
@@ -1984,9 +1983,10 @@ def normalize_string_quotes(leaf: Leaf) -> None:
          return  # There's an internal error
  
      prefix = leaf.value[:first_quote_pos]
-    body = leaf.value[first_quote_pos + len(orig_quote):-len(orig_quote)]
      unescaped_new_quote = re.compile(rf"(([^\\]|^)(\\\\)*){new_quote}")
-    escaped_orig_quote = re.compile(rf"\\(\\\\)*{orig_quote}")
+    escaped_new_quote = re.compile(rf"([^\\]|^)\\(\\\\)*{new_quote}")
+    escaped_orig_quote = re.compile(rf"([^\\]|^)\\(\\\\)*{orig_quote}")
+    body = leaf.value[first_quote_pos + len(orig_quote):-len(orig_quote)]
      if "r" in prefix.casefold():
          if unescaped_new_quote.search(body):
              # There's at least one unescaped new_quote in this raw string
@@ -1996,11 +1996,14 @@ def normalize_string_quotes(leaf: Leaf) -> None:
          # Do not introduce or remove backslashes in raw strings
          new_body = body
      else:
-        new_body = escaped_orig_quote.sub(rf"\1{orig_quote}", body)
-        new_body = unescaped_new_quote.sub(rf"\1\\{new_quote}", new_body)
-        # Add escapes again for consecutive occurences of new_quote (sub
-        # doesn't match overlapping substrings).
-        new_body = unescaped_new_quote.sub(rf"\1\\{new_quote}", new_body)
+        # remove unnecessary escapes
+        new_body = sub_twice(escaped_new_quote, rf"\1\2{new_quote}", body)
+        if body != new_body:
+            # Consider the string without unnecessary escapes as the original
+            body = new_body
+            leaf.value = f"{prefix}{orig_quote}{body}{orig_quote}"
+        new_body = sub_twice(escaped_orig_quote, rf"\1\2{orig_quote}", new_body)
+        new_body = sub_twice(unescaped_new_quote, rf"\1\\{new_quote}", new_body)
      if new_quote == '"""' and new_body[-1] == '"':
          # edge case:
          new_body = new_body[:-1] + '\\"'
@@ -2085,6 +2088,29 @@ def is_one_tuple(node: LN) -> bool:
      )
  
  
+def is_vararg(leaf: Leaf, within: Set[NodeType]) -> bool:
+    """Return True if `leaf` is a star or double star in a vararg or kwarg.
+
+    If `within` includes VARARGS_PARENTS, this applies to function signatures.
+    If `within` includes UNPACKING_PARENTS, it applies to right hand-side
+    extended iterable unpacking (PEP 3132) and additional unpacking
+    generalizations (PEP 448).
+    """
+    if leaf.type not in STARS or not leaf.parent:
+        return False
+
+    p = leaf.parent
+    if p.type == syms.star_expr:
+        # Star expressions are also used as assignment targets in extended
+        # iterable unpacking (PEP 3132).  See what its parent is instead.
+        if not p.parent:
+            return False
+
+        p = p.parent
+
+    return p.type in within
+
+
  def max_delimiter_priority_in_atom(node: LN) -> int:
      if node.type != syms.atom:
          return 0
@@ -2139,7 +2165,7 @@ def is_python36(node: Node) -> bool:
              and n.children[-1].type == token.COMMA
          ):
              for ch in n.children:
-                if ch.type == token.STAR or ch.type == token.DOUBLESTAR:
+                if ch.type in STARS:
                      return True
  
      return False
@@ -2325,7 +2351,7 @@ def dump_to_file(*output: str) -> str:
      import tempfile
  
      with tempfile.NamedTemporaryFile(
-        mode="w", prefix="blk_", suffix=".log", delete=False
+        mode="w", prefix="blk_", suffix=".log", delete=False, encoding="utf8"
      ) as f:
          for lines in output:
              f.write(lines)
@@ -2374,5 +2400,14 @@ def shutdown(loop: BaseEventLoop) -> None:
          loop.close()
  
  
+def sub_twice(regex: Pattern[str], replacement: str, original: str) -> str:
+    """Replace `regex` with `replacement` twice on `original`.
+
+    This is used by string normalization to perform replaces on
+    overlapping matches.
+    """
+    return regex.sub(replacement, regex.sub(replacement, original))
+
+
  if __name__ == "__main__":
      main()