Fix trailing comma for function with one arg (#880) (#891)

[etc/vim.git] / black.py
diff --git a/black.py b/black.py

index c8aa30b812b49795c797e0e262159ebda024f67a..8318674a722f41fa70e4dfe95febe839dd93c87e 100644 (file)
--- a/black.py
+++ b/black.py
@@ -16,6 +16,7 @@ import signal
  import sys
  import tempfile
  import tokenize
+import traceback
  from typing import (
      Any,
      Callable,
@@ -48,7 +49,6 @@ from blib2to3 import pygram, pytree
  from blib2to3.pgen2 import driver, token
  from blib2to3.pgen2.grammar import Grammar
  from blib2to3.pgen2.parse import ParseError
-from blib2to3.pgen2.tokenize import TokenizerConfig
  
  
  __version__ = "19.3b0"
@@ -139,18 +139,18 @@ class Feature(Enum):
      TRAILING_COMMA_IN_DEF = 5
      # The following two feature-flags are mutually exclusive, and exactly one should be
      # set for every version of python.
-    ASYNC_IS_VALID_IDENTIFIER = 6
-    ASYNC_IS_RESERVED_KEYWORD = 7
+    ASYNC_IDENTIFIERS = 6
+    ASYNC_KEYWORDS = 7
  
  
  VERSION_TO_FEATURES: Dict[TargetVersion, Set[Feature]] = {
-    TargetVersion.PY27: {Feature.ASYNC_IS_VALID_IDENTIFIER},
-    TargetVersion.PY33: {Feature.UNICODE_LITERALS, Feature.ASYNC_IS_VALID_IDENTIFIER},
-    TargetVersion.PY34: {Feature.UNICODE_LITERALS, Feature.ASYNC_IS_VALID_IDENTIFIER},
+    TargetVersion.PY27: {Feature.ASYNC_IDENTIFIERS},
+    TargetVersion.PY33: {Feature.UNICODE_LITERALS, Feature.ASYNC_IDENTIFIERS},
+    TargetVersion.PY34: {Feature.UNICODE_LITERALS, Feature.ASYNC_IDENTIFIERS},
      TargetVersion.PY35: {
          Feature.UNICODE_LITERALS,
          Feature.TRAILING_COMMA_IN_CALL,
-        Feature.ASYNC_IS_VALID_IDENTIFIER,
+        Feature.ASYNC_IDENTIFIERS,
      },
      TargetVersion.PY36: {
          Feature.UNICODE_LITERALS,
@@ -158,7 +158,7 @@ VERSION_TO_FEATURES: Dict[TargetVersion, Set[Feature]] = {
          Feature.NUMERIC_UNDERSCORES,
          Feature.TRAILING_COMMA_IN_CALL,
          Feature.TRAILING_COMMA_IN_DEF,
-        Feature.ASYNC_IS_VALID_IDENTIFIER,
+        Feature.ASYNC_IDENTIFIERS,
      },
      TargetVersion.PY37: {
          Feature.UNICODE_LITERALS,
@@ -166,7 +166,7 @@ VERSION_TO_FEATURES: Dict[TargetVersion, Set[Feature]] = {
          Feature.NUMERIC_UNDERSCORES,
          Feature.TRAILING_COMMA_IN_CALL,
          Feature.TRAILING_COMMA_IN_DEF,
-        Feature.ASYNC_IS_RESERVED_KEYWORD,
+        Feature.ASYNC_KEYWORDS,
      },
      TargetVersion.PY38: {
          Feature.UNICODE_LITERALS,
@@ -174,7 +174,7 @@ VERSION_TO_FEATURES: Dict[TargetVersion, Set[Feature]] = {
          Feature.NUMERIC_UNDERSCORES,
          Feature.TRAILING_COMMA_IN_CALL,
          Feature.TRAILING_COMMA_IN_DEF,
-        Feature.ASYNC_IS_RESERVED_KEYWORD,
+        Feature.ASYNC_KEYWORDS,
      },
  }
  
@@ -337,7 +337,7 @@ def read_pyproject_toml(
      "--quiet",
      is_flag=True,
      help=(
-        "Don't emit non-error messages to stderr. Errors are still emitted, "
+        "Don't emit non-error messages to stderr. Errors are still emitted; "
          "silence those with 2>/dev/null."
      ),
  )
@@ -458,8 +458,7 @@ def main(
          )
  
      if verbose or not quiet:
-        bang = "💥 💔 💥" if report.return_code else "✨ 🍰 ✨"
-        out(f"All done! {bang}")
+        out("Oh no! 💥 💔 💥" if report.return_code else "All done! ✨ 🍰 ✨")
          click.secho(str(report), err=True)
      ctx.exit(report.return_code)
  
@@ -469,8 +468,7 @@ def reformat_one(
  ) -> None:
      """Reformat a single file under `src` without spawning child processes.
  
-    If `quiet` is True, non-error messages are not output. `line_length`,
-    `write_back`, `fast` and `pyi` options are passed to
+    `fast`, `write_back`, and `mode` options are passed to
      :func:`format_file_in_place` or :func:`format_stdin_to_stdout`.
      """
      try:
@@ -610,7 +608,7 @@ def format_file_in_place(
  
      If `write_back` is DIFF, write a diff to stdout. If it is YES, write reformatted
      code to the file.
-    `line_length` and `fast` options are passed to :func:`format_file_contents`.
+    `mode` and `fast` options are passed to :func:`format_file_contents`.
      """
      if src.suffix == ".pyi":
          mode = evolve(mode, is_pyi=True)
@@ -688,7 +686,7 @@ def format_file_contents(
  
      If `fast` is False, additionally confirm that the reformatted code is
      valid by calling :func:`assert_equivalent` and :func:`assert_stable` on it.
-    `line_length` is passed to :func:`format_str`.
+    `mode` is passed to :func:`format_str`.
      """
      if src_contents.strip() == "":
          raise NothingChanged
@@ -706,10 +704,11 @@ def format_file_contents(
  def format_str(src_contents: str, *, mode: FileMode) -> FileContent:
      """Reformat a string and return new contents.
  
-    `line_length` determines how many characters per line are allowed.
+    `mode` determines formatting options, such as how many characters per line are
+    allowed.
      """
      src_node = lib2to3_parse(src_contents.lstrip(), mode.target_versions)
-    dst_contents = ""
+    dst_contents = []
      future_imports = get_future_imports(src_node)
      if mode.target_versions:
          versions = mode.target_versions
@@ -732,15 +731,15 @@ def format_str(src_contents: str, *, mode: FileMode) -> FileContent:
      }
      for current_line in lines.visit(src_node):
          for _ in range(after):
-            dst_contents += str(empty_line)
+            dst_contents.append(str(empty_line))
          before, after = elt.maybe_empty_lines(current_line)
          for _ in range(before):
-            dst_contents += str(empty_line)
+            dst_contents.append(str(empty_line))
          for line in split_line(
              current_line, line_length=mode.line_length, features=split_line_features
          ):
-            dst_contents += str(line)
-    return dst_contents
+            dst_contents.append(str(line))
+    return "".join(dst_contents)
  
  
  def decode_bytes(src: bytes) -> Tuple[FileContent, Encoding, NewLine]:
@@ -760,62 +759,42 @@ def decode_bytes(src: bytes) -> Tuple[FileContent, Encoding, NewLine]:
          return tiow.read(), encoding, newline
  
  
-@dataclass(frozen=True)
-class ParserConfig:
-    grammar: Grammar
-    tokenizer_config: TokenizerConfig = TokenizerConfig()
-
-
-def get_parser_configs(target_versions: Set[TargetVersion]) -> List[ParserConfig]:
+def get_grammars(target_versions: Set[TargetVersion]) -> List[Grammar]:
      if not target_versions:
          # No target_version specified, so try all grammars.
          return [
              # Python 3.7+
-            ParserConfig(
-                pygram.python_grammar_no_print_statement_no_exec_statement,
-                TokenizerConfig(async_is_reserved_keyword=True),
-            ),
+            pygram.python_grammar_no_print_statement_no_exec_statement_async_keywords,
              # Python 3.0-3.6
-            ParserConfig(
-                pygram.python_grammar_no_print_statement_no_exec_statement,
-                TokenizerConfig(async_is_reserved_keyword=False),
-            ),
+            pygram.python_grammar_no_print_statement_no_exec_statement,
              # Python 2.7 with future print_function import
-            ParserConfig(pygram.python_grammar_no_print_statement),
+            pygram.python_grammar_no_print_statement,
              # Python 2.7
-            ParserConfig(pygram.python_grammar),
+            pygram.python_grammar,
          ]
      elif all(version.is_python2() for version in target_versions):
          # Python 2-only code, so try Python 2 grammars.
          return [
              # Python 2.7 with future print_function import
-            ParserConfig(pygram.python_grammar_no_print_statement),
+            pygram.python_grammar_no_print_statement,
              # Python 2.7
-            ParserConfig(pygram.python_grammar),
+            pygram.python_grammar,
          ]
      else:
          # Python 3-compatible code, so only try Python 3 grammar.
-        configs = []
+        grammars = []
          # If we have to parse both, try to parse async as a keyword first
-        if not supports_feature(target_versions, Feature.ASYNC_IS_VALID_IDENTIFIER):
+        if not supports_feature(target_versions, Feature.ASYNC_IDENTIFIERS):
              # Python 3.7+
-            configs.append(
-                ParserConfig(
-                    pygram.python_grammar_no_print_statement_no_exec_statement,
-                    TokenizerConfig(async_is_reserved_keyword=True),
-                )
+            grammars.append(
+                pygram.python_grammar_no_print_statement_no_exec_statement_async_keywords  # noqa: B950
              )
-        if not supports_feature(target_versions, Feature.ASYNC_IS_RESERVED_KEYWORD):
+        if not supports_feature(target_versions, Feature.ASYNC_KEYWORDS):
              # Python 3.0-3.6
-            configs.append(
-                ParserConfig(
-                    pygram.python_grammar_no_print_statement_no_exec_statement,
-                    TokenizerConfig(async_is_reserved_keyword=False),
-                )
-            )
+            grammars.append(pygram.python_grammar_no_print_statement_no_exec_statement)
          # At least one of the above branches must have been taken, because every Python
-        # version has exactly one of the two 'ASYNC_IS_*' flags
-        return configs
+        # version has exactly one of the two 'ASYNC_*' flags
+        return grammars
  
  
  def lib2to3_parse(src_txt: str, target_versions: Iterable[TargetVersion] = ()) -> Node:
@@ -823,12 +802,8 @@ def lib2to3_parse(src_txt: str, target_versions: Iterable[TargetVersion] = ()) -
      if src_txt[-1:] != "\n":
          src_txt += "\n"
  
-    for parser_config in get_parser_configs(set(target_versions)):
-        drv = driver.Driver(
-            parser_config.grammar,
-            pytree.convert,
-            tokenizer_config=parser_config.tokenizer_config,
-        )
+    for grammar in get_grammars(set(target_versions)):
+        drv = driver.Driver(grammar, pytree.convert)
          try:
              result = drv.parse_string(src_txt, True)
              break
@@ -1086,7 +1061,7 @@ class BracketTracker:
          """Return True if there is an yet unmatched open bracket on the line."""
          return bool(self.bracket_match)
  
-    def max_delimiter_priority(self, exclude: Iterable[LeafID] = ()) -> int:
+    def max_delimiter_priority(self, exclude: Iterable[LeafID] = ()) -> Priority:
          """Return the highest priority of a delimiter found on the line.
  
          Values are consistent with what `is_split_*_delimiter()` return.
@@ -1094,7 +1069,7 @@ class BracketTracker:
          """
          return max(v for k, v in self.delimiters.items() if k not in exclude)
  
-    def delimiter_count_with_priority(self, priority: int = 0) -> int:
+    def delimiter_count_with_priority(self, priority: Priority = 0) -> int:
          """Return the number of delimiters with the given `priority`.
  
          If no `priority` is passed, defaults to max priority on the line.
@@ -1377,7 +1352,10 @@ class Line:
              bracket_depth = leaf.bracket_depth
              if bracket_depth == depth and leaf.type == token.COMMA:
                  commas += 1
-                if leaf.parent and leaf.parent.type == syms.arglist:
+                if leaf.parent and leaf.parent.type in {
+                    syms.arglist,
+                    syms.typedargslist,
+                }:
                      commas += 1
                      break
  
@@ -1627,6 +1605,26 @@ class LineGenerator(Visitor[Line]):
                  self.current_line.append(node)
          yield from super().visit_default(node)
  
+    def visit_atom(self, node: Node) -> Iterator[Line]:
+        # Always make parentheses invisible around a single node, because it should
+        # not be needed (except in the case of yield, where removing the parentheses
+        # produces a SyntaxError).
+        if (
+            len(node.children) == 3
+            and isinstance(node.children[0], Leaf)
+            and node.children[0].type == token.LPAR
+            and isinstance(node.children[2], Leaf)
+            and node.children[2].type == token.RPAR
+            and isinstance(node.children[1], Leaf)
+            and not (
+                node.children[1].type == token.NAME
+                and node.children[1].value == "yield"
+            )
+        ):
+            node.children[0].value = ""
+            node.children[2].value = ""
+        yield from super().visit_default(node)
+
      def visit_INDENT(self, node: Node) -> Iterator[Line]:
          """Increase indentation level, maybe yield a line."""
          # In blib2to3 INDENT never holds comments.
@@ -2040,7 +2038,7 @@ def container_of(leaf: Leaf) -> LN:
      return container
  
  
-def is_split_after_delimiter(leaf: Leaf, previous: Optional[Leaf] = None) -> int:
+def is_split_after_delimiter(leaf: Leaf, previous: Optional[Leaf] = None) -> Priority:
      """Return the priority of the `leaf` delimiter, given a line break after it.
  
      The delimiter priorities returned here are from those delimiters that would
@@ -2054,7 +2052,7 @@ def is_split_after_delimiter(leaf: Leaf, previous: Optional[Leaf] = None) -> int
      return 0
  
  
-def is_split_before_delimiter(leaf: Leaf, previous: Optional[Leaf] = None) -> int:
+def is_split_before_delimiter(leaf: Leaf, previous: Optional[Leaf] = None) -> Priority:
      """Return the priority of the `leaf` delimiter, given a line break before it.
  
      The delimiter priorities returned here are from those delimiters that would
@@ -2493,9 +2491,13 @@ def bracket_split_build_line(
          if leaves:
              # Since body is a new indent level, remove spurious leading whitespace.
              normalize_prefix(leaves[0], inside_brackets=True)
-            # Ensure a trailing comma for imports, but be careful not to add one after
-            # any comments.
-            if original.is_import:
+            # Ensure a trailing comma for imports and standalone function arguments, but
+            # be careful not to add one after any comments.
+            no_commas = original.is_def and not any(
+                l.type == token.COMMA for l in leaves
+            )
+
+            if original.is_import or no_commas:
                  for i in range(len(leaves) - 1, -1, -1):
                      if leaves[i].type == STANDALONE_COMMENT:
                          continue
@@ -2734,7 +2736,15 @@ def normalize_string_quotes(leaf: Leaf) -> None:
          new_body = sub_twice(escaped_orig_quote, rf"\1\2{orig_quote}", new_body)
          new_body = sub_twice(unescaped_new_quote, rf"\1\\{new_quote}", new_body)
      if "f" in prefix.casefold():
-        matches = re.findall(r"[^{]\{(.*?)\}[^}]", new_body)
+        matches = re.findall(
+            r"""
+            (?:[^{]|^)\{  # start of the string or a non-{ followed by a single {
+                ([^{].*?)  # contents of the brackets except if begins with {{
+            \}(?:[^}]|$)  # A } followed by end of the string or a non-}
+            """,
+            new_body,
+            re.VERBOSE,
+        )
          for m in matches:
              if "\\" in str(m):
                  # Do not introduce backslashes in interpolated expressions
@@ -2801,7 +2811,7 @@ def format_float_or_int_string(text: str) -> str:
  def normalize_invisible_parens(node: Node, parens_after: Set[str]) -> None:
      """Make existing optional parentheses invisible or create new ones.
  
-    `parens_after` is a set of string leaf values immeditely after which parens
+    `parens_after` is a set of string leaf values immediately after which parens
      should be put.
  
      Standardizes on visible parentheses for single-element tuples, and keeps
@@ -3079,7 +3089,7 @@ def is_stub_body(node: LN) -> bool:
      )
  
  
-def max_delimiter_priority_in_atom(node: LN) -> int:
+def max_delimiter_priority_in_atom(node: LN) -> Priority:
      """Return maximum delimiter priority inside `node`.
  
      This is specific to atoms with contents contained in a pair of parentheses.
@@ -3452,8 +3462,6 @@ def parse_ast(src: str) -> Union[ast3.AST, ast27.AST]:
  def assert_equivalent(src: str, dst: str) -> None:
      """Raise AssertionError if `src` and `dst` aren't equivalent."""
  
-    import traceback
-
      def _v(node: Union[ast3.AST, ast27.AST], depth: int = 0) -> Iterator[str]:
          """Simple visitor generating strings to compare ASTs by content."""
          yield f"{'  ' * depth}{node.__class__.__name__}("
@@ -3544,8 +3552,6 @@ def assert_stable(src: str, dst: str, mode: FileMode) -> None:
  
  def dump_to_file(*output: str) -> str:
      """Dump `output` to a temporary file. Return path to the file."""
-    import tempfile
-
      with tempfile.NamedTemporaryFile(
          mode="w", prefix="blk_", suffix=".log", delete=False, encoding="utf8"
      ) as f:
@@ -3643,7 +3649,6 @@ def enumerate_with_length(
          if "\n" in leaf.value:
              return  # Multiline strings, we can't continue.
  
-        comment: Optional[Leaf]
          for comment in line.comments_after(leaf):
              length += len(comment.value)