All patches and comments are welcome. Please squash your changes into logical
commits before using git-format-patch and git-send-email to send them to
patches@git.madduck.net.
If you'd read over the Git project's submission guidelines and adhered to them,
I'd be especially grateful.
2 from asyncio.base_events import BaseEventLoop
3 from concurrent.futures import Executor, ProcessPoolExecutor
4 from datetime import datetime
6 from functools import lru_cache, partial, wraps
10 from multiprocessing import Manager, freeze_support
12 from pathlib import Path
39 from appdirs import user_cache_dir
40 from attr import dataclass, evolve, Factory
45 from blib2to3.pytree import Node, Leaf, type_repr
46 from blib2to3 import pygram, pytree
47 from blib2to3.pgen2 import driver, token
48 from blib2to3.pgen2.grammar import Grammar
49 from blib2to3.pgen2.parse import ParseError
52 __version__ = "19.3b0"
53 DEFAULT_LINE_LENGTH = 88
55 r"/(\.eggs|\.git|\.hg|\.mypy_cache|\.nox|\.tox|\.venv|_build|buck-out|build|dist)/"
57 DEFAULT_INCLUDES = r"\.pyi?$"
58 CACHE_DIR = Path(user_cache_dir("black", version=__version__))
70 LN = Union[Leaf, Node]
71 SplitFunc = Callable[["Line", Collection["Feature"]], Iterator["Line"]]
74 CacheInfo = Tuple[Timestamp, FileSize]
75 Cache = Dict[Path, CacheInfo]
76 out = partial(click.secho, bold=True, err=True)
77 err = partial(click.secho, fg="red", err=True)
79 pygram.initialize(CACHE_DIR)
80 syms = pygram.python_symbols
class NothingChanged(UserWarning):
    """Raised when reformatted code is the same as source.

    `format_file_in_place` and `format_stdin_to_stdout` both handle it with
    an `except NothingChanged` clause.
    """
class CannotSplit(Exception):
    """A readable split that fits the allotted line length is impossible."""
class InvalidInput(ValueError):
    """Raised when input source code fails all parse attempts.

    `lib2to3_parse` builds one with a message of the form
    "Cannot parse: <lineno>:<column>: <faulty line>".
    """
95 class WriteBack(Enum):
102 def from_configuration(cls, *, check: bool, diff: bool) -> "WriteBack":
103 if check and not diff:
106 return cls.DIFF if diff else cls.YES
115 class TargetVersion(Enum):
def is_python2(self) -> bool:
    """Return True only when this member is `TargetVersion.PY27`."""
    # Identity comparison: enum members are singletons.
    return self is TargetVersion.PY27
128 PY36_VERSIONS = {TargetVersion.PY36, TargetVersion.PY37, TargetVersion.PY38}
132 # All string literals are unicode
135 NUMERIC_UNDERSCORES = 3
136 TRAILING_COMMA_IN_CALL = 4
137 TRAILING_COMMA_IN_DEF = 5
140 VERSION_TO_FEATURES: Dict[TargetVersion, Set[Feature]] = {
141 TargetVersion.PY27: set(),
142 TargetVersion.PY33: {Feature.UNICODE_LITERALS},
143 TargetVersion.PY34: {Feature.UNICODE_LITERALS},
144 TargetVersion.PY35: {Feature.UNICODE_LITERALS, Feature.TRAILING_COMMA_IN_CALL},
145 TargetVersion.PY36: {
146 Feature.UNICODE_LITERALS,
148 Feature.NUMERIC_UNDERSCORES,
149 Feature.TRAILING_COMMA_IN_CALL,
150 Feature.TRAILING_COMMA_IN_DEF,
152 TargetVersion.PY37: {
153 Feature.UNICODE_LITERALS,
155 Feature.NUMERIC_UNDERSCORES,
156 Feature.TRAILING_COMMA_IN_CALL,
157 Feature.TRAILING_COMMA_IN_DEF,
159 TargetVersion.PY38: {
160 Feature.UNICODE_LITERALS,
162 Feature.NUMERIC_UNDERSCORES,
163 Feature.TRAILING_COMMA_IN_CALL,
164 Feature.TRAILING_COMMA_IN_DEF,
171 target_versions: Set[TargetVersion] = Factory(set)
172 line_length: int = DEFAULT_LINE_LENGTH
173 string_normalization: bool = True
176 def get_cache_key(self) -> str:
177 if self.target_versions:
178 version_str = ",".join(
180 for version in sorted(self.target_versions, key=lambda v: v.value)
186 str(self.line_length),
187 str(int(self.string_normalization)),
188 str(int(self.is_pyi)),
190 return ".".join(parts)
def supports_feature(target_versions: Set[TargetVersion], feature: Feature) -> bool:
    """Return True if every version in `target_versions` supports `feature`.

    Support is looked up per version in `VERSION_TO_FEATURES`.  An empty
    `target_versions` yields True, because `all()` of an empty iterable is
    True.
    """
    return all(feature in VERSION_TO_FEATURES[version] for version in target_versions)
197 def read_pyproject_toml(
198 ctx: click.Context, param: click.Parameter, value: Union[str, int, bool, None]
200 """Inject Black configuration from "pyproject.toml" into defaults in `ctx`.
202 Returns the path to a successfully found and read configuration file, None
205 assert not isinstance(value, (int, bool)), "Invalid parameter type passed"
207 root = find_project_root(ctx.params.get("src", ()))
208 path = root / "pyproject.toml"
215 pyproject_toml = toml.load(value)
216 config = pyproject_toml.get("tool", {}).get("black", {})
217 except (toml.TomlDecodeError, OSError) as e:
218 raise click.FileError(
219 filename=value, hint=f"Error reading configuration file: {e}"
225 if ctx.default_map is None:
227 ctx.default_map.update( # type: ignore # bad types in .pyi
228 {k.replace("--", "").replace("-", "_"): v for k, v in config.items()}
233 @click.command(context_settings=dict(help_option_names=["-h", "--help"]))
234 @click.option("-c", "--code", type=str, help="Format the code passed in as a string.")
239 default=DEFAULT_LINE_LENGTH,
240 help="How many characters per line to allow.",
246 type=click.Choice([v.name.lower() for v in TargetVersion]),
247 callback=lambda c, p, v: [TargetVersion[val.upper()] for val in v],
250 "Python versions that should be supported by Black's output. [default: "
251 "per-file auto-detection]"
258 "Allow using Python 3.6-only syntax on all input files. This will put "
259 "trailing commas in function signatures and calls also after *args and "
260 "**kwargs. Deprecated; use --target-version instead. "
261 "[default: per-file auto-detection]"
268 "Format all input files like typing stubs regardless of file extension "
269 "(useful when piping source on standard input)."
274 "--skip-string-normalization",
276 help="Don't normalize string quotes or prefixes.",
282 "Don't write the files back, just return the status. Return code 0 "
283 "means nothing would change. Return code 1 means some files would be "
284 "reformatted. Return code 123 means there was an internal error."
290 help="Don't write the files back, just output a diff for each file on stdout.",
295 help="If --fast given, skip temporary sanity checks. [default: --safe]",
300 default=DEFAULT_INCLUDES,
302 "A regular expression that matches files and directories that should be "
303 "included on recursive searches. An empty value means all files are "
304 "included regardless of the name. Use forward slashes for directories on "
305 "all platforms (Windows, too). Exclusions are calculated first, inclusions "
313 default=DEFAULT_EXCLUDES,
315 "A regular expression that matches files and directories that should be "
316 "excluded on recursive searches. An empty value means no paths are excluded. "
317 "Use forward slashes for directories on all platforms (Windows, too). "
318 "Exclusions are calculated first, inclusions later."
327 "Don't emit non-error messages to stderr. Errors are still emitted, "
328 "silence those with 2>/dev/null."
336 "Also emit messages to stderr about files that were not changed or were "
337 "ignored due to --exclude=."
340 @click.version_option(version=__version__)
345 exists=True, file_okay=True, dir_okay=True, readable=True, allow_dash=True
352 exists=False, file_okay=True, dir_okay=False, readable=True, allow_dash=False
355 callback=read_pyproject_toml,
356 help="Read configuration from PATH.",
363 target_version: List[TargetVersion],
369 skip_string_normalization: bool,
375 config: Optional[str],
377 """The uncompromising code formatter."""
378 write_back = WriteBack.from_configuration(check=check, diff=diff)
381 err(f"Cannot use both --target-version and --py36")
384 versions = set(target_version)
387 "--py36 is deprecated and will be removed in a future version. "
388 "Use --target-version py36 instead."
390 versions = PY36_VERSIONS
392 # We'll autodetect later.
395 target_versions=versions,
396 line_length=line_length,
398 string_normalization=not skip_string_normalization,
400 if config and verbose:
401 out(f"Using configuration from {config}.", bold=False, fg="blue")
403 print(format_str(code, mode=mode))
406 include_regex = re_compile_maybe_verbose(include)
408 err(f"Invalid regular expression for include given: {include!r}")
411 exclude_regex = re_compile_maybe_verbose(exclude)
413 err(f"Invalid regular expression for exclude given: {exclude!r}")
415 report = Report(check=check, quiet=quiet, verbose=verbose)
416 root = find_project_root(src)
417 sources: Set[Path] = set()
422 gen_python_files_in_dir(p, root, include_regex, exclude_regex, report)
424 elif p.is_file() or s == "-":
425 # if a file was explicitly given, we don't care about its extension
428 err(f"invalid path: {s}")
429 if len(sources) == 0:
430 if verbose or not quiet:
431 out("No paths given. Nothing to do 😴")
434 if len(sources) == 1:
438 write_back=write_back,
444 sources=sources, fast=fast, write_back=write_back, mode=mode, report=report
447 if verbose or not quiet:
448 bang = "💥 💔 💥" if report.return_code else "✨ 🍰 ✨"
449 out(f"All done! {bang}")
450 click.secho(str(report), err=True)
451 ctx.exit(report.return_code)
455 src: Path, fast: bool, write_back: WriteBack, mode: FileMode, report: "Report"
457 """Reformat a single file under `src` without spawning child processes.
459 If `quiet` is True, non-error messages are not output. `line_length`,
460 `write_back`, `fast` and `pyi` options are passed to
461 :func:`format_file_in_place` or :func:`format_stdin_to_stdout`.
465 if not src.is_file() and str(src) == "-":
466 if format_stdin_to_stdout(fast=fast, write_back=write_back, mode=mode):
467 changed = Changed.YES
470 if write_back != WriteBack.DIFF:
471 cache = read_cache(mode)
472 res_src = src.resolve()
473 if res_src in cache and cache[res_src] == get_cache_info(res_src):
474 changed = Changed.CACHED
475 if changed is not Changed.CACHED and format_file_in_place(
476 src, fast=fast, write_back=write_back, mode=mode
478 changed = Changed.YES
479 if (write_back is WriteBack.YES and changed is not Changed.CACHED) or (
480 write_back is WriteBack.CHECK and changed is Changed.NO
482 write_cache(cache, [src], mode)
483 report.done(src, changed)
484 except Exception as exc:
485 report.failed(src, str(exc))
491 write_back: WriteBack,
495 """Reformat multiple files using a ProcessPoolExecutor."""
496 loop = asyncio.get_event_loop()
497 worker_count = os.cpu_count()
498 if sys.platform == "win32":
499 # Work around https://bugs.python.org/issue26903
500 worker_count = min(worker_count, 61)
501 executor = ProcessPoolExecutor(max_workers=worker_count)
503 loop.run_until_complete(
507 write_back=write_back,
518 async def schedule_formatting(
521 write_back: WriteBack,
527 """Run formatting of `sources` in parallel using the provided `executor`.
529 (Use ProcessPoolExecutors for actual parallelism.)
531 `line_length`, `write_back`, `fast`, and `pyi` options are passed to
532 :func:`format_file_in_place`.
535 if write_back != WriteBack.DIFF:
536 cache = read_cache(mode)
537 sources, cached = filter_cached(cache, sources)
538 for src in sorted(cached):
539 report.done(src, Changed.CACHED)
544 sources_to_cache = []
546 if write_back == WriteBack.DIFF:
547 # For diff output, we need locks to ensure we don't interleave output
548 # from different processes.
550 lock = manager.Lock()
552 asyncio.ensure_future(
553 loop.run_in_executor(
554 executor, format_file_in_place, src, fast, mode, write_back, lock
557 for src in sorted(sources)
559 pending: Iterable[asyncio.Future] = tasks.keys()
561 loop.add_signal_handler(signal.SIGINT, cancel, pending)
562 loop.add_signal_handler(signal.SIGTERM, cancel, pending)
563 except NotImplementedError:
564 # There are no good alternatives for these on Windows.
567 done, _ = await asyncio.wait(pending, return_when=asyncio.FIRST_COMPLETED)
569 src = tasks.pop(task)
571 cancelled.append(task)
572 elif task.exception():
573 report.failed(src, str(task.exception()))
575 changed = Changed.YES if task.result() else Changed.NO
576 # If the file was written back or was successfully checked as
577 # well-formatted, store this information in the cache.
578 if write_back is WriteBack.YES or (
579 write_back is WriteBack.CHECK and changed is Changed.NO
581 sources_to_cache.append(src)
582 report.done(src, changed)
584 await asyncio.gather(*cancelled, loop=loop, return_exceptions=True)
586 write_cache(cache, sources_to_cache, mode)
589 def format_file_in_place(
593 write_back: WriteBack = WriteBack.NO,
594 lock: Any = None, # multiprocessing.Manager().Lock() is some crazy proxy
596 """Format file under `src` path. Return True if changed.
598 If `write_back` is DIFF, write a diff to stdout. If it is YES, write reformatted
600 `line_length` and `fast` options are passed to :func:`format_file_contents`.
602 if src.suffix == ".pyi":
603 mode = evolve(mode, is_pyi=True)
605 then = datetime.utcfromtimestamp(src.stat().st_mtime)
606 with open(src, "rb") as buf:
607 src_contents, encoding, newline = decode_bytes(buf.read())
609 dst_contents = format_file_contents(src_contents, fast=fast, mode=mode)
610 except NothingChanged:
613 if write_back == write_back.YES:
614 with open(src, "w", encoding=encoding, newline=newline) as f:
615 f.write(dst_contents)
616 elif write_back == write_back.DIFF:
617 now = datetime.utcnow()
618 src_name = f"{src}\t{then} +0000"
619 dst_name = f"{src}\t{now} +0000"
620 diff_contents = diff(src_contents, dst_contents, src_name, dst_name)
624 f = io.TextIOWrapper(
630 f.write(diff_contents)
638 def format_stdin_to_stdout(
639 fast: bool, *, write_back: WriteBack = WriteBack.NO, mode: FileMode
641 """Format file on stdin. Return True if changed.
643 If `write_back` is YES, write reformatted code back to stdout. If it is DIFF,
644 write a diff to stdout. The `mode` argument is passed to
645 :func:`format_file_contents`.
647 then = datetime.utcnow()
648 src, encoding, newline = decode_bytes(sys.stdin.buffer.read())
651 dst = format_file_contents(src, fast=fast, mode=mode)
654 except NothingChanged:
658 f = io.TextIOWrapper(
659 sys.stdout.buffer, encoding=encoding, newline=newline, write_through=True
661 if write_back == WriteBack.YES:
663 elif write_back == WriteBack.DIFF:
664 now = datetime.utcnow()
665 src_name = f"STDIN\t{then} +0000"
666 dst_name = f"STDOUT\t{now} +0000"
667 f.write(diff(src, dst, src_name, dst_name))
671 def format_file_contents(
672 src_contents: str, *, fast: bool, mode: FileMode
674 """Reformat contents of a file and return new contents.
676 If `fast` is False, additionally confirm that the reformatted code is
677 valid by calling :func:`assert_equivalent` and :func:`assert_stable` on it.
678 `line_length` is passed to :func:`format_str`.
680 if src_contents.strip() == "":
683 dst_contents = format_str(src_contents, mode=mode)
684 if src_contents == dst_contents:
688 assert_equivalent(src_contents, dst_contents)
689 assert_stable(src_contents, dst_contents, mode=mode)
693 def format_str(src_contents: str, *, mode: FileMode) -> FileContent:
694 """Reformat a string and return new contents.
696 `line_length` determines how many characters per line are allowed.
698 src_node = lib2to3_parse(src_contents.lstrip(), mode.target_versions)
700 future_imports = get_future_imports(src_node)
701 if mode.target_versions:
702 versions = mode.target_versions
704 versions = detect_target_versions(src_node)
705 normalize_fmt_off(src_node)
706 lines = LineGenerator(
707 remove_u_prefix="unicode_literals" in future_imports
708 or supports_feature(versions, Feature.UNICODE_LITERALS),
710 normalize_strings=mode.string_normalization,
712 elt = EmptyLineTracker(is_pyi=mode.is_pyi)
715 split_line_features = {
717 for feature in {Feature.TRAILING_COMMA_IN_CALL, Feature.TRAILING_COMMA_IN_DEF}
718 if supports_feature(versions, feature)
720 for current_line in lines.visit(src_node):
721 for _ in range(after):
722 dst_contents += str(empty_line)
723 before, after = elt.maybe_empty_lines(current_line)
724 for _ in range(before):
725 dst_contents += str(empty_line)
726 for line in split_line(
727 current_line, line_length=mode.line_length, features=split_line_features
729 dst_contents += str(line)
733 def decode_bytes(src: bytes) -> Tuple[FileContent, Encoding, NewLine]:
734 """Return a tuple of (decoded_contents, encoding, newline).
736 `newline` is either CRLF or LF but `decoded_contents` is decoded with
737 universal newlines (i.e. only contains LF).
739 srcbuf = io.BytesIO(src)
740 encoding, lines = tokenize.detect_encoding(srcbuf.readline)
742 return "", encoding, "\n"
744 newline = "\r\n" if b"\r\n" == lines[0][-2:] else "\n"
746 with io.TextIOWrapper(srcbuf, encoding) as tiow:
747 return tiow.read(), encoding, newline
750 def get_grammars(target_versions: Set[TargetVersion]) -> List[Grammar]:
751 if not target_versions:
752 # No target_version specified, so try all grammars.
754 pygram.python_grammar_no_print_statement_no_exec_statement,
755 pygram.python_grammar_no_print_statement,
756 pygram.python_grammar,
758 elif all(version.is_python2() for version in target_versions):
759 # Python 2-only code, so try Python 2 grammars.
760 return [pygram.python_grammar_no_print_statement, pygram.python_grammar]
762 # Python 3-compatible code, so only try Python 3 grammar.
763 return [pygram.python_grammar_no_print_statement_no_exec_statement]
766 def lib2to3_parse(src_txt: str, target_versions: Iterable[TargetVersion] = ()) -> Node:
767 """Given a string with source, return the lib2to3 Node."""
768 if src_txt[-1:] != "\n":
771 for grammar in get_grammars(set(target_versions)):
772 drv = driver.Driver(grammar, pytree.convert)
774 result = drv.parse_string(src_txt, True)
777 except ParseError as pe:
778 lineno, column = pe.context[1]
779 lines = src_txt.splitlines()
781 faulty_line = lines[lineno - 1]
783 faulty_line = "<line number missing in source>"
784 exc = InvalidInput(f"Cannot parse: {lineno}:{column}: {faulty_line}")
788 if isinstance(result, Leaf):
789 result = Node(syms.file_input, [result])
793 def lib2to3_unparse(node: Node) -> str:
794 """Given a lib2to3 node, return its string representation."""
802 class Visitor(Generic[T]):
803 """Basic lib2to3 visitor that yields things of type `T` on `visit()`."""
805 def visit(self, node: LN) -> Iterator[T]:
806 """Main method to visit `node` and its children.
808 It tries to find a `visit_*()` method for the given `node.type`, like
809 `visit_simple_stmt` for Node objects or `visit_INDENT` for Leaf objects.
810 If no dedicated `visit_*()` method is found, chooses `visit_default()`
813 Then yields objects of type `T` from the selected visitor.
816 name = token.tok_name[node.type]
818 name = type_repr(node.type)
819 yield from getattr(self, f"visit_{name}", self.visit_default)(node)
def visit_default(self, node: LN) -> Iterator[T]:
    """Default `visit_*()` implementation. Recurses to children of `node`.

    Only `Node` objects are descended into; for anything else this
    generator yields nothing.
    """
    if isinstance(node, Node):
        for child in node.children:
            # Dispatch through `visit()` so each child gets its own
            # `visit_*()` handler.
            yield from self.visit(child)
829 class DebugVisitor(Visitor[T]):
832 def visit_default(self, node: LN) -> Iterator[T]:
833 indent = " " * (2 * self.tree_depth)
834 if isinstance(node, Node):
835 _type = type_repr(node.type)
836 out(f"{indent}{_type}", fg="yellow")
838 for child in node.children:
839 yield from self.visit(child)
842 out(f"{indent}/{_type}", fg="yellow", bold=False)
844 _type = token.tok_name.get(node.type, str(node.type))
845 out(f"{indent}{_type}", fg="blue", nl=False)
847 # We don't have to handle prefixes for `Node` objects since
848 # that delegates to the first child anyway.
849 out(f" {node.prefix!r}", fg="green", bold=False, nl=False)
850 out(f" {node.value!r}", fg="blue", bold=False)
853 def show(cls, code: Union[str, Leaf, Node]) -> None:
854 """Pretty-print the lib2to3 AST of a given string of `code`.
856 Convenience method for debugging.
858 v: DebugVisitor[None] = DebugVisitor()
859 if isinstance(code, str):
860 code = lib2to3_parse(code)
864 WHITESPACE = {token.DEDENT, token.INDENT, token.NEWLINE}
875 STANDALONE_COMMENT = 153
876 token.tok_name[STANDALONE_COMMENT] = "STANDALONE_COMMENT"
877 LOGIC_OPERATORS = {"and", "or"}
902 STARS = {token.STAR, token.DOUBLESTAR}
905 syms.argument, # double star in arglist
906 syms.trailer, # single argument to call
908 syms.varargslist, # lambdas
910 UNPACKING_PARENTS = {
911 syms.atom, # single element of a list or set literal
915 syms.testlist_star_expr,
950 COMPREHENSION_PRIORITY = 20
952 TERNARY_PRIORITY = 16
955 COMPARATOR_PRIORITY = 10
966 token.DOUBLESLASH: 4,
976 class BracketTracker:
977 """Keeps track of brackets on a line."""
980 bracket_match: Dict[Tuple[Depth, NodeType], Leaf] = Factory(dict)
981 delimiters: Dict[LeafID, Priority] = Factory(dict)
982 previous: Optional[Leaf] = None
983 _for_loop_depths: List[int] = Factory(list)
984 _lambda_argument_depths: List[int] = Factory(list)
986 def mark(self, leaf: Leaf) -> None:
987 """Mark `leaf` with bracket-related metadata. Keep track of delimiters.
989 All leaves receive an int `bracket_depth` field that stores how deep
990 within brackets a given leaf is. 0 means there are no enclosing brackets
991 that started on this line.
993 If a leaf is itself a closing bracket, it receives an `opening_bracket`
994 field that it forms a pair with. This is a one-directional link to
995 avoid reference cycles.
997 If a leaf is a delimiter (a token on which Black can split the line if
998 needed) and it's on depth 0, its `id()` is stored in the tracker's
1001 if leaf.type == token.COMMENT:
1004 self.maybe_decrement_after_for_loop_variable(leaf)
1005 self.maybe_decrement_after_lambda_arguments(leaf)
1006 if leaf.type in CLOSING_BRACKETS:
1008 opening_bracket = self.bracket_match.pop((self.depth, leaf.type))
1009 leaf.opening_bracket = opening_bracket
1010 leaf.bracket_depth = self.depth
1012 delim = is_split_before_delimiter(leaf, self.previous)
1013 if delim and self.previous is not None:
1014 self.delimiters[id(self.previous)] = delim
1016 delim = is_split_after_delimiter(leaf, self.previous)
1018 self.delimiters[id(leaf)] = delim
1019 if leaf.type in OPENING_BRACKETS:
1020 self.bracket_match[self.depth, BRACKET[leaf.type]] = leaf
1022 self.previous = leaf
1023 self.maybe_increment_lambda_arguments(leaf)
1024 self.maybe_increment_for_loop_variable(leaf)
def any_open_brackets(self) -> bool:
    """Return True if there is a yet unmatched open bracket on the line.

    `mark()` adds an entry to `bracket_match` for every opening bracket and
    pops it again on the matching closing bracket, so a non-empty mapping
    means at least one bracket is still open.
    """
    return bool(self.bracket_match)
def max_delimiter_priority(self, exclude: Iterable[LeafID] = ()) -> int:
    """Return the highest priority of a delimiter found on the line.

    Values are consistent with what `is_split_*_delimiter()` return.
    Delimiters whose key in `self.delimiters` appears in `exclude` are
    ignored.

    Raises ValueError on no delimiters (including when all of them are
    excluded), because `max()` is given an empty iterable.
    """
    return max(v for k, v in self.delimiters.items() if k not in exclude)
1038 def delimiter_count_with_priority(self, priority: int = 0) -> int:
1039 """Return the number of delimiters with the given `priority`.
1041 If no `priority` is passed, defaults to max priority on the line.
1043 if not self.delimiters:
1046 priority = priority or self.max_delimiter_priority()
1047 return sum(1 for p in self.delimiters.values() if p == priority)
1049 def maybe_increment_for_loop_variable(self, leaf: Leaf) -> bool:
1050 """In a for loop, or comprehension, the variables are often unpacks.
1052 To avoid splitting on the comma in this situation, increase the depth of
1053 tokens between `for` and `in`.
1055 if leaf.type == token.NAME and leaf.value == "for":
1057 self._for_loop_depths.append(self.depth)
1062 def maybe_decrement_after_for_loop_variable(self, leaf: Leaf) -> bool:
1063 """See `maybe_increment_for_loop_variable` above for explanation."""
1065 self._for_loop_depths
1066 and self._for_loop_depths[-1] == self.depth
1067 and leaf.type == token.NAME
1068 and leaf.value == "in"
1071 self._for_loop_depths.pop()
1076 def maybe_increment_lambda_arguments(self, leaf: Leaf) -> bool:
1077 """In a lambda expression, there might be more than one argument.
1079 To avoid splitting on the comma in this situation, increase the depth of
1080 tokens between `lambda` and `:`.
1082 if leaf.type == token.NAME and leaf.value == "lambda":
1084 self._lambda_argument_depths.append(self.depth)
1089 def maybe_decrement_after_lambda_arguments(self, leaf: Leaf) -> bool:
1090 """See `maybe_increment_lambda_arguments` above for explanation."""
1092 self._lambda_argument_depths
1093 and self._lambda_argument_depths[-1] == self.depth
1094 and leaf.type == token.COLON
1097 self._lambda_argument_depths.pop()
def get_open_lsqb(self) -> Optional[Leaf]:
    """Return the most recent opening square bracket (if any).

    Looks in `bracket_match` for the entry keyed by the enclosing depth
    (`self.depth - 1`) and `token.RSQB`; `mark()` files each opening bracket
    under the type of the closing bracket that will pop it.  Returns None
    when there is no such entry.
    """
    return self.bracket_match.get((self.depth - 1, token.RSQB))
1109 """Holds leaves and comments. Can be printed with `str(line)`."""
1112 leaves: List[Leaf] = Factory(list)
1113 comments: Dict[LeafID, List[Leaf]] = Factory(dict) # keys ordered like `leaves`
1114 bracket_tracker: BracketTracker = Factory(BracketTracker)
1115 inside_brackets: bool = False
1116 should_explode: bool = False
1118 def append(self, leaf: Leaf, preformatted: bool = False) -> None:
1119 """Add a new `leaf` to the end of the line.
1121 Unless `preformatted` is True, the `leaf` will receive a new consistent
1122 whitespace prefix and metadata applied by :class:`BracketTracker`.
1123 Trailing commas are maybe removed, unpacked for loop variables are
1124 demoted from being delimiters.
1126 Inline comments are put aside.
1128 has_value = leaf.type in BRACKETS or bool(leaf.value.strip())
1132 if token.COLON == leaf.type and self.is_class_paren_empty:
1133 del self.leaves[-2:]
1134 if self.leaves and not preformatted:
1135 # Note: at this point leaf.prefix should be empty except for
1136 # imports, for which we only preserve newlines.
1137 leaf.prefix += whitespace(
1138 leaf, complex_subscript=self.is_complex_subscript(leaf)
1140 if self.inside_brackets or not preformatted:
1141 self.bracket_tracker.mark(leaf)
1142 self.maybe_remove_trailing_comma(leaf)
1143 if not self.append_comment(leaf):
1144 self.leaves.append(leaf)
1146 def append_safe(self, leaf: Leaf, preformatted: bool = False) -> None:
1147 """Like :func:`append()` but disallow invalid standalone comment structure.
1149 Raises ValueError when any `leaf` is appended after a standalone comment
1150 or when a standalone comment is not the first leaf on the line.
1152 if self.bracket_tracker.depth == 0:
1154 raise ValueError("cannot append to standalone comments")
1156 if self.leaves and leaf.type == STANDALONE_COMMENT:
1158 "cannot append standalone comments to a populated line"
1161 self.append(leaf, preformatted=preformatted)
def is_comment(self) -> bool:
    """Is this line a standalone comment?

    True only when the line holds exactly one leaf and that leaf's type is
    `STANDALONE_COMMENT`.
    """
    return len(self.leaves) == 1 and self.leaves[0].type == STANDALONE_COMMENT
def is_decorator(self) -> bool:
    """Is this line a decorator?

    True when the line is truthy and its first leaf is an `@` token
    (`token.AT`).
    """
    # `bool(self)` guards the index below against an empty `leaves` list.
    return bool(self) and self.leaves[0].type == token.AT
def is_import(self) -> bool:
    """Is this an import line?

    True when the line is truthy and `is_import()` accepts its first leaf.
    """
    # `bool(self)` guards the index below against an empty `leaves` list.
    return bool(self) and is_import(self.leaves[0])
1179 def is_class(self) -> bool:
1180 """Is this line a class definition?"""
1183 and self.leaves[0].type == token.NAME
1184 and self.leaves[0].value == "class"
def is_stub_class(self) -> bool:
    """Is this line a class definition with a body consisting only of "..."?

    Requires `self.is_class` to be truthy and the last three leaves to
    compare equal to three `token.DOT` leaves.
    """
    return self.is_class and self.leaves[-3:] == [
        Leaf(token.DOT, ".") for _ in range(3)
    ]
1195 def is_def(self) -> bool:
1196 """Is this a function definition? (Also returns True for async defs.)"""
1198 first_leaf = self.leaves[0]
1203 second_leaf: Optional[Leaf] = self.leaves[1]
1206 return (first_leaf.type == token.NAME and first_leaf.value == "def") or (
1207 first_leaf.type == token.ASYNC
1208 and second_leaf is not None
1209 and second_leaf.type == token.NAME
1210 and second_leaf.value == "def"
1214 def is_class_paren_empty(self) -> bool:
1215 """Is this a class with no base classes but using parentheses?
1217 Those are unnecessary and should be removed.
1221 and len(self.leaves) == 4
1223 and self.leaves[2].type == token.LPAR
1224 and self.leaves[2].value == "("
1225 and self.leaves[3].type == token.RPAR
1226 and self.leaves[3].value == ")"
1230 def is_triple_quoted_string(self) -> bool:
1231 """Is the line a triple quoted string?"""
1234 and self.leaves[0].type == token.STRING
1235 and self.leaves[0].value.startswith(('"""', "'''"))
1238 def contains_standalone_comments(self, depth_limit: int = sys.maxsize) -> bool:
1239 """If so, needs to be split before emitting."""
1240 for leaf in self.leaves:
1241 if leaf.type == STANDALONE_COMMENT:
1242 if leaf.bracket_depth <= depth_limit:
1246 def contains_inner_type_comments(self) -> bool:
1249 last_leaf = self.leaves[-1]
1250 ignored_ids.add(id(last_leaf))
1251 if last_leaf.type == token.COMMA:
1252 # When trailing commas are inserted by Black for consistency, comments
1253 # after the previous last element are not moved (they don't have to,
1254 # rendering will still be correct). So we ignore trailing commas.
1255 last_leaf = self.leaves[-2]
1256 ignored_ids.add(id(last_leaf))
1260 for leaf_id, comments in self.comments.items():
1261 if leaf_id in ignored_ids:
1264 for comment in comments:
1265 if is_type_comment(comment):
1270 def contains_multiline_strings(self) -> bool:
1271 for leaf in self.leaves:
1272 if is_multiline_string(leaf):
1277 def maybe_remove_trailing_comma(self, closing: Leaf) -> bool:
1278 """Remove trailing comma if there is one and it's safe."""
1281 and self.leaves[-1].type == token.COMMA
1282 and closing.type in CLOSING_BRACKETS
1286 if closing.type == token.RBRACE:
1287 self.remove_trailing_comma()
1290 if closing.type == token.RSQB:
1291 comma = self.leaves[-1]
1292 if comma.parent and comma.parent.type == syms.listmaker:
1293 self.remove_trailing_comma()
1296 # For parens let's check if it's safe to remove the comma.
1297 # Imports are always safe.
1299 self.remove_trailing_comma()
1302 # Otherwise, if the trailing one is the only one, we might mistakenly
1303 # change a tuple into a different type by removing the comma.
1304 depth = closing.bracket_depth + 1
1306 opening = closing.opening_bracket
1307 for _opening_index, leaf in enumerate(self.leaves):
1314 for leaf in self.leaves[_opening_index + 1 :]:
1318 bracket_depth = leaf.bracket_depth
1319 if bracket_depth == depth and leaf.type == token.COMMA:
1321 if leaf.parent and leaf.parent.type == syms.arglist:
1326 self.remove_trailing_comma()
1331 def append_comment(self, comment: Leaf) -> bool:
1332 """Add an inline or standalone comment to the line."""
1334 comment.type == STANDALONE_COMMENT
1335 and self.bracket_tracker.any_open_brackets()
1340 if comment.type != token.COMMENT:
1344 comment.type = STANDALONE_COMMENT
1348 self.comments.setdefault(id(self.leaves[-1]), []).append(comment)
def comments_after(self, leaf: Leaf) -> List[Leaf]:
    """Return the comments that should appear directly after `leaf`.

    Comments are looked up in `self.comments` by `id(leaf)`.  The stored
    list itself is returned (not a copy); a fresh empty list is returned
    when `leaf` has no comments.
    """
    return self.comments.get(id(leaf), [])
def remove_trailing_comma(self) -> None:
    """Remove the trailing comma and move the comments attached to it.

    Pops the last leaf from `self.leaves` and appends any comments that
    were keyed by it to the comment list of the leaf that is now last.
    """
    trailing_comma = self.leaves.pop()
    trailing_comma_comments = self.comments.pop(id(trailing_comma), [])
    # `setdefault` creates the new last leaf's entry even when there is
    # nothing to move.
    self.comments.setdefault(id(self.leaves[-1]), []).extend(
        trailing_comma_comments
    )
1363 def is_complex_subscript(self, leaf: Leaf) -> bool:
1364 """Return True iff `leaf` is part of a slice with non-trivial exprs."""
1365 open_lsqb = self.bracket_tracker.get_open_lsqb()
1366 if open_lsqb is None:
1369 subscript_start = open_lsqb.next_sibling
1371 if isinstance(subscript_start, Node):
1372 if subscript_start.type == syms.listmaker:
1375 if subscript_start.type == syms.subscriptlist:
1376 subscript_start = child_towards(subscript_start, leaf)
1377 return subscript_start is not None and any(
1378 n.type in TEST_DESCENDANTS for n in subscript_start.pre_order()
1381 def __str__(self) -> str:
1382 """Render the line."""
1386 indent = " " * self.depth
1387 leaves = iter(self.leaves)
1388 first = next(leaves)
1389 res = f"{first.prefix}{indent}{first.value}"
1392 for comment in itertools.chain.from_iterable(self.comments.values()):
def __bool__(self) -> bool:
    """Return True if the line has leaves or comments."""
    return bool(self.leaves or self.comments)
1402 class EmptyLineTracker:
1403 """Provides a stateful method that returns the number of potential extra
1404 empty lines needed before and after the currently processed line.
1406 Note: this tracker works on lines that haven't been split yet. It assumes
1407 the prefix of the first leaf consists of optional newlines. Those newlines
1408 are consumed by `maybe_empty_lines()` and included in the computation.
1411 is_pyi: bool = False
1412 previous_line: Optional[Line] = None
1413 previous_after: int = 0
1414 previous_defs: List[int] = Factory(list)
def maybe_empty_lines(self, current_line: Line) -> Tuple[int, int]:
    """Return how many extra empty lines go before and after `current_line`.

    The raw counts come from `_maybe_empty_lines()`.  The "before" count is
    reduced by the "after" count handed out for the previous line.  The
    tracker then records `current_line` and its "after" count for the next call.

    This is what separates `def`, `async def` and `class` with extra empty
    lines (two on module-level).
    """
    raw_before, after = self._maybe_empty_lines(current_line)
    before = raw_before - self.previous_after
    self.previous_after = after
    self.previous_line = current_line
    return before, after
1428 def _maybe_empty_lines(self, current_line: Line) -> Tuple[int, int]:
1430 if current_line.depth == 0:
1431 max_allowed = 1 if self.is_pyi else 2
1432 if current_line.leaves:
1433 # Consume the first leaf's extra newlines.
1434 first_leaf = current_line.leaves[0]
1435 before = first_leaf.prefix.count("\n")
1436 before = min(before, max_allowed)
1437 first_leaf.prefix = ""
1440 depth = current_line.depth
1441 while self.previous_defs and self.previous_defs[-1] >= depth:
1442 self.previous_defs.pop()
1444 before = 0 if depth else 1
1446 before = 1 if depth else 2
1447 if current_line.is_decorator or current_line.is_def or current_line.is_class:
1448 return self._maybe_empty_lines_for_class_or_def(current_line, before)
1452 and self.previous_line.is_import
1453 and not current_line.is_import
1454 and depth == self.previous_line.depth
1456 return (before or 1), 0
1460 and self.previous_line.is_class
1461 and current_line.is_triple_quoted_string
1467 def _maybe_empty_lines_for_class_or_def(
1468 self, current_line: Line, before: int
1469 ) -> Tuple[int, int]:
1470 if not current_line.is_decorator:
1471 self.previous_defs.append(current_line.depth)
1472 if self.previous_line is None:
1473 # Don't insert empty lines before the first line in the file.
1476 if self.previous_line.is_decorator:
1479 if self.previous_line.depth < current_line.depth and (
1480 self.previous_line.is_class or self.previous_line.is_def
1485 self.previous_line.is_comment
1486 and self.previous_line.depth == current_line.depth
1492 if self.previous_line.depth > current_line.depth:
1494 elif current_line.is_class or self.previous_line.is_class:
1495 if current_line.is_stub_class and self.previous_line.is_stub_class:
1496 # No blank line between classes with an empty body
1500 elif current_line.is_def and not self.previous_line.is_def:
1501 # Blank line between a block of functions and a block of non-functions
1507 if current_line.depth and newlines:
1513 class LineGenerator(Visitor[Line]):
1514 """Generates reformatted Line objects. Empty lines are not emitted.
1516 Note: destroys the tree it's visiting by mutating prefixes of its leaves
1517 in ways that will no longer stringify to valid Python code on the tree.
1520 is_pyi: bool = False
1521 normalize_strings: bool = True
1522 current_line: Line = Factory(Line)
1523 remove_u_prefix: bool = False
1525 def line(self, indent: int = 0) -> Iterator[Line]:
1528 If the line is empty, only emit if it makes sense.
1529 If the line is too long, split it first and then generate.
1531 If any lines were generated, set up a new current_line.
1533 if not self.current_line:
1534 self.current_line.depth += indent
1535 return # Line is empty, don't emit. Creating a new one unnecessary.
1537 complete_line = self.current_line
1538 self.current_line = Line(depth=complete_line.depth + indent)
def visit_default(self, node: LN) -> Iterator[Line]:
    """Fallback `visit_*()` handler: process a leaf, then recurse via `super()`.

    For a `Leaf`, comments produced by `generate_comments()` are handled first,
    then the leaf's prefix, string and numeric literals are normalized, and the
    leaf is appended to the current line unless its type is in `WHITESPACE`.
    Finally the parent class' `visit_default()` is delegated to for every node.
    """
    if isinstance(node, Leaf):
        in_brackets = self.current_line.bracket_tracker.any_open_brackets()
        for comment in generate_comments(node):
            if in_brackets:
                # any comment within brackets is subject to splitting
                self.current_line.append(comment)
                continue

            if comment.type != token.COMMENT:
                # regular standalone comment: flush the pending line first so
                # the comment ends up on a line of its own
                yield from self.line()

            # trailing and standalone comments alike close the line they are on;
            # `self.current_line` is re-read because `line()` may replace it
            self.current_line.append(comment)
            yield from self.line()

        normalize_prefix(node, inside_brackets=in_brackets)
        if self.normalize_strings and node.type == token.STRING:
            normalize_string_prefix(node, remove_u_prefix=self.remove_u_prefix)
            normalize_string_quotes(node)
        if node.type == token.NUMBER:
            normalize_numeric_literal(node)
        if node.type not in WHITESPACE:
            self.current_line.append(node)
    yield from super().visit_default(node)
def visit_INDENT(self, node: Node) -> Iterator[Line]:
    """Increase indentation level, maybe yield a line.

    `self.line(+1)` closes the pending line and raises the depth used for the
    next one; `node` is then passed on to `visit_default()`.
    """
    # In blib2to3 INDENT never holds comments.
    yield from self.line(+1)
    yield from self.visit_default(node)
def visit_DEDENT(self, node: Node) -> Iterator[Line]:
    """Decrease indentation level, maybe yield a line.

    Three steps, in this order: close the pending line at the current depth,
    let `visit_default()` process `node` (and thereby the comments in its
    prefix), then call `self.line(-1)` to lower the depth for what follows.
    """
    # The current line might still wait for trailing comments.  At DEDENT time
    # there won't be any (they would be prefixes on the preceding NEWLINE).
    # Emit the line then.
    yield from self.line()

    # While DEDENT has no value, its prefix may contain standalone comments
    # that belong to the current indentation level.  Get 'em.
    yield from self.visit_default(node)

    # Finally, emit the dedent.
    yield from self.line(-1)
1592 self, node: Node, keywords: Set[str], parens: Set[str]
1593 ) -> Iterator[Line]:
1594 """Visit a statement.
1596 This implementation is shared for `if`, `while`, `for`, `try`, `except`,
1597 `def`, `with`, `class`, `assert` and assignments.
1599 The relevant Python language `keywords` for a given statement will be
1600 NAME leaves within it. This methods puts those on a separate line.
1602 `parens` holds a set of string leaf values immediately after which
1603 invisible parens should be put.
1605 normalize_invisible_parens(node, parens_after=parens)
1606 for child in node.children:
1607 if child.type == token.NAME and child.value in keywords: # type: ignore
1608 yield from self.line()
1610 yield from self.visit(child)
def visit_suite(self, node: Node) -> Iterator[Line]:
    """Visit a suite.

    In stub (`is_pyi`) mode, a suite accepted by `is_stub_suite()` is reduced to
    visiting only `node.children[2]`.  Every other suite is handled by
    `visit_default()`.
    """
    collapse_stub = self.is_pyi and is_stub_suite(node)
    if not collapse_stub:
        yield from self.visit_default(node)
        return

    yield from self.visit(node.children[2])
def visit_simple_stmt(self, node: Node) -> Iterator[Line]:
    """Visit a statement without nested statements.

    When the parent's type is in `STATEMENT`, the statement stands in for a
    suite: it is emitted one level deeper (`line(+1)` ... `line(-1)`), except
    for stub bodies in `is_pyi` mode, which are visited without changing depth.

    Otherwise the pending line is closed first, unless this is `is_pyi` mode
    and the parent is a stub suite, and the statement is then visited.
    """
    parent = node.parent
    if parent and parent.type in STATEMENT:
        keep_depth = self.is_pyi and is_stub_body(node)
        if not keep_depth:
            yield from self.line(+1)
        yield from self.visit_default(node)
        if not keep_depth:
            yield from self.line(-1)
        return

    stays_on_line = self.is_pyi and parent and is_stub_suite(parent)
    if not stays_on_line:
        yield from self.line()
    yield from self.visit_default(node)
def visit_async_stmt(self, node: Node) -> Iterator[Line]:
    """Visit `async def`, `async for`, `async with`.

    The pending line is closed, then children are visited up to and including
    the `ASYNC` token.  The child right after it is not visited as a node of its
    own: its children are visited directly instead.
    """
    yield from self.line()

    remaining = iter(node.children)
    for part in remaining:
        yield from self.visit(part)

        if part.type == token.ASYNC:
            break

    # the same iterator is reused so this is the child following `async`
    wrapped_stmt = next(remaining)
    for part in wrapped_stmt.children:
        yield from self.visit(part)
def visit_decorators(self, node: Node) -> Iterator[Line]:
    """Visit decorators, closing the pending line before each child of `node`."""
    for decorator in node.children:
        yield from self.line()
        yield from self.visit(decorator)
def visit_SEMI(self, leaf: Leaf) -> Iterator[Line]:
    """Remove a semicolon and put the other statement on a separate line.

    The semicolon leaf itself is never appended to a line: this method only
    closes the pending line via `self.line()`.
    """
    yield from self.line()
def visit_ENDMARKER(self, leaf: Leaf) -> Iterator[Line]:
    """End of file. Process outstanding comments and end with a newline.

    `visit_default()` handles the comments found in the end marker's prefix;
    the final `self.line()` closes whatever line is still pending.
    """
    yield from self.visit_default(leaf)
    yield from self.line()
def visit_STANDALONE_COMMENT(self, leaf: Leaf) -> Iterator[Line]:
    """Visit a standalone comment leaf.

    Outside of brackets the pending line is closed first; inside open brackets
    the comment stays on the current line.  Either way the leaf is then handed
    to `visit_default()`.
    """
    tracker = self.current_line.bracket_tracker
    if not tracker.any_open_brackets():
        yield from self.line()
    yield from self.visit_default(leaf)
1670 def __attrs_post_init__(self) -> None:
1671 """You are in a twisty little maze of passages."""
1674 self.visit_assert_stmt = partial(v, keywords={"assert"}, parens={"assert", ","})
1675 self.visit_if_stmt = partial(
1676 v, keywords={"if", "else", "elif"}, parens={"if", "elif"}
1678 self.visit_while_stmt = partial(v, keywords={"while", "else"}, parens={"while"})
1679 self.visit_for_stmt = partial(v, keywords={"for", "else"}, parens={"for", "in"})
1680 self.visit_try_stmt = partial(
1681 v, keywords={"try", "except", "else", "finally"}, parens=Ø
1683 self.visit_except_clause = partial(v, keywords={"except"}, parens=Ø)
1684 self.visit_with_stmt = partial(v, keywords={"with"}, parens=Ø)
1685 self.visit_funcdef = partial(v, keywords={"def"}, parens=Ø)
1686 self.visit_classdef = partial(v, keywords={"class"}, parens=Ø)
1687 self.visit_expr_stmt = partial(v, keywords=Ø, parens=ASSIGNMENTS)
1688 self.visit_return_stmt = partial(v, keywords={"return"}, parens={"return"})
1689 self.visit_import_from = partial(v, keywords=Ø, parens={"import"})
1690 self.visit_del_stmt = partial(v, keywords=Ø, parens={"del"})
1691 self.visit_async_funcdef = self.visit_async_stmt
1692 self.visit_decorated = self.visit_decorators
# Grammar symbols grouped under the name "implicit tuple".
IMPLICIT_TUPLE = {syms.testlist, syms.testlist_star_expr, syms.exprlist}
# Maps every opening bracket token type to its matching closing token type.
BRACKET = {token.LPAR: token.RPAR, token.LSQB: token.RSQB, token.LBRACE: token.RBRACE}
# The sets below are all derived from BRACKET.
OPENING_BRACKETS = set(BRACKET.keys())
CLOSING_BRACKETS = set(BRACKET.values())
BRACKETS = OPENING_BRACKETS | CLOSING_BRACKETS
# Leaf types tested by the `t in ALWAYS_NO_SPACE` check in `whitespace()`.
ALWAYS_NO_SPACE = CLOSING_BRACKETS | {token.COMMA, STANDALONE_COMMENT}
1703 def whitespace(leaf: Leaf, *, complex_subscript: bool) -> str: # noqa: C901
1704 """Return whitespace prefix if needed for the given `leaf`.
1706 `complex_subscript` signals whether the given leaf is part of a subscription
1707 which has non-trivial arguments, like arithmetic expressions or function calls.
1715 if t in ALWAYS_NO_SPACE:
1718 if t == token.COMMENT:
1721 assert p is not None, f"INTERNAL ERROR: hand-made leaf without parent: {leaf!r}"
1722 if t == token.COLON and p.type not in {
1729 prev = leaf.prev_sibling
1731 prevp = preceding_leaf(p)
1732 if not prevp or prevp.type in OPENING_BRACKETS:
1735 if t == token.COLON:
1736 if prevp.type == token.COLON:
1739 elif prevp.type != token.COMMA and not complex_subscript:
1744 if prevp.type == token.EQUAL:
1746 if prevp.parent.type in {
1754 elif prevp.parent.type == syms.typedargslist:
1755 # A bit hacky: if the equal sign has whitespace, it means we
1756 # previously found it's a typed argument. So, we're using
1760 elif prevp.type in STARS:
1761 if is_vararg(prevp, within=VARARGS_PARENTS | UNPACKING_PARENTS):
1764 elif prevp.type == token.COLON:
1765 if prevp.parent and prevp.parent.type in {syms.subscript, syms.sliceop}:
1766 return SPACE if complex_subscript else NO
1770 and prevp.parent.type == syms.factor
1771 and prevp.type in MATH_OPERATORS
1776 prevp.type == token.RIGHTSHIFT
1778 and prevp.parent.type == syms.shift_expr
1779 and prevp.prev_sibling
1780 and prevp.prev_sibling.type == token.NAME
1781 and prevp.prev_sibling.value == "print" # type: ignore
1783 # Python 2 print chevron
1786 elif prev.type in OPENING_BRACKETS:
1789 if p.type in {syms.parameters, syms.arglist}:
1790 # untyped function signatures or calls
1791 if not prev or prev.type != token.COMMA:
1794 elif p.type == syms.varargslist:
1796 if prev and prev.type != token.COMMA:
1799 elif p.type == syms.typedargslist:
1800 # typed function signatures
1804 if t == token.EQUAL:
1805 if prev.type != syms.tname:
1808 elif prev.type == token.EQUAL:
1809 # A bit hacky: if the equal sign has whitespace, it means we
1810 # previously found it's a typed argument. So, we're using that, too.
1813 elif prev.type != token.COMMA:
1816 elif p.type == syms.tname:
1819 prevp = preceding_leaf(p)
1820 if not prevp or prevp.type != token.COMMA:
1823 elif p.type == syms.trailer:
1824 # attributes and calls
1825 if t == token.LPAR or t == token.RPAR:
1830 prevp = preceding_leaf(p)
1831 if not prevp or prevp.type != token.NUMBER:
1834 elif t == token.LSQB:
1837 elif prev.type != token.COMMA:
1840 elif p.type == syms.argument:
1842 if t == token.EQUAL:
1846 prevp = preceding_leaf(p)
1847 if not prevp or prevp.type == token.LPAR:
1850 elif prev.type in {token.EQUAL} | STARS:
1853 elif p.type == syms.decorator:
1857 elif p.type == syms.dotted_name:
1861 prevp = preceding_leaf(p)
1862 if not prevp or prevp.type == token.AT or prevp.type == token.DOT:
1865 elif p.type == syms.classdef:
1869 if prev and prev.type == token.LPAR:
1872 elif p.type in {syms.subscript, syms.sliceop}:
1875 assert p.parent is not None, "subscripts are always parented"
1876 if p.parent.type == syms.subscriptlist:
1881 elif not complex_subscript:
1884 elif p.type == syms.atom:
1885 if prev and t == token.DOT:
1886 # dots, but not the first one.
1889 elif p.type == syms.dictsetmaker:
1891 if prev and prev.type == token.DOUBLESTAR:
1894 elif p.type in {syms.factor, syms.star_expr}:
1897 prevp = preceding_leaf(p)
1898 if not prevp or prevp.type in OPENING_BRACKETS:
1901 prevp_parent = prevp.parent
1902 assert prevp_parent is not None
1903 if prevp.type == token.COLON and prevp_parent.type in {
1909 elif prevp.type == token.EQUAL and prevp_parent.type == syms.argument:
1912 elif t in {token.NAME, token.NUMBER, token.STRING}:
1915 elif p.type == syms.import_from:
1917 if prev and prev.type == token.DOT:
1920 elif t == token.NAME:
1924 if prev and prev.type == token.DOT:
1927 elif p.type == syms.sliceop:
1933 def preceding_leaf(node: Optional[LN]) -> Optional[Leaf]:
1934 """Return the first leaf that precedes `node`, if any."""
1936 res = node.prev_sibling
1938 if isinstance(res, Leaf):
1942 return list(res.leaves())[-1]
1951 def child_towards(ancestor: Node, descendant: LN) -> Optional[LN]:
1952 """Return the child of `ancestor` that contains `descendant`."""
1953 node: Optional[LN] = descendant
1954 while node and node.parent != ancestor:
1959 def container_of(leaf: Leaf) -> LN:
1960 """Return `leaf` or one of its ancestors that is the topmost container of it.
1962 By "container" we mean a node where `leaf` is the very first child.
1964 same_prefix = leaf.prefix
1965 container: LN = leaf
1967 parent = container.parent
1971 if parent.children[0].prefix != same_prefix:
1974 if parent.type == syms.file_input:
1977 if parent.prev_sibling is not None and parent.prev_sibling.type in BRACKETS:
def is_split_after_delimiter(leaf: Leaf, previous: Optional[Leaf] = None) -> int:
    """Return the priority of `leaf` as a delimiter to break the line *after*.

    Only delimiters that cause a line break after themselves are reported here,
    which currently means commas.  Any other leaf yields 0.  `previous` is
    accepted but not consulted.

    Higher numbers are higher priority.
    """
    return COMMA_PRIORITY if leaf.type == token.COMMA else 0
1998 def is_split_before_delimiter(leaf: Leaf, previous: Optional[Leaf] = None) -> int:
1999 """Return the priority of the `leaf` delimiter, given a line break before it.
2001 The delimiter priorities returned here are from those delimiters that would
2002 cause a line break before themselves.
2004 Higher numbers are higher priority.
2006 if is_vararg(leaf, within=VARARGS_PARENTS | UNPACKING_PARENTS):
2007 # * and ** might also be MATH_OPERATORS but in this case they are not.
2008 # Don't treat them as a delimiter.
2012 leaf.type == token.DOT
2014 and leaf.parent.type not in {syms.import_from, syms.dotted_name}
2015 and (previous is None or previous.type in CLOSING_BRACKETS)
2020 leaf.type in MATH_OPERATORS
2022 and leaf.parent.type not in {syms.factor, syms.star_expr}
2024 return MATH_PRIORITIES[leaf.type]
2026 if leaf.type in COMPARATORS:
2027 return COMPARATOR_PRIORITY
2030 leaf.type == token.STRING
2031 and previous is not None
2032 and previous.type == token.STRING
2034 return STRING_PRIORITY
2036 if leaf.type not in {token.NAME, token.ASYNC}:
2042 and leaf.parent.type in {syms.comp_for, syms.old_comp_for}
2043 or leaf.type == token.ASYNC
2046 not isinstance(leaf.prev_sibling, Leaf)
2047 or leaf.prev_sibling.value != "async"
2049 return COMPREHENSION_PRIORITY
2054 and leaf.parent.type in {syms.comp_if, syms.old_comp_if}
2056 return COMPREHENSION_PRIORITY
2058 if leaf.value in {"if", "else"} and leaf.parent and leaf.parent.type == syms.test:
2059 return TERNARY_PRIORITY
2061 if leaf.value == "is":
2062 return COMPARATOR_PRIORITY
2067 and leaf.parent.type in {syms.comp_op, syms.comparison}
2069 previous is not None
2070 and previous.type == token.NAME
2071 and previous.value == "not"
2074 return COMPARATOR_PRIORITY
2079 and leaf.parent.type == syms.comp_op
2081 previous is not None
2082 and previous.type == token.NAME
2083 and previous.value == "is"
2086 return COMPARATOR_PRIORITY
2088 if leaf.value in LOGIC_OPERATORS and leaf.parent:
2089 return LOGIC_PRIORITY
# Exact comment texts that act as "formatting off" markers.  Besides Black's
# own spellings, the yapf equivalent is accepted as well.
FMT_OFF = {"# fmt: off", "# fmt:off", "# yapf: disable"}
# Exact comment texts that act as the matching "formatting on" markers.
FMT_ON = {"# fmt: on", "# fmt:on", "# yapf: enable"}
def generate_comments(leaf: LN) -> Iterator[Leaf]:
    """Yield a new comment `Leaf` for every comment found in `leaf.prefix`.

    lib2to3 keeps comments inside the whitespace prefix of the token that
    follows them (see `pgen2/driver.py:Driver.parse_tokens()`).  That spares the
    grammar from knowing about comments, but it also means a comment does not
    "belong" to any node.  The leaves created here are therefore parentless.

    That is enough for our purposes: we only need to tell inline comments from
    standalone ones (those that don't share their line with any code).  Inline
    comments are emitted as regular `token.COMMENT` leaves, standalone ones with
    the fake `STANDALONE_COMMENT` token type.  The classification itself is
    done by `list_comments()`.

    The prefix of each yielded leaf is one "\n" per newline counted before the
    comment.
    """
    at_endmarker = leaf.type == token.ENDMARKER
    for proto in list_comments(leaf.prefix, is_endmarker=at_endmarker):
        yield Leaf(proto.type, proto.value, prefix="\n" * proto.newlines)
2123 """Describes a piece of syntax that is a comment.
2125 It's not a :class:`blib2to3.pytree.Leaf` so that:
2127 * it can be cached (`Leaf` objects should not be reused more than once as
2128 they store their lineno, column, prefix, and parent information);
2129 * `newlines` and `consumed` fields are kept separate from the `value`. This
2130 simplifies handling of special marker comments like ``# fmt: off/on``.
2133 type: int # token.COMMENT or STANDALONE_COMMENT
2134 value: str # content of the comment
2135 newlines: int # how many newlines before the comment
2136 consumed: int # how many characters of the original leaf's prefix did we consume
2139 @lru_cache(maxsize=4096)
2140 def list_comments(prefix: str, *, is_endmarker: bool) -> List[ProtoComment]:
2141 """Return a list of :class:`ProtoComment` objects parsed from the given `prefix`."""
2142 result: List[ProtoComment] = []
2143 if not prefix or "#" not in prefix:
2149 for index, line in enumerate(prefix.split("\n")):
2150 consumed += len(line) + 1 # adding the length of the split '\n'
2151 line = line.lstrip()
2154 if not line.startswith("#"):
2155 # Escaped newlines outside of a comment are not really newlines at
2156 # all. We treat a single-line comment following an escaped newline
2157 # as a simple trailing comment.
2158 if line.endswith("\\"):
2162 if index == ignored_lines and not is_endmarker:
2163 comment_type = token.COMMENT # simple trailing comment
2165 comment_type = STANDALONE_COMMENT
2166 comment = make_comment(line)
2169 type=comment_type, value=comment, newlines=nlines, consumed=consumed
def make_comment(content: str) -> str:
    """Return `content` as a consistently formatted comment string.

    Trailing whitespace is dropped and the result always starts with a single
    hash sign: one is added if `content` lacks it.  A space is inserted between
    the hash and the text, unless the text already begins with a space or with
    one of the characters that form the special openers "#!", "#:", "##", "#'"
    and "#%".  Empty or whitespace-only `content` yields a bare "#".
    """
    text = content.rstrip()
    if not text:
        return "#"

    body = text[1:] if text[0] == "#" else text
    if body and body[0] not in " !:#'%":
        body = " " + body
    return "#" + body
2198 inner: bool = False,
2199 features: Collection[Feature] = (),
2200 ) -> Iterator[Line]:
2201 """Split a `line` into potentially many lines.
2203 They should fit in the allotted `line_length` but might not be able to.
2204 `inner` signifies that there were a pair of brackets somewhere around the
2205 current `line`, possibly transitively. This means we can fallback to splitting
2206 by delimiters if the LHS/RHS don't yield any results.
2208 `features` are syntactical features that may be used in the output.
2214 line_str = str(line).strip("\n")
2217 not line.contains_inner_type_comments()
2218 and not line.should_explode
2219 and is_line_short_enough(line, line_length=line_length, line_str=line_str)
2224 split_funcs: List[SplitFunc]
2226 split_funcs = [left_hand_split]
2229 def rhs(line: Line, features: Collection[Feature]) -> Iterator[Line]:
2230 for omit in generate_trailers_to_omit(line, line_length):
2231 lines = list(right_hand_split(line, line_length, features, omit=omit))
2232 if is_line_short_enough(lines[0], line_length=line_length):
2236 # All splits failed, best effort split with no omits.
2237 # This mostly happens to multiline strings that are by definition
2238 # reported as not fitting a single line.
2239 yield from right_hand_split(line, line_length, features=features)
2241 if line.inside_brackets:
2242 split_funcs = [delimiter_split, standalone_comment_split, rhs]
2245 for split_func in split_funcs:
2246 # We are accumulating lines in `result` because we might want to abort
2247 # mission and return the original line in the end, or attempt a different
2249 result: List[Line] = []
2251 for l in split_func(line, features):
2252 if str(l).strip("\n") == line_str:
2253 raise CannotSplit("Split function returned an unchanged result")
2257 l, line_length=line_length, inner=True, features=features
def left_hand_split(line: Line, features: Collection[Feature] = ()) -> Iterator[Line]:
    """Split `line` around its first matching bracket pair.

    Leaves up to and including the first opening bracket form the head, leaves
    between the brackets form the body, and the closing bracket with everything
    after it forms the tail.  Non-empty parts are yielded in that order.

    Raises `CannotSplit` if the line has no opening bracket, or if
    `bracket_split_succeeded_or_raise()` rejects the result.

    Note: this usually looks weird, only use this for function definitions.
    Prefer RHS otherwise.  This is why this function is not symmetrical with
    :func:`right_hand_split` which also handles optional parentheses.
    """
    head_leaves: List[Leaf] = []
    body_leaves: List[Leaf] = []
    tail_leaves: List[Leaf] = []
    bucket = head_leaves
    matching_bracket = None
    for leaf in line.leaves:
        closes_body = (
            bucket is body_leaves
            and leaf.type in CLOSING_BRACKETS
            and leaf.opening_bracket is matching_bracket
        )
        if closes_body:
            # an empty body sends collection back to the head
            bucket = tail_leaves if body_leaves else head_leaves
        bucket.append(leaf)
        if bucket is head_leaves and leaf.type in OPENING_BRACKETS:
            matching_bracket = leaf
            bucket = body_leaves
    if not matching_bracket:
        raise CannotSplit("No brackets found")

    parts = (
        bracket_split_build_line(head_leaves, line, matching_bracket),
        bracket_split_build_line(body_leaves, line, matching_bracket, is_body=True),
        bracket_split_build_line(tail_leaves, line, matching_bracket),
    )
    bracket_split_succeeded_or_raise(*parts)
    for part in parts:
        if part:
            yield part
2307 def right_hand_split(
2310 features: Collection[Feature] = (),
2311 omit: Collection[LeafID] = (),
2312 ) -> Iterator[Line]:
2313 """Split line into many lines, starting with the last matching bracket pair.
2315 If the split was by optional parentheses, attempt splitting without them, too.
2316 `omit` is a collection of closing bracket IDs that shouldn't be considered for
2319 Note: running this function modifies `bracket_depth` on the leaves of `line`.
2321 tail_leaves: List[Leaf] = []
2322 body_leaves: List[Leaf] = []
2323 head_leaves: List[Leaf] = []
2324 current_leaves = tail_leaves
2325 opening_bracket = None
2326 closing_bracket = None
2327 for leaf in reversed(line.leaves):
2328 if current_leaves is body_leaves:
2329 if leaf is opening_bracket:
2330 current_leaves = head_leaves if body_leaves else tail_leaves
2331 current_leaves.append(leaf)
2332 if current_leaves is tail_leaves:
2333 if leaf.type in CLOSING_BRACKETS and id(leaf) not in omit:
2334 opening_bracket = leaf.opening_bracket
2335 closing_bracket = leaf
2336 current_leaves = body_leaves
2337 if not (opening_bracket and closing_bracket and head_leaves):
2338 # If there is no opening or closing_bracket that means the split failed and
2339 # all content is in the tail. Otherwise, if `head_leaves` are empty, it means
2340 # the matching `opening_bracket` wasn't available on `line` anymore.
2341 raise CannotSplit("No brackets found")
2343 tail_leaves.reverse()
2344 body_leaves.reverse()
2345 head_leaves.reverse()
2346 head = bracket_split_build_line(head_leaves, line, opening_bracket)
2347 body = bracket_split_build_line(body_leaves, line, opening_bracket, is_body=True)
2348 tail = bracket_split_build_line(tail_leaves, line, opening_bracket)
2349 bracket_split_succeeded_or_raise(head, body, tail)
2351 # the body shouldn't be exploded
2352 not body.should_explode
2353 # the opening bracket is an optional paren
2354 and opening_bracket.type == token.LPAR
2355 and not opening_bracket.value
2356 # the closing bracket is an optional paren
2357 and closing_bracket.type == token.RPAR
2358 and not closing_bracket.value
2359 # it's not an import (optional parens are the only thing we can split on
2360 # in this case; attempting a split without them is a waste of time)
2361 and not line.is_import
2362 # there are no standalone comments in the body
2363 and not body.contains_standalone_comments(0)
2364 # and we can actually remove the parens
2365 and can_omit_invisible_parens(body, line_length)
2367 omit = {id(closing_bracket), *omit}
2369 yield from right_hand_split(line, line_length, features=features, omit=omit)
2375 or is_line_short_enough(body, line_length=line_length)
2378 "Splitting failed, body is still too long and can't be split."
2381 elif head.contains_multiline_strings() or tail.contains_multiline_strings():
2383 "The current optional pair of parentheses is bound to fail to "
2384 "satisfy the splitting algorithm because the head or the tail "
2385 "contains multiline strings which by definition never fit one "
2389 ensure_visible(opening_bracket)
2390 ensure_visible(closing_bracket)
2391 for result in (head, body, tail):
2396 def bracket_split_succeeded_or_raise(head: Line, body: Line, tail: Line) -> None:
2397 """Raise :exc:`CannotSplit` if the last left- or right-hand split failed.
2399 Do nothing otherwise.
2401 A left- or right-hand split is based on a pair of brackets. Content before
2402 (and including) the opening bracket is left on one line, content inside the
2403 brackets is put on a separate line, and finally content starting with and
2404 following the closing bracket is put on a separate line.
2406 Those are called `head`, `body`, and `tail`, respectively. If the split
2407 produced the same line (all content in `head`) or ended up with an empty `body`
2408 and the `tail` is just the closing bracket, then it's considered failed.
2410 tail_len = len(str(tail).strip())
2413 raise CannotSplit("Splitting brackets produced the same line")
2417 f"Splitting brackets on an empty body to save "
2418 f"{tail_len} characters is not worth it"
2422 def bracket_split_build_line(
2423 leaves: List[Leaf], original: Line, opening_bracket: Leaf, *, is_body: bool = False
2425 """Return a new line with given `leaves` and respective comments from `original`.
2427 If `is_body` is True, the result line is one-indented inside brackets and as such
2428 has its first leaf's prefix normalized and a trailing comma added when expected.
2430 result = Line(depth=original.depth)
2432 result.inside_brackets = True
2435 # Since body is a new indent level, remove spurious leading whitespace.
2436 normalize_prefix(leaves[0], inside_brackets=True)
2437 # Ensure a trailing comma for imports, but be careful not to add one after
2439 if original.is_import:
2440 for i in range(len(leaves) - 1, -1, -1):
2441 if leaves[i].type == STANDALONE_COMMENT:
2443 elif leaves[i].type == token.COMMA:
2446 leaves.insert(i + 1, Leaf(token.COMMA, ","))
2450 result.append(leaf, preformatted=True)
2451 for comment_after in original.comments_after(leaf):
2452 result.append(comment_after, preformatted=True)
2454 result.should_explode = should_explode(result, opening_bracket)
def dont_increase_indentation(split_func: SplitFunc) -> SplitFunc:
    """Decorate `split_func` so the first leaf of every line it yields is normalized.

    Each line produced by the wrapped split function has
    `normalize_prefix(..., inside_brackets=True)` applied to its first leaf
    before it is passed on to the caller.
    """

    @wraps(split_func)
    def split_wrapper(line: Line, features: Collection[Feature] = ()) -> Iterator[Line]:
        for produced in split_func(line, features):
            first_leaf = produced.leaves[0]
            normalize_prefix(first_leaf, inside_brackets=True)
            yield produced

    return split_wrapper
2473 @dont_increase_indentation
2474 def delimiter_split(line: Line, features: Collection[Feature] = ()) -> Iterator[Line]:
2475 """Split according to delimiters of the highest priority.
2477 If the appropriate Features are given, the split will add trailing commas
2478 also in function signatures and calls that contain `*` and `**`.
2481 last_leaf = line.leaves[-1]
2483 raise CannotSplit("Line empty")
2485 bt = line.bracket_tracker
2487 delimiter_priority = bt.max_delimiter_priority(exclude={id(last_leaf)})
2489 raise CannotSplit("No delimiters found")
2491 if delimiter_priority == DOT_PRIORITY:
2492 if bt.delimiter_count_with_priority(delimiter_priority) == 1:
2493 raise CannotSplit("Splitting a single attribute from its owner looks wrong")
2495 current_line = Line(depth=line.depth, inside_brackets=line.inside_brackets)
2496 lowest_depth = sys.maxsize
2497 trailing_comma_safe = True
2499 def append_to_line(leaf: Leaf) -> Iterator[Line]:
2500 """Append `leaf` to current line or to new line if appending impossible."""
2501 nonlocal current_line
2503 current_line.append_safe(leaf, preformatted=True)
2507 current_line = Line(depth=line.depth, inside_brackets=line.inside_brackets)
2508 current_line.append(leaf)
2510 for leaf in line.leaves:
2511 yield from append_to_line(leaf)
2513 for comment_after in line.comments_after(leaf):
2514 yield from append_to_line(comment_after)
2516 lowest_depth = min(lowest_depth, leaf.bracket_depth)
2517 if leaf.bracket_depth == lowest_depth:
2518 if is_vararg(leaf, within={syms.typedargslist}):
2519 trailing_comma_safe = (
2520 trailing_comma_safe and Feature.TRAILING_COMMA_IN_DEF in features
2522 elif is_vararg(leaf, within={syms.arglist, syms.argument}):
2523 trailing_comma_safe = (
2524 trailing_comma_safe and Feature.TRAILING_COMMA_IN_CALL in features
2527 leaf_priority = bt.delimiters.get(id(leaf))
2528 if leaf_priority == delimiter_priority:
2531 current_line = Line(depth=line.depth, inside_brackets=line.inside_brackets)
2535 and delimiter_priority == COMMA_PRIORITY
2536 and current_line.leaves[-1].type != token.COMMA
2537 and current_line.leaves[-1].type != STANDALONE_COMMENT
2539 current_line.append(Leaf(token.COMMA, ","))
@dont_increase_indentation
def standalone_comment_split(
    line: Line, features: Collection[Feature] = ()
) -> Iterator[Line]:
    """Split standalone comments from the rest of the line.

    Leaves and the comments attached to them are collected into a fresh
    `Line`.  Whenever `append_safe()` rejects a leaf with ValueError, the
    collected line is emitted and a new one is started with that leaf.

    Raises CannotSplit when `line.contains_standalone_comments(0)` is false.
    `features` is not consulted by this function.
    """
    if not line.contains_standalone_comments(0):
        raise CannotSplit("Line does not have any standalone comments")

    def fresh_line() -> Line:
        """Return an empty line with the depth and bracket state of `line`."""
        return Line(depth=line.depth, inside_brackets=line.inside_brackets)

    pending = fresh_line()

    def emit_or_extend(item: Leaf) -> Iterator[Line]:
        """Add `item` to the pending line, flushing it first if it won't fit."""
        nonlocal pending
        try:
            pending.append_safe(item, preformatted=True)
        except ValueError:
            yield pending

            pending = fresh_line()
            pending.append(item)

    for leaf in line.leaves:
        yield from emit_or_extend(leaf)
        for trailing_comment in line.comments_after(leaf):
            yield from emit_or_extend(trailing_comment)

    # Whatever is left over forms the final line.
    if pending:
        yield pending
def is_import(leaf: Leaf) -> bool:
    """Return True if the given leaf starts an import statement.

    That is: a NAME leaf spelled `import` whose parent is an `import_name`
    node, or spelled `from` whose parent is an `import_from` node.
    """
    if leaf.type != token.NAME:
        return False

    parent = leaf.parent
    if not parent:
        return False

    keyword = leaf.value
    if keyword == "import":
        return bool(parent.type == syms.import_name)

    if keyword == "from":
        return bool(parent.type == syms.import_from)

    return False
def is_type_comment(leaf: Leaf) -> bool:
    """Return True if the given leaf is a special comment.

    Only returns true for type comments for now, i.e. regular or standalone
    comment leaves whose text starts with `# type:`.
    """
    # The previous membership test used `{token.COMMENT, t == STANDALONE_COMMENT}`,
    # which stored a boolean in the set, so standalone comments never matched.
    if leaf.type not in {token.COMMENT, STANDALONE_COMMENT}:
        return False

    return leaf.value.startswith("# type:")
def normalize_prefix(leaf: Leaf, *, inside_brackets: bool) -> None:
    """Leave existing extra newlines if not `inside_brackets`. Remove everything
    else.

    The newlines that are kept are the ones counted in the part of the prefix
    after the last `#` (minus one when the prefix contains a `#` at all).  If
    the part before the first `#` contains a backslash, the prefix is emptied.

    Note: don't use backslashes for formatting or you'll lose your voting rights.
    Note: Mutates its argument.
    """
    if inside_brackets:
        leaf.prefix = ""
        return

    chunks = leaf.prefix.split("#")
    if "\\" in chunks[0]:
        leaf.prefix = ""
        return

    newline_count = chunks[-1].count("\n")
    if len(chunks) > 1:
        newline_count -= 1
    leaf.prefix = "\n" * newline_count
def normalize_string_prefix(leaf: Leaf, remove_u_prefix: bool = False) -> None:
    """Make all string prefixes lowercase.

    If remove_u_prefix is given, also removes any u prefix from the string.

    Note: Mutates its argument.
    """
    parsed = re.match(r"^([furbFURB]*)(.*)$", leaf.value, re.DOTALL)
    assert parsed is not None, f"failed to match string {leaf.value!r}"
    string_prefix, remainder = parsed.group(1), parsed.group(2)
    string_prefix = string_prefix.lower()
    if remove_u_prefix:
        string_prefix = string_prefix.replace("u", "")
    leaf.value = f"{string_prefix}{remainder}"
def normalize_string_quotes(leaf: Leaf) -> None:
    """Prefer double quotes but only if it doesn't cause more escaping.

    Adds or removes backslashes as appropriate. Doesn't parse and fix
    strings nested in f-strings (yet).

    Note: Mutates its argument.
    """
    unprefixed = leaf.value.lstrip("furbFURB")
    opening = unprefixed[:3]
    if opening == '"""':
        # Already uses the preferred triple quotes.
        return

    if opening == "'''":
        orig_quote, new_quote = "'''", '"""'
    elif unprefixed[0] == '"':
        orig_quote, new_quote = '"', "'"
    else:
        orig_quote, new_quote = "'", '"'
    quote_start = leaf.value.find(orig_quote)
    if quote_start == -1:
        return  # There's an internal error

    prefix = leaf.value[:quote_start]
    lowered_prefix = prefix.casefold()
    unescaped_new_quote = re.compile(rf"(([^\\]|^)(\\\\)*){new_quote}")
    escaped_new_quote = re.compile(rf"([^\\]|^)\\((?:\\\\)*){new_quote}")
    escaped_orig_quote = re.compile(rf"([^\\]|^)\\((?:\\\\)*){orig_quote}")
    body = leaf.value[quote_start + len(orig_quote) : -len(orig_quote)]
    if "r" in lowered_prefix:
        if unescaped_new_quote.search(body):
            # There's at least one unescaped new_quote in this raw string
            # so converting is impossible
            return

        # Do not introduce or remove backslashes in raw strings
        new_body = body
    else:
        # remove unnecessary escapes
        without_extra_escapes = sub_twice(escaped_new_quote, rf"\1\2{new_quote}", body)
        if without_extra_escapes != body:
            # Consider the string without unnecessary escapes as the original
            body = without_extra_escapes
            leaf.value = f"{prefix}{orig_quote}{body}{orig_quote}"
        new_body = sub_twice(
            escaped_orig_quote, rf"\1\2{orig_quote}", without_extra_escapes
        )
        new_body = sub_twice(unescaped_new_quote, rf"\1\\{new_quote}", new_body)
    if "f" in lowered_prefix:
        for expression in re.findall(r"[^{]\{(.*?)\}[^}]", new_body):
            if "\\" in str(expression):
                # Do not introduce backslashes in interpolated expressions
                return

    if new_quote == '"""' and new_body[-1:] == '"':
        # edge case: a body ending in a double quote would run into the
        # closing triple quote, so that last quote gets escaped.
        new_body = new_body[:-1] + '\\"'
    escapes_before = body.count("\\")
    escapes_after = new_body.count("\\")
    if escapes_after > escapes_before:
        return  # Do not introduce more escaping

    if escapes_after == escapes_before and orig_quote == '"':
        return  # Prefer double quotes

    leaf.value = f"{prefix}{new_quote}{new_body}{new_quote}"
def normalize_numeric_literal(leaf: Leaf) -> None:
    """Normalizes numeric (float, int, and complex) literals.

    All letters used in the representation are normalized to lowercase (except
    in Python 2 long literals).  Hexadecimal digits are the other exception:
    they are uppercased after the lowercase `0x` marker.

    Note: Mutates its argument.
    """
    text = leaf.value.lower()
    if text.startswith(("0o", "0b")):
        # Leave octal and binary literals alone.
        normalized = text
    elif text.startswith("0x"):
        # Change hex literals to upper case.
        marker, digits = text[:2], text[2:]
        normalized = f"{marker}{digits.upper()}"
    elif "e" in text:
        mantissa, exponent = text.split("e")
        sign = ""
        if exponent.startswith("-"):
            exponent = exponent[1:]
            sign = "-"
        elif exponent.startswith("+"):
            # An explicit plus sign in the exponent is dropped.
            exponent = exponent[1:]
        mantissa = format_float_or_int_string(mantissa)
        normalized = f"{mantissa}e{sign}{exponent}"
    elif text.endswith(("j", "l")):
        number, suffix = text[:-1], text[-1]
        # Capitalize in "2L" because "l" looks too similar to "1".
        if suffix == "l":
            suffix = "L"
        normalized = f"{format_float_or_int_string(number)}{suffix}"
    else:
        normalized = format_float_or_int_string(text)
    leaf.value = normalized
def format_float_or_int_string(text: str) -> str:
    """Formats a float string like "1.0".

    Text without a dot is returned unchanged.  Otherwise an empty integer or
    fractional part is filled in with a zero.
    """
    if "." in text:
        integer_part, fraction_part = text.split(".")
        return f"{integer_part or 0}.{fraction_part or 0}"

    return text
def normalize_invisible_parens(node: Node, parens_after: Set[str]) -> None:
    """Make existing optional parentheses invisible or create new ones.

    `parens_after` is a set of string leaf values immediately after which parens
    should be put.

    Standardizes on visible parentheses for single-element tuples, and keeps
    existing visible parentheses for other tuples and generator expressions.

    Note: Mutates `node` in place.
    """
    if any(
        comment.value in FMT_OFF
        for comment in list_comments(node.prefix, is_endmarker=False)
    ):
        # This `node` has a prefix with `# fmt: off`, don't mess with parens.
        return

    wrap_this_child = False
    # Iterate over a snapshot because children get replaced along the way.
    for position, child in enumerate(list(node.children)):
        # Add parentheses around long tuple unpacking in assignments.
        if (
            position == 0
            and isinstance(child, Node)
            and child.type == syms.testlist_star_expr
        ):
            wrap_this_child = True

        if wrap_this_child:
            if child.type == syms.atom:
                if maybe_make_parens_invisible_in_atom(child, parent=node):
                    invisible_open = Leaf(token.LPAR, "")
                    invisible_close = Leaf(token.RPAR, "")
                    slot = child.remove() or 0
                    node.insert_child(
                        slot, Node(syms.atom, [invisible_open, child, invisible_close])
                    )
            elif is_one_tuple(child):
                # wrap child in visible parentheses
                visible_open = Leaf(token.LPAR, "(")
                visible_close = Leaf(token.RPAR, ")")
                child.remove()
                node.insert_child(
                    position, Node(syms.atom, [visible_open, child, visible_close])
                )
            elif node.type == syms.import_from:
                # "import from" nodes store parentheses directly as part of
                # the statement
                if child.type == token.LPAR:
                    # make parentheses invisible
                    child.value = ""  # type: ignore
                    node.children[-1].value = ""  # type: ignore
                elif child.type != token.STAR:
                    # insert invisible parentheses
                    node.insert_child(position, Leaf(token.LPAR, ""))
                    node.append_child(Leaf(token.RPAR, ""))
                break

            elif not (isinstance(child, Leaf) and is_multiline_string(child)):
                # wrap child in invisible parentheses
                invisible_open = Leaf(token.LPAR, "")
                invisible_close = Leaf(token.RPAR, "")
                slot = child.remove() or 0
                # The prefix moves from the child onto the new wrapping atom.
                saved_prefix = child.prefix
                child.prefix = ""
                wrapper = Node(syms.atom, [invisible_open, child, invisible_close])
                wrapper.prefix = saved_prefix
                node.insert_child(slot, wrapper)

        wrap_this_child = isinstance(child, Leaf) and child.value in parens_after
def normalize_fmt_off(node: Node) -> None:
    """Convert content between `# fmt: off`/`# fmt: on` into standalone comments.

    Pairs are converted one at a time until no conversion happens anymore.
    """
    while convert_one_fmt_off_pair(node):
        pass
def convert_one_fmt_off_pair(node: Node) -> bool:
    """Convert content of a single `# fmt: off`/`# fmt: on` into a standalone comment.

    The ignored nodes are removed from the tree and replaced by one
    STANDALONE_COMMENT leaf holding their source text verbatim.

    Returns True if a pair was converted.
    """
    for leaf in node.leaves():
        previous_consumed = 0
        for comment in list_comments(leaf.prefix, is_endmarker=False):
            if comment.value not in FMT_OFF:
                previous_consumed = comment.consumed
                continue

            # We only want standalone comments. If there's no previous leaf or
            # the previous leaf is indentation, it's a standalone comment in
            # disguise.
            if comment.type != STANDALONE_COMMENT:
                prev = preceding_leaf(leaf)
                if prev and prev.type not in WHITESPACE:
                    continue

            ignored_nodes = list(generate_ignored_nodes(leaf))
            if not ignored_nodes:
                continue

            first = ignored_nodes[0]  # Can be a container node with the `leaf`.
            parent = first.parent
            original_prefix = first.prefix
            first.prefix = original_prefix[comment.consumed :]
            verbatim = "".join(str(ignored) for ignored in ignored_nodes)
            hidden_value = comment.value + "\n" + verbatim
            if hidden_value.endswith("\n"):
                # That happens when one of the `ignored_nodes` ended with a NEWLINE
                # leaf (possibly followed by a DEDENT).
                hidden_value = hidden_value[:-1]
            # Detach every ignored node; the replacement goes where the first
            # successfully detached one used to be.
            removed_positions = [ignored.remove() for ignored in ignored_nodes]
            first_idx = next(
                (position for position in removed_positions if position is not None),
                None,
            )
            assert parent is not None, "INTERNAL ERROR: fmt: on/off handling (1)"
            assert first_idx is not None, "INTERNAL ERROR: fmt: on/off handling (2)"
            replacement = Leaf(
                STANDALONE_COMMENT,
                hidden_value,
                prefix=original_prefix[:previous_consumed] + "\n" * comment.newlines,
            )
            parent.insert_child(first_idx, replacement)
            return True

    return False
def generate_ignored_nodes(leaf: Leaf) -> Iterator[LN]:
    """Starting from the container of `leaf`, generate all leaves until `# fmt: on`.

    Walks the container's following siblings and stops at the first one whose
    prefix holds a `# fmt: on` comment, at an ENDMARKER, or when there are no
    siblings left.

    Stops at the end of the block.
    """
    current: Optional[LN] = container_of(leaf)
    while current is not None and current.type != token.ENDMARKER:
        prefix_comments = list_comments(current.prefix, is_endmarker=False)
        if any(comment.value in FMT_ON for comment in prefix_comments):
            return

        yield current

        current = current.next_sibling
def maybe_make_parens_invisible_in_atom(node: LN, parent: LN) -> bool:
    """If it's safe, make the parens in the atom `node` invisible, recursively.

    Nothing is touched for non-atoms, empty tuples, one-tuples, yields outside
    of an expression statement, and atoms whose contents hold a delimiter of
    at least COMMA_PRIORITY.

    Returns whether the node should itself be wrapped in invisible parentheses.
    """
    if node.type != syms.atom:
        return False

    if is_empty_tuple(node) or is_one_tuple(node):
        return False

    if is_yield(node) and parent.type != syms.expr_stmt:
        return False

    if max_delimiter_priority_in_atom(node) >= COMMA_PRIORITY:
        return False

    opener = node.children[0]
    closer = node.children[-1]
    if not (opener.type == token.LPAR and closer.type == token.RPAR):
        return True

    # make parentheses invisible
    opener.value = ""  # type: ignore
    closer.value = ""  # type: ignore
    if len(node.children) > 1:
        # Continue with whatever sits right after the opening parenthesis.
        maybe_make_parens_invisible_in_atom(node.children[1], parent=parent)
    return False
def is_empty_tuple(node: LN) -> bool:
    """Return True if `node` holds an empty tuple.

    That is an atom made of exactly an opening and a closing parenthesis.
    """
    if node.type != syms.atom or len(node.children) != 2:
        return False

    opener, closer = node.children
    return opener.type == token.LPAR and closer.type == token.RPAR
def is_one_tuple(node: LN) -> bool:
    """Return True if `node` holds a tuple with one element, with or without parens."""
    if node.type != syms.atom:
        # Without parentheses: an implicit tuple of an element and a comma.
        return (
            node.type in IMPLICIT_TUPLE
            and len(node.children) == 2
            and node.children[1].type == token.COMMA
        )

    if len(node.children) != 3:
        return False

    lpar, gexp, rpar = node.children
    is_parenthesized_testlist = (
        lpar.type == token.LPAR
        and gexp.type == syms.testlist_gexp
        and rpar.type == token.RPAR
    )
    if not is_parenthesized_testlist:
        return False

    return len(gexp.children) == 2 and gexp.children[1].type == token.COMMA
def is_yield(node: LN) -> bool:
    """Return True if `node` holds a `yield` or `yield from` expression.

    Atoms that wrap a single item in parentheses are unwrapped first.
    """
    current = node
    while True:
        if current.type == syms.yield_expr:
            return True

        if current.type == token.NAME and current.value == "yield":  # type: ignore
            return True

        if current.type != syms.atom or len(current.children) != 3:
            return False

        lpar, inner, rpar = current.children
        if not (lpar.type == token.LPAR and rpar.type == token.RPAR):
            return False

        # Look inside the parentheses.
        current = inner
def is_vararg(leaf: Leaf, within: Set[NodeType]) -> bool:
    """Return True if `leaf` is a star or double star in a vararg or kwarg.

    If `within` includes VARARGS_PARENTS, this applies to function signatures.
    If `within` includes UNPACKING_PARENTS, it applies to right hand-side
    extended iterable unpacking (PEP 3132) and additional unpacking
    generalizations (PEP 448).
    """
    owner = leaf.parent
    if leaf.type not in STARS or not owner:
        return False

    if owner.type == syms.star_expr:
        # Star expressions are also used as assignment targets in extended
        # iterable unpacking (PEP 3132). See what its parent is instead.
        owner = owner.parent
        if not owner:
            return False

    return owner.type in within
def is_multiline_string(leaf: Leaf) -> bool:
    """Return True if `leaf` is a multiline string that actually spans many lines.

    The value has to open with triple quotes (after any string prefix) and
    contain at least one newline.
    """
    unprefixed = leaf.value.lstrip("furbFURB")
    if not unprefixed.startswith(('"""', "'''")):
        return False

    return "\n" in unprefixed
def is_stub_suite(node: Node) -> bool:
    """Return True if `node` is a suite with a stub body.

    The suite must consist of exactly NEWLINE, INDENT, a stub body and DEDENT.
    """
    if len(node.children) != 4:
        return False

    newline, indent, body, dedent = node.children
    if (
        newline.type != token.NEWLINE
        or indent.type != token.INDENT
        or dedent.type != token.DEDENT
    ):
        return False

    return is_stub_body(body)
def is_stub_body(node: LN) -> bool:
    """Return True if `node` is a simple statement containing an ellipsis.

    The ellipsis is recognized as an atom made of exactly three `.` leaves.
    """
    if not isinstance(node, Node):
        return False

    if node.type != syms.simple_stmt or len(node.children) != 2:
        return False

    candidate = node.children[0]
    if candidate.type != syms.atom or len(candidate.children) != 3:
        return False

    dot = Leaf(token.DOT, ".")
    return all(part == dot for part in candidate.children)
def max_delimiter_priority_in_atom(node: LN) -> int:
    """Return maximum delimiter priority inside `node`.

    This is specific to atoms with contents contained in a pair of parentheses.
    If `node` isn't an atom or there are no enclosing parentheses, returns 0.
    Also returns 0 when the bracket tracker raises ValueError while computing
    the maximum.
    """
    if node.type != syms.atom:
        return 0

    opener, closer = node.children[0], node.children[-1]
    if first_or_last_is_not_paren := not (
        opener.type == token.LPAR and closer.type == token.RPAR
    ):
        return 0

    tracker = BracketTracker()
    for child in node.children[1:-1]:
        inner_leaves = [child] if isinstance(child, Leaf) else child.leaves()
        for inner_leaf in inner_leaves:
            tracker.mark(inner_leaf)
    try:
        return tracker.max_delimiter_priority()

    except ValueError:
        return 0
def ensure_visible(leaf: Leaf) -> None:
    """Make sure parentheses are visible.

    They could be invisible as part of some statements (see
    :func:`normalize_invisible_parens` and :func:`visit_import_from`).
    Leaves that are not parentheses are left alone.

    Note: Mutates its argument.
    """
    visible_text = {token.LPAR: "(", token.RPAR: ")"}.get(leaf.type)
    if visible_text is not None:
        leaf.value = visible_text
def should_explode(line: Line, opening_bracket: Leaf) -> bool:
    """Should `line` immediately be split with `delimiter_split()` after RHS?

    Only considered for brackets that belong to an atom or an `import from`
    statement.  The answer is yes when the highest delimiter priority in
    `line`, not counting a trailing comma, is COMMA_PRIORITY.
    """
    bracket_owner = opening_bracket.parent
    if not bracket_owner:
        return False

    if bracket_owner.type not in {syms.atom, syms.import_from}:
        return False

    if opening_bracket.value not in "[{(":
        return False

    try:
        trailing_leaf = line.leaves[-1]
        if trailing_leaf.type == token.COMMA:
            exclude = {id(trailing_leaf)}
        else:
            exclude = set()
        max_priority = line.bracket_tracker.max_delimiter_priority(exclude=exclude)
    except (IndexError, ValueError):
        # An empty line or a line without delimiters.
        return False

    return max_priority == COMMA_PRIORITY
def get_features_used(node: Node) -> Set[Feature]:
    """Return a set of (relatively) new Python features used in this file.

    Currently looking for:
    - f-strings;
    - underscores in numeric literals; and
    - trailing commas after * or ** in function signatures and calls.
    """
    features: Set[Feature] = set()
    for n in node.pre_order():
        if n.type == token.STRING:
            literal: str = n.value  # type: ignore
            # Everything before the opening quote is the string prefix.  Looking
            # at the whole prefix case-insensitively also catches mixed-case
            # spellings such as `Rf"..."` or `fR"..."`.
            prefix = literal[: len(literal) - len(literal.lstrip("furbFURB"))]
            if "f" in prefix.casefold():
                features.add(Feature.F_STRINGS)

        elif n.type == token.NUMBER:
            if "_" in n.value:  # type: ignore
                features.add(Feature.NUMERIC_UNDERSCORES)

        elif (
            n.type in {syms.typedargslist, syms.arglist}
            and n.children
            and n.children[-1].type == token.COMMA
        ):
            # An argument list that ends with a trailing comma.
            if n.type == syms.typedargslist:
                feature = Feature.TRAILING_COMMA_IN_DEF
            else:
                feature = Feature.TRAILING_COMMA_IN_CALL

            for ch in n.children:
                if ch.type in STARS:
                    features.add(feature)

                if ch.type == syms.argument:
                    # In calls the star may be nested inside an `argument` node.
                    for argch in ch.children:
                        if argch.type in STARS:
                            features.add(feature)

    return features
def detect_target_versions(node: Node) -> Set[TargetVersion]:
    """Detect the version to target based on the nodes used.

    A version qualifies when every feature found by `get_features_used()` is
    listed for it in VERSION_TO_FEATURES.
    """
    used_features = get_features_used(node)
    compatible: Set[TargetVersion] = set()
    for version in TargetVersion:
        if used_features <= VERSION_TO_FEATURES[version]:
            compatible.add(version)
    return compatible
def generate_trailers_to_omit(line: Line, line_length: int) -> Iterator[Set[LeafID]]:
    """Generate sets of closing bracket IDs that should be omitted in a RHS.

    Brackets can be omitted if the entire trailer up to and including
    a preceding closing bracket fits in one line.

    Yielded sets are cumulative (contain results of previous yields, too). First
    set is empty.  The very same set object is yielded every time.
    """
    omit: Set[LeafID] = set()
    yield omit

    used_width = 4 * line.depth
    opening_bracket = None
    closing_bracket = None
    inner_brackets: Set[LeafID] = set()
    # Leaves are visited from the end of the line towards its beginning.
    for index, leaf, leaf_length in enumerate_with_length(line, reversed=True):
        used_width += leaf_length
        if used_width > line_length:
            break

        has_inline_comment = leaf_length > len(leaf.value) + len(leaf.prefix)
        if leaf.type == STANDALONE_COMMENT or has_inline_comment:
            break

        if opening_bracket:
            # Still inside the bracket pair found last.
            if leaf is opening_bracket:
                opening_bracket = None
            elif leaf.type in CLOSING_BRACKETS:
                inner_brackets.add(id(leaf))
            continue

        if leaf.type not in CLOSING_BRACKETS:
            continue

        if index > 0 and line.leaves[index - 1].type in OPENING_BRACKETS:
            # Empty brackets would fail a split so treat them as "inner"
            # brackets (e.g. only add them to the `omit` set if another
            # pair of brackets was good enough.
            inner_brackets.add(id(leaf))
            continue

        if closing_bracket:
            omit.add(id(closing_bracket))
            omit.update(inner_brackets)
            inner_brackets.clear()
            yield omit

        if leaf.value:
            opening_bracket = leaf.opening_bracket
            closing_bracket = leaf
def get_future_imports(node: Node) -> Set[str]:
    """Return a set of __future__ imports in the file.

    Only the leading statements are inspected: a docstring is skipped,
    `from __future__ import ...` statements are collected, and anything else
    ends the search.
    """
    imports: Set[str] = set()

    def get_imports_from_children(children: List[LN]) -> Generator[str, None, None]:
        """Yield the original (pre-`as`) names imported by `children`."""
        for item in children:
            if isinstance(item, Leaf):
                if item.type == token.NAME:
                    yield item.value
            elif item.type == syms.import_as_name:
                orig_name = item.children[0]
                assert isinstance(orig_name, Leaf), "Invalid syntax parsing imports"
                assert orig_name.type == token.NAME, "Invalid syntax parsing imports"
                yield orig_name.value
            elif item.type == syms.import_as_names:
                yield from get_imports_from_children(item.children)
            else:
                raise AssertionError("Invalid syntax parsing imports")

    for statement in node.children:
        if statement.type != syms.simple_stmt:
            break

        head = statement.children[0]
        if isinstance(head, Leaf):
            # Continue looking if we see a docstring; otherwise stop.
            looks_like_docstring = (
                len(statement.children) == 2
                and head.type == token.STRING
                and statement.children[1].type == token.NEWLINE
            )
            if looks_like_docstring:
                continue

            break

        if head.type != syms.import_from:
            break

        module_name = head.children[1]
        if not isinstance(module_name, Leaf) or module_name.value != "__future__":
            break

        imports |= set(get_imports_from_children(head.children[3:]))
    return imports
def gen_python_files_in_dir(
    path: Path,
    root: Path,
    include: Pattern[str],
    exclude: Pattern[str],
    report: "Report",
) -> Iterator[Path]:
    """Generate all files under `path` whose paths are not excluded by the
    `exclude` regex, but are included by the `include` regex.

    Both regexes are searched in the child's POSIX path relative to `root`,
    with a leading slash (and a trailing one for directories).

    Symbolic links pointing outside of the `root` directory are ignored.

    `report` is where output about exclusions goes.
    """
    assert root.is_absolute(), f"INTERNAL ERROR: `root` must be absolute but is {root}"
    for entry in path.iterdir():
        try:
            normalized_path = "/" + entry.resolve().relative_to(root).as_posix()
        except ValueError:
            # `entry` resolved to something that is not below `root`.
            if not entry.is_symlink():
                raise

            report.path_ignored(
                entry, f"is a symbolic link that points outside {root}"
            )
            continue

        if entry.is_dir():
            normalized_path += "/"
        excluded = exclude.search(normalized_path)
        # An empty match doesn't count as an exclusion.
        if excluded and excluded.group(0):
            report.path_ignored(entry, f"matches the --exclude regular expression")
            continue

        if entry.is_dir():
            yield from gen_python_files_in_dir(entry, root, include, exclude, report)

        elif entry.is_file():
            if include.search(normalized_path):
                yield entry
def find_project_root(srcs: Iterable[str]) -> Path:
    """Return a directory containing .git, .hg, or pyproject.toml.

    That directory can be one of the directories passed in `srcs` or their
    common parent.

    If no directory in the tree contains a marker that would specify it's the
    project root, the root of the file system is returned.  The same happens
    when `srcs` is empty or the sources have no directory in common.
    """
    resolved = [Path(src).resolve() for src in srcs]
    if not resolved:
        return Path("/").resolve()

    # For every source, collect the directories that contain it.  A directory
    # counts as containing itself.  Picking `min()` of the paths, as this used
    # to do, only yields *a* source, not an ancestor shared by all of them.
    ancestor_sets = [
        set(path.parents) | ({path} if path.is_dir() else set()) for path in resolved
    ]
    shared = set.intersection(*ancestor_sets)
    if not shared:
        return Path("/").resolve()

    # All shared ancestors lie on one chain; the deepest is the common base.
    common_base = max(shared, key=lambda candidate: len(candidate.parts))
    directory = common_base
    for directory in (common_base, *common_base.parents):
        if (directory / ".git").is_dir():
            return directory

        if (directory / ".hg").is_dir():
            return directory

        if (directory / "pyproject.toml").is_file():
            return directory

    # No marker anywhere: `directory` is the last parent visited.
    return directory
@dataclass
class Report:
    """Provides a reformatting counter. Can be rendered with `str(report)`."""

    # Output options.
    check: bool = False
    quiet: bool = False
    verbose: bool = False
    # Running totals, updated by `done()` and `failed()`.
    change_count: int = 0
    same_count: int = 0
    failure_count: int = 0

    def done(self, src: Path, changed: Changed) -> None:
        """Increment the counter for successful reformatting. Write out a message."""
        if changed is not Changed.YES:
            # Unchanged files are only mentioned in verbose mode.
            if self.verbose:
                if changed is Changed.NO:
                    msg = f"{src} already well formatted, good job."
                else:
                    msg = f"{src} wasn't modified on disk since last run."
                out(msg, bold=False)
            self.same_count += 1
            return

        reformatted = "would reformat" if self.check else "reformatted"
        if self.verbose or not self.quiet:
            out(f"{reformatted} {src}")
        self.change_count += 1

    def failed(self, src: Path, message: str) -> None:
        """Increment the counter for failed reformatting. Write out a message."""
        err(f"error: cannot format {src}: {message}")
        self.failure_count += 1

    def path_ignored(self, path: Path, message: str) -> None:
        """Write out why `path` was ignored, but only in verbose mode."""
        if self.verbose:
            out(f"{path} ignored: {message}", bold=False)

    @property
    def return_code(self) -> int:
        """Return the exit code that the app should use.

        This considers the current state of changed files and failures:
        - if there were any failures, return 123;
        - if any files were changed and --check is being used, return 1;
        - otherwise return 0.
        """
        # According to http://tldp.org/LDP/abs/html/exitcodes.html starting with
        # 126 we have special return codes reserved by the shell.
        if self.failure_count:
            return 123

        if self.change_count and self.check:
            return 1

        return 0

    def __str__(self) -> str:
        """Render a color report of the current state.

        Use `click.unstyle` to remove colors.
        """
        if self.check:
            reformatted, unchanged, failed = (
                "would be reformatted",
                "would be left unchanged",
                "would fail to reformat",
            )
        else:
            reformatted, unchanged, failed = (
                "reformatted",
                "left unchanged",
                "failed to reformat",
            )
        parts = []
        if self.change_count:
            s = "s" if self.change_count > 1 else ""
            changed_text = f"{self.change_count} file{s} {reformatted}"
            parts.append(click.style(changed_text, bold=True))
        if self.same_count:
            s = "s" if self.same_count > 1 else ""
            parts.append(f"{self.same_count} file{s} {unchanged}")
        if self.failure_count:
            s = "s" if self.failure_count > 1 else ""
            failed_text = f"{self.failure_count} file{s} {failed}"
            parts.append(click.style(failed_text, fg="red"))
        return ", ".join(parts) + "."
def assert_equivalent(src: str, dst: str) -> None:
    """Raise AssertionError if `src` and `dst` aren't equivalent.

    Both strings are parsed with the builtin `ast` module and their trees are
    compared through a textual rendering.  On a mismatch, a diff of the two
    renderings is dumped to a temporary file named in the error message.
    """
    import ast
    import traceback

    def _v(node: ast.AST, depth: int = 0) -> Iterator[str]:
        """Simple visitor generating strings to compare ASTs by content."""
        yield f"{' ' * depth}{node.__class__.__name__}("

        for field in sorted(node._fields):
            try:
                value = getattr(node, field)
            except AttributeError:
                continue

            yield f"{' ' * (depth+1)}{field}="

            if isinstance(value, list):
                for item in value:
                    # Ignore nested tuples within del statements, because we may insert
                    # parentheses and they change the AST.
                    is_del_target_tuple = (
                        field == "targets"
                        and isinstance(node, ast.Delete)
                        and isinstance(item, ast.Tuple)
                    )
                    if is_del_target_tuple:
                        for element in item.elts:
                            yield from _v(element, depth + 2)
                    elif isinstance(item, ast.AST):
                        yield from _v(item, depth + 2)

            elif isinstance(value, ast.AST):
                yield from _v(value, depth + 2)

            else:
                yield f"{' ' * (depth+2)}{value!r}, # {value.__class__.__name__}"

        yield f"{' ' * depth}) # /{node.__class__.__name__}"

    try:
        src_ast = ast.parse(src)
    except Exception as exc:
        major, minor = sys.version_info[:2]
        raise AssertionError(
            f"cannot use --safe with this file; failed to parse source file "
            f"with Python {major}.{minor}'s builtin AST. Re-run with --fast "
            f"or stop using deprecated Python 2 syntax. AST error message: {exc}"
        )

    try:
        dst_ast = ast.parse(dst)
    except Exception as exc:
        # Keep the traceback and the offending output around for the bug report.
        log = dump_to_file("".join(traceback.format_tb(exc.__traceback__)), dst)
        raise AssertionError(
            f"INTERNAL ERROR: Black produced invalid code: {exc}. "
            f"Please report a bug on https://github.com/python/black/issues. "
            f"This invalid output might be helpful: {log}"
        ) from None

    src_rendering = "\n".join(_v(src_ast))
    dst_rendering = "\n".join(_v(dst_ast))
    if src_rendering == dst_rendering:
        return

    log = dump_to_file(diff(src_rendering, dst_rendering, "src", "dst"))
    raise AssertionError(
        f"INTERNAL ERROR: Black produced code that is not equivalent to "
        f"the source. "
        f"Please report a bug on https://github.com/python/black/issues. "
        f"This diff might be helpful: {log}"
    ) from None
def assert_stable(src: str, dst: str, mode: FileMode) -> None:
    """Raise AssertionError if `dst` reformats differently the second time.

    On failure, the diffs source -> first pass and first pass -> second pass
    are dumped to a temporary file named in the error message.
    """
    second_pass = format_str(dst, mode=mode)
    if second_pass == dst:
        return

    log = dump_to_file(
        diff(src, dst, "source", "first pass"),
        diff(dst, second_pass, "first pass", "second pass"),
    )
    raise AssertionError(
        f"INTERNAL ERROR: Black produced different code on the second pass "
        f"of the formatter. "
        f"Please report a bug on https://github.com/python/black/issues. "
        f"This diff might be helpful: {log}"
    ) from None
def dump_to_file(*output: str) -> str:
    """Dump `output` to a temporary file. Return path to the file.

    Every non-empty chunk that doesn't end with a newline gets one appended.
    The file is named `blk_*.log` and is not deleted automatically.
    """
    import tempfile

    log_file = tempfile.NamedTemporaryFile(
        mode="w", prefix="blk_", suffix=".log", delete=False, encoding="utf8"
    )
    with log_file as f:
        for chunk in output:
            f.write(chunk)
            if chunk and not chunk.endswith("\n"):
                f.write("\n")
    return f.name
def diff(a: str, b: str, a_name: str, b_name: str) -> str:
    """Return a unified diff string between strings `a` and `b`.

    `a_name` and `b_name` label the two sides in the diff header.  Five lines
    of context are used.
    """
    import difflib

    def as_lines(text: str) -> list:
        """Split `text` on newlines, terminating every piece with a newline."""
        return [f"{piece}\n" for piece in text.split("\n")]

    delta = difflib.unified_diff(
        as_lines(a), as_lines(b), fromfile=a_name, tofile=b_name, n=5
    )
    return "".join(delta)
def cancel(tasks: Iterable[asyncio.Task]) -> None:
    """asyncio signal handler that cancels all `tasks` and reports to stderr."""
    err("Aborted!")
    for pending_task in tasks:
        pending_task.cancel()
def shutdown(loop: BaseEventLoop) -> None:
    """Cancel all pending tasks on `loop`, wait for them, and close the loop.

    The loop is closed even if waiting for the cancelled tasks raises.  As a
    side effect the `concurrent.futures` logger is set to CRITICAL.
    """
    try:
        if sys.version_info[:2] >= (3, 7):
            all_tasks = asyncio.all_tasks
        else:
            all_tasks = asyncio.Task.all_tasks
        # This part is borrowed from asyncio/runners.py in Python 3.7b2.
        to_cancel = [task for task in all_tasks(loop) if not task.done()]
        if not to_cancel:
            return

        for task in to_cancel:
            task.cancel()
        # Don't pass `loop=` to gather(): the keyword was removed in Python 3.10
        # and gather() takes the loop from the tasks themselves anyway.
        loop.run_until_complete(asyncio.gather(*to_cancel, return_exceptions=True))
    finally:
        # `concurrent.futures.Future` objects cannot be cancelled once they
        # are already running. There might be some when the `shutdown()` happened.
        # Silence their logger's spew about the event loop being closed.
        cf_logger = logging.getLogger("concurrent.futures")
        cf_logger.setLevel(logging.CRITICAL)
        loop.close()
def sub_twice(regex: Pattern[str], replacement: str, original: str) -> str:
    """Replace `regex` with `replacement` twice on `original`.

    This is used by string normalization to perform replaces on
    overlapping matches.
    """
    first_pass = regex.sub(replacement, original)
    second_pass = regex.sub(replacement, first_pass)
    return second_pass
def re_compile_maybe_verbose(regex: str) -> Pattern[str]:
    """Compile a regular expression string in `regex`.

    If it contains newlines, use verbose mode.
    """
    is_multiline = "\n" in regex
    source = "(?x)" + regex if is_multiline else regex
    return re.compile(source)
def enumerate_reversed(sequence: Sequence[T]) -> Iterator[Tuple[Index, T]]:
    """Like `reversed(enumerate(sequence))` if that were possible.

    Yields `(index, element)` pairs from the last element to the first, with
    the indexes the elements have in `sequence`.
    """
    descending_indexes = range(len(sequence) - 1, -1, -1)
    for index, element in zip(descending_indexes, reversed(sequence)):
        yield (index, element)
def enumerate_with_length(
    line: Line, reversed: bool = False
) -> Iterator[Tuple[Index, Leaf, int]]:
    """Return an enumeration of leaves with their length.

    The length of a leaf covers its prefix, its value, and the values of the
    comments attached to it.  With `reversed`, leaves are enumerated from the
    end of the line.

    Stops prematurely on multiline strings and standalone comments.
    """
    walk = cast(
        Callable[[Sequence[Leaf]], Iterator[Tuple[Index, Leaf]]],
        enumerate_reversed if reversed else enumerate,
    )
    for index, leaf in walk(line.leaves):
        if "\n" in leaf.value:
            return  # Multiline strings, we can't continue.

        own_length = len(leaf.prefix) + len(leaf.value)
        comments_length = sum(
            len(comment.value) for comment in line.comments_after(leaf)
        )

        yield index, leaf, own_length + comments_length
def is_line_short_enough(line: Line, *, line_length: int, line_str: str = "") -> bool:
    """Return True if `line` is no longer than `line_length`.

    Lines that render with an embedded newline or contain standalone comments
    never qualify.

    Uses the provided `line_str` rendering, if any, otherwise computes a new one.
    """
    rendered = line_str or str(line).strip("\n")
    if len(rendered) > line_length:
        return False

    if "\n" in rendered:  # multiline strings
        return False

    return not line.contains_standalone_comments()
def can_be_split(line: Line) -> bool:
    """Return False if the line cannot be split *for sure*.

    This is not an exhaustive search but a cheap heuristic that we can use to
    avoid some unfortunate formattings (mostly around wrapping unsplittable code
    in unnecessary parentheses).
    """
    leaves = line.leaves
    if len(leaves) < 2:
        return False

    starts_with_string_attribute = (
        leaves[0].type == token.STRING and leaves[1].type == token.DOT
    )
    if not starts_with_string_attribute:
        return True

    call_count = 0
    dot_count = 0
    # NOTE(review): every leaf below is compared against the *last* leaf of the
    # line; the reference is never advanced inside the loop.  Kept as is.
    reference = leaves[-1]
    for leaf in leaves[-2::-1]:
        if leaf.type in OPENING_BRACKETS:
            if reference.type not in CLOSING_BRACKETS:
                return False

            call_count += 1
        elif leaf.type == token.DOT:
            dot_count += 1
        elif leaf.type == token.NAME:
            if not (
                reference.type == token.DOT or reference.type in OPENING_BRACKETS
            ):
                return False

        elif leaf.type not in CLOSING_BRACKETS:
            return False

        if dot_count > 1 and call_count > 1:
            return False

    return True
def can_omit_invisible_parens(line: Line, line_length: int) -> bool:
    """Does `line` have a shape safe to reformat without optional parens around it?

    Returns True for only a subset of potentially nice looking formattings but
    the point is to not return false positives that end up producing lines that
    are too long.
    """
    tracker = line.bracket_tracker
    if not tracker.delimiters:
        # Without delimiters the optional parentheses are useless.
        return True

    max_priority = tracker.max_delimiter_priority()
    if tracker.delimiter_count_with_priority(max_priority) > 1:
        # With more than one delimiter of a kind the optional parentheses read better.
        return False

    if max_priority == DOT_PRIORITY:
        # A single stranded method call doesn't require optional parentheses.
        return True

    assert len(line.leaves) >= 2, "Stranded delimiter"

    first, second = line.leaves[0], line.leaves[1]
    penultimate, last = line.leaves[-2], line.leaves[-1]

    # With a single delimiter, omit if the expression starts or ends with
    # a bracket.
    if first.type in OPENING_BRACKETS and second.type not in CLOSING_BRACKETS:
        # Only what follows the bracket pair opened by `first` is measured.
        measuring = False
        width = 4 * line.depth
        for _index, leaf, leaf_length in enumerate_with_length(line):
            if leaf.type in CLOSING_BRACKETS and leaf.opening_bracket is first:
                measuring = True
            if measuring:
                width += leaf_length
                if width > line_length:
                    break

                if leaf.type in OPENING_BRACKETS:
                    # There are brackets we can further split on.
                    measuring = False

        else:
            # checked the entire string and line length wasn't exceeded
            if len(line.leaves) == _index + 1:
                return True

        # Note: we are not returning False here because a line might have *both*
        # a leading opening bracket and a trailing closing bracket. If the
        # opening bracket doesn't match our rule, maybe the closing will.

    ends_with_usable_bracket = (
        last.type == token.RPAR
        or last.type == token.RBRACE
        or (
            # don't use indexing for omitting optional parentheses;
            # it looks weird
            last.type == token.RSQB
            and last.parent
            and last.parent.type != syms.trailer
        )
    )
    if not ends_with_usable_bracket:
        return False

    if penultimate.type in OPENING_BRACKETS:
        # Empty brackets don't help.
        return False

    if is_multiline_string(first):
        # Additional wrapping of a multiline string in this situation is
        # unnecessary.
        return True

    width = 4 * line.depth
    seen_other_brackets = False
    for _index, leaf, leaf_length in enumerate_with_length(line):
        width += leaf_length
        if leaf is last.opening_bracket:
            if seen_other_brackets or width <= line_length:
                return True

        elif leaf.type in OPENING_BRACKETS:
            # There are brackets we can further split on.
            seen_other_brackets = True

    return False
def get_cache_file(mode: FileMode) -> Path:
    """Return the path of the cache file for `mode` inside CACHE_DIR.

    The file name embeds `mode.get_cache_key()`.
    """
    file_name = f"cache.{mode.get_cache_key()}.pickle"
    return CACHE_DIR / file_name
def read_cache(mode: FileMode) -> Cache:
    """Read the cache if it exists and is well formed.

    If it is not well formed, the call to write_cache later should resolve the issue.
    In that case, and when the cache file doesn't exist, an empty cache is
    returned.
    """
    cache_file = get_cache_file(mode)
    if not cache_file.exists():
        return {}

    # NOTE: the cache file lives in the user's own cache directory; unpickling
    # data from any other origin would not be safe.
    with cache_file.open("rb") as fobj:
        try:
            cache: Cache = pickle.load(fobj)
        except (
            pickle.UnpicklingError,
            AttributeError,
            EOFError,
            ImportError,
            IndexError,
            ValueError,
        ):
            # A truncated, empty or otherwise corrupt file doesn't necessarily
            # surface as UnpicklingError; all of these mean "not well formed".
            return {}

    return cache
def get_cache_info(path: Path) -> CacheInfo:
    """Return the (modification time, size) pair recorded in the cache for `path`.

    Both values are taken from a single `path.stat()` call.
    """
    file_stat = path.stat()
    modified = file_stat.st_mtime
    size = file_stat.st_size
    return modified, size
def filter_cached(cache: Cache, sources: Iterable[Path]) -> Tuple[Set[Path], Set[Path]]:
    """Partition the paths in `sources` by whether their cache entry is current.

    Every path is resolved first.  The first returned set holds the paths whose
    entry in `cache` is missing or differs from their current cache info; the
    second set holds the paths whose entry still matches.
    """
    stale, fresh = set(), set()
    for source in sources:
        resolved = source.resolve()
        if cache.get(resolved) == get_cache_info(resolved):
            fresh.add(resolved)
        else:
            stale.add(resolved)
    return stale, fresh
def write_cache(cache: Cache, sources: Iterable[Path], mode: FileMode) -> None:
    """Update the cache file.

    The entries of `cache` are merged with fresh cache info for every path in
    `sources` (keyed by the resolved path), pickled to a temporary file next to
    the cache file and then moved over the cache file for `mode` in one step.

    Writing the cache is best effort: an OSError is deliberately swallowed.  A
    temporary file that did not make it into place is removed again instead of
    being left behind in the cache directory.
    """
    cache_file = get_cache_file(mode)
    tmp_name = ""
    try:
        CACHE_DIR.mkdir(parents=True, exist_ok=True)
        new_cache = {**cache, **{src.resolve(): get_cache_info(src) for src in sources}}
        with tempfile.NamedTemporaryFile(dir=str(cache_file.parent), delete=False) as f:
            tmp_name = f.name
            pickle.dump(new_cache, f, protocol=pickle.HIGHEST_PROTOCOL)
        os.replace(tmp_name, cache_file)
        tmp_name = ""  # the temporary file now lives at `cache_file`
    except OSError:
        pass
    finally:
        # delete=False means nobody else cleans up after a failed dump/replace.
        if tmp_name:
            try:
                os.unlink(tmp_name)
            except OSError:
                pass
def patch_click() -> None:
    """Make Click not crash.

    On certain misconfigured environments, Python 3 selects the ASCII encoding as the
    default which restricts paths that it can access during the lifetime of the
    application.  Click refuses to work in this scenario by raising a RuntimeError.

    In case of Black the likelihood that non-ASCII characters are going to be used in
    file paths is minimal since it's Python source code.  Moreover, this crash was
    spurious on Python 3.7 thanks to PEP 538 and PEP 540.

    Each Click module is looked up on its own, so a Click release that lacks one
    of them (or no Click at all) only means there is less to patch.
    """
    from importlib import import_module

    for submodule in ("core", "_unicodefun"):
        try:
            module = import_module(f"click.{submodule}")
        except ImportError:
            # Covers ModuleNotFoundError as well.  A missing private module must
            # neither crash Black nor prevent patching the other module.
            continue

        if hasattr(module, "_verify_python3_env"):
            module._verify_python3_env = lambda: None  # type: ignore
3797 def patched_main() -> None:
3803 if __name__ == "__main__":