black.py

   1 import asyncio
   2 from asyncio.base_events import BaseEventLoop
   3 from concurrent.futures import Executor, ProcessPoolExecutor
   4 from datetime import datetime
   5 from enum import Enum, Flag
   6 from functools import lru_cache, partial, wraps
   7 import io
   8 import keyword
   9 import logging
  10 from multiprocessing import Manager
  11 import os
  12 from pathlib import Path
  13 import pickle
  14 import re
  15 import signal
  16 import sys
  17 import tokenize
  18 from typing import (
  19     Any,
  20     Callable,
  21     Collection,
  22     Dict,
  23     Generator,
  24     Generic,
  25     Iterable,
  26     Iterator,
  27     List,
  28     Optional,
  29     Pattern,
  30     Sequence,
  31     Set,
  32     Tuple,
  33     TypeVar,
  34     Union,
  35     cast,
  36 )
  37
  38 from appdirs import user_cache_dir
  39 from attr import dataclass, Factory
  40 import click
  41 import toml
  42
  43 # lib2to3 fork
  44 from blib2to3.pytree import Node, Leaf, type_repr
  45 from blib2to3 import pygram, pytree
  46 from blib2to3.pgen2 import driver, token
  47 from blib2to3.pgen2.parse import ParseError
  48
  49
# Release identifier.  It is also passed to user_cache_dir() below, so the
# cache directory is specific to this version.
__version__ = "18.6b4"
# Default for the --line-length option.
DEFAULT_LINE_LENGTH = 88
# Default for the --exclude option (a regular expression).
DEFAULT_EXCLUDES = (
    r"/(\.git|\.hg|\.mypy_cache|\.tox|\.venv|_build|buck-out|build|dist)/"
)
# Default for the --include option (a regular expression).
DEFAULT_INCLUDES = r"\.pyi?$"
CACHE_DIR = Path(user_cache_dir("black", version=__version__))


# types
FileContent = str
Encoding = str
NewLine = str
Depth = int
NodeType = int
LeafID = int
Priority = int
Index = int
LN = Union[Leaf, Node]
SplitFunc = Callable[["Line", bool], Iterator["Line"]]
Timestamp = float
FileSize = int
CacheInfo = Tuple[Timestamp, FileSize]
Cache = Dict[Path, CacheInfo]
# Message helpers that write to stderr: `out` prints bold text, `err` prints
# red text.
out = partial(click.secho, bold=True, err=True)
err = partial(click.secho, fg="red", err=True)

# Import-time side effect: set up the blib2to3 grammars, handing them the
# cache directory.  NOTE(review): presumably grammar tables are cached there
# -- confirm in blib2to3.pygram.
pygram.initialize(CACHE_DIR)
syms = pygram.python_symbols
  79
  80
class NothingChanged(UserWarning):
    """Raised when reformatted code is the same as source.

    Raised by :func:`format_file_contents`, which also raises it for input
    that is empty or contains only whitespace.
    """
  83
  84
class CannotSplit(Exception):
    """A readable split that fits the allotted line length is impossible.

    Raised by :func:`left_hand_split`, :func:`right_hand_split`, and
    :func:`delimiter_split`.

    NOTE(review): callers presumably catch this in order to try another
    split strategy -- confirm against :func:`split_line`.
    """
  91
  92
  93 class WriteBack(Enum):
  94     NO = 0
  95     YES = 1
  96     DIFF = 2
  97     CHECK = 3
  98
  99     @classmethod
 100     def from_configuration(cls, *, check: bool, diff: bool) -> "WriteBack":
 101         if check and not diff:
 102             return cls.CHECK
 103
 104         return cls.DIFF if diff else cls.YES
 105
 106
class Changed(Enum):
    """Outcome of processing one source, as passed to `Report.done()`."""

    NO = 0  # formatting ran and reported no change
    CACHED = 1  # skipped: the cache entry matched the file's current cache info
    YES = 2  # formatting ran and reported a change
 111
 112
 113 class FileMode(Flag):
 114     AUTO_DETECT = 0
 115     PYTHON36 = 1
 116     PYI = 2
 117     NO_STRING_NORMALIZATION = 4
 118
 119     @classmethod
 120     def from_configuration(
 121         cls, *, py36: bool, pyi: bool, skip_string_normalization: bool
 122     ) -> "FileMode":
 123         mode = cls.AUTO_DETECT
 124         if py36:
 125             mode |= cls.PYTHON36
 126         if pyi:
 127             mode |= cls.PYI
 128         if skip_string_normalization:
 129             mode |= cls.NO_STRING_NORMALIZATION
 130         return mode
 131
 132
 133 def read_pyproject_toml(
 134     ctx: click.Context, param: click.Parameter, value: Union[str, int, bool, None]
 135 ) -> Optional[str]:
 136     """Inject Black configuration from "pyproject.toml" into defaults in `ctx`.
 137
 138     Returns the path to a successfully found and read configuration file, None
 139     otherwise.
 140     """
 141     assert not isinstance(value, (int, bool)), "Invalid parameter type passed"
 142     if not value:
 143         root = find_project_root(ctx.params.get("src", ()))
 144         path = root / "pyproject.toml"
 145         if path.is_file():
 146             value = str(path)
 147         else:
 148             return None
 149
 150     try:
 151         pyproject_toml = toml.load(value)
 152         config = pyproject_toml.get("tool", {}).get("black", {})
 153     except (toml.TomlDecodeError, OSError) as e:
 154         raise click.BadOptionUsage(f"Error reading configuration file: {e}", ctx)
 155
 156     if not config:
 157         return None
 158
 159     if ctx.default_map is None:
 160         ctx.default_map = {}
 161     ctx.default_map.update(  # type: ignore  # bad types in .pyi
 162         {k.replace("--", "").replace("-", "_"): v for k, v in config.items()}
 163     )
 164     return value
 165
 166
# Command line entry point.  The function docstring below doubles as the
# help text click shows for the command, so documentation lives in comments.
@click.command(context_settings=dict(help_option_names=["-h", "--help"]))
@click.option(
    "-l",
    "--line-length",
    type=int,
    default=DEFAULT_LINE_LENGTH,
    help="How many character per line to allow.",
    show_default=True,
)
@click.option(
    "--py36",
    is_flag=True,
    help=(
        "Allow using Python 3.6-only syntax on all input files.  This will put "
        "trailing commas in function signatures and calls also after *args and "
        "**kwargs.  [default: per-file auto-detection]"
    ),
)
@click.option(
    "--pyi",
    is_flag=True,
    help=(
        "Format all input files like typing stubs regardless of file extension "
        "(useful when piping source on standard input)."
    ),
)
@click.option(
    "-S",
    "--skip-string-normalization",
    is_flag=True,
    help="Don't normalize string quotes or prefixes.",
)
@click.option(
    "--check",
    is_flag=True,
    help=(
        "Don't write the files back, just return the status.  Return code 0 "
        "means nothing would change.  Return code 1 means some files would be "
        "reformatted.  Return code 123 means there was an internal error."
    ),
)
@click.option(
    "--diff",
    is_flag=True,
    help="Don't write the files back, just output a diff for each file on stdout.",
)
@click.option(
    "--fast/--safe",
    is_flag=True,
    help="If --fast given, skip temporary sanity checks. [default: --safe]",
)
@click.option(
    "--include",
    type=str,
    default=DEFAULT_INCLUDES,
    help=(
        "A regular expression that matches files and directories that should be "
        "included on recursive searches.  An empty value means all files are "
        "included regardless of the name.  Use forward slashes for directories on "
        "all platforms (Windows, too).  Exclusions are calculated first, inclusions "
        "later."
    ),
    show_default=True,
)
@click.option(
    "--exclude",
    type=str,
    default=DEFAULT_EXCLUDES,
    help=(
        "A regular expression that matches files and directories that should be "
        "excluded on recursive searches.  An empty value means no paths are excluded. "
        "Use forward slashes for directories on all platforms (Windows, too).  "
        "Exclusions are calculated first, inclusions later."
    ),
    show_default=True,
)
@click.option(
    "-q",
    "--quiet",
    is_flag=True,
    help=(
        "Don't emit non-error messages to stderr. Errors are still emitted, "
        "silence those with 2>/dev/null."
    ),
)
@click.option(
    "-v",
    "--verbose",
    is_flag=True,
    help=(
        "Also emit messages to stderr about files that were not changed or were "
        "ignored due to --exclude=."
    ),
)
@click.version_option(version=__version__)
# "src" is eager, like --config below: the --config callback
# (read_pyproject_toml) reads ctx.params["src"] to locate the project root.
@click.argument(
    "src",
    nargs=-1,
    type=click.Path(
        exists=True, file_okay=True, dir_okay=True, readable=True, allow_dash=True
    ),
    is_eager=True,
)
@click.option(
    "--config",
    type=click.Path(
        exists=False, file_okay=True, dir_okay=False, readable=True, allow_dash=False
    ),
    is_eager=True,
    callback=read_pyproject_toml,
    help="Read configuration from PATH.",
)
@click.pass_context
def main(
    ctx: click.Context,
    line_length: int,
    check: bool,
    diff: bool,
    fast: bool,
    pyi: bool,
    py36: bool,
    skip_string_normalization: bool,
    quiet: bool,
    verbose: bool,
    include: str,
    exclude: str,
    src: Tuple[str],
    config: Optional[str],
) -> None:
    """The uncompromising code formatter."""
    # Translate the boolean switches into the enums used by the formatting
    # functions.
    write_back = WriteBack.from_configuration(check=check, diff=diff)
    mode = FileMode.from_configuration(
        py36=py36, pyi=pyi, skip_string_normalization=skip_string_normalization
    )
    # `config` is whatever the --config callback returned: the path of the
    # configuration file that was applied, or None.
    if config and verbose:
        out(f"Using configuration from {config}.", bold=False, fg="blue")
    # An invalid --include / --exclude pattern ends the run with status 2.
    try:
        include_regex = re_compile_maybe_verbose(include)
    except re.error:
        err(f"Invalid regular expression for include given: {include!r}")
        ctx.exit(2)
    try:
        exclude_regex = re_compile_maybe_verbose(exclude)
    except re.error:
        err(f"Invalid regular expression for exclude given: {exclude!r}")
        ctx.exit(2)
    report = Report(check=check, quiet=quiet, verbose=verbose)
    root = find_project_root(src)
    # Collect the set of paths to format: directories are expanded through
    # gen_python_files_in_dir(), files and "-" are taken as given.
    sources: Set[Path] = set()
    for s in src:
        p = Path(s)
        if p.is_dir():
            sources.update(
                gen_python_files_in_dir(p, root, include_regex, exclude_regex, report)
            )
        elif p.is_file() or s == "-":
            # if a file was explicitly given, we don't care about its extension
            sources.add(p)
        else:
            # Reported, but the remaining paths are still processed.
            err(f"invalid path: {s}")
    if len(sources) == 0:
        if verbose or not quiet:
            out("No paths given. Nothing to do 😴")
        ctx.exit(0)

    if len(sources) == 1:
        # A single source is formatted in this process.
        reformat_one(
            src=sources.pop(),
            line_length=line_length,
            fast=fast,
            write_back=write_back,
            mode=mode,
            report=report,
        )
    else:
        # Several sources are handed to a process pool, driven by the asyncio
        # event loop.
        loop = asyncio.get_event_loop()
        executor = ProcessPoolExecutor(max_workers=os.cpu_count())
        try:
            loop.run_until_complete(
                schedule_formatting(
                    sources=sources,
                    line_length=line_length,
                    fast=fast,
                    write_back=write_back,
                    mode=mode,
                    report=report,
                    loop=loop,
                    executor=executor,
                )
            )
        finally:
            # NOTE(review): shutdown() is defined outside this part of the
            # file; presumably it cancels leftover tasks and closes the loop.
            shutdown(loop)
    if verbose or not quiet:
        bang = "💥 💔 💥" if report.return_code else "✨ 🍰 ✨"
        out(f"All done! {bang}")
        click.secho(str(report), err=True)
    # The process exit status comes from the report.
    ctx.exit(report.return_code)
 364
 365
 366 def reformat_one(
 367     src: Path,
 368     line_length: int,
 369     fast: bool,
 370     write_back: WriteBack,
 371     mode: FileMode,
 372     report: "Report",
 373 ) -> None:
 374     """Reformat a single file under `src` without spawning child processes.
 375
 376     If `quiet` is True, non-error messages are not output. `line_length`,
 377     `write_back`, `fast` and `pyi` options are passed to
 378     :func:`format_file_in_place` or :func:`format_stdin_to_stdout`.
 379     """
 380     try:
 381         changed = Changed.NO
 382         if not src.is_file() and str(src) == "-":
 383             if format_stdin_to_stdout(
 384                 line_length=line_length, fast=fast, write_back=write_back, mode=mode
 385             ):
 386                 changed = Changed.YES
 387         else:
 388             cache: Cache = {}
 389             if write_back != WriteBack.DIFF:
 390                 cache = read_cache(line_length, mode)
 391                 res_src = src.resolve()
 392                 if res_src in cache and cache[res_src] == get_cache_info(res_src):
 393                     changed = Changed.CACHED
 394             if changed is not Changed.CACHED and format_file_in_place(
 395                 src,
 396                 line_length=line_length,
 397                 fast=fast,
 398                 write_back=write_back,
 399                 mode=mode,
 400             ):
 401                 changed = Changed.YES
 402             if (write_back is WriteBack.YES and changed is not Changed.CACHED) or (
 403                 write_back is WriteBack.CHECK and changed is Changed.NO
 404             ):
 405                 write_cache(cache, [src], line_length, mode)
 406         report.done(src, changed)
 407     except Exception as exc:
 408         report.failed(src, str(exc))
 409
 410
 411 async def schedule_formatting(
 412     sources: Set[Path],
 413     line_length: int,
 414     fast: bool,
 415     write_back: WriteBack,
 416     mode: FileMode,
 417     report: "Report",
 418     loop: BaseEventLoop,
 419     executor: Executor,
 420 ) -> None:
 421     """Run formatting of `sources` in parallel using the provided `executor`.
 422
 423     (Use ProcessPoolExecutors for actual parallelism.)
 424
 425     `line_length`, `write_back`, `fast`, and `pyi` options are passed to
 426     :func:`format_file_in_place`.
 427     """
 428     cache: Cache = {}
 429     if write_back != WriteBack.DIFF:
 430         cache = read_cache(line_length, mode)
 431         sources, cached = filter_cached(cache, sources)
 432         for src in sorted(cached):
 433             report.done(src, Changed.CACHED)
 434     if not sources:
 435         return
 436
 437     cancelled = []
 438     sources_to_cache = []
 439     lock = None
 440     if write_back == WriteBack.DIFF:
 441         # For diff output, we need locks to ensure we don't interleave output
 442         # from different processes.
 443         manager = Manager()
 444         lock = manager.Lock()
 445     tasks = {
 446         loop.run_in_executor(
 447             executor,
 448             format_file_in_place,
 449             src,
 450             line_length,
 451             fast,
 452             write_back,
 453             mode,
 454             lock,
 455         ): src
 456         for src in sorted(sources)
 457     }
 458     pending: Iterable[asyncio.Task] = tasks.keys()
 459     try:
 460         loop.add_signal_handler(signal.SIGINT, cancel, pending)
 461         loop.add_signal_handler(signal.SIGTERM, cancel, pending)
 462     except NotImplementedError:
 463         # There are no good alternatives for these on Windows.
 464         pass
 465     while pending:
 466         done, _ = await asyncio.wait(pending, return_when=asyncio.FIRST_COMPLETED)
 467         for task in done:
 468             src = tasks.pop(task)
 469             if task.cancelled():
 470                 cancelled.append(task)
 471             elif task.exception():
 472                 report.failed(src, str(task.exception()))
 473             else:
 474                 changed = Changed.YES if task.result() else Changed.NO
 475                 # If the file was written back or was successfully checked as
 476                 # well-formatted, store this information in the cache.
 477                 if write_back is WriteBack.YES or (
 478                     write_back is WriteBack.CHECK and changed is Changed.NO
 479                 ):
 480                     sources_to_cache.append(src)
 481                 report.done(src, changed)
 482     if cancelled:
 483         await asyncio.gather(*cancelled, loop=loop, return_exceptions=True)
 484     if sources_to_cache:
 485         write_cache(cache, sources_to_cache, line_length, mode)
 486
 487
 488 def format_file_in_place(
 489     src: Path,
 490     line_length: int,
 491     fast: bool,
 492     write_back: WriteBack = WriteBack.NO,
 493     mode: FileMode = FileMode.AUTO_DETECT,
 494     lock: Any = None,  # multiprocessing.Manager().Lock() is some crazy proxy
 495 ) -> bool:
 496     """Format file under `src` path. Return True if changed.
 497
 498     If `write_back` is DIFF, write a diff to stdout. If it is YES, write reformatted
 499     code to the file.
 500     `line_length` and `fast` options are passed to :func:`format_file_contents`.
 501     """
 502     if src.suffix == ".pyi":
 503         mode |= FileMode.PYI
 504
 505     then = datetime.utcfromtimestamp(src.stat().st_mtime)
 506     with open(src, "rb") as buf:
 507         src_contents, encoding, newline = decode_bytes(buf.read())
 508     try:
 509         dst_contents = format_file_contents(
 510             src_contents, line_length=line_length, fast=fast, mode=mode
 511         )
 512     except NothingChanged:
 513         return False
 514
 515     if write_back == write_back.YES:
 516         with open(src, "w", encoding=encoding, newline=newline) as f:
 517             f.write(dst_contents)
 518     elif write_back == write_back.DIFF:
 519         now = datetime.utcnow()
 520         src_name = f"{src}\t{then} +0000"
 521         dst_name = f"{src}\t{now} +0000"
 522         diff_contents = diff(src_contents, dst_contents, src_name, dst_name)
 523         if lock:
 524             lock.acquire()
 525         try:
 526             f = io.TextIOWrapper(
 527                 sys.stdout.buffer,
 528                 encoding=encoding,
 529                 newline=newline,
 530                 write_through=True,
 531             )
 532             f.write(diff_contents)
 533             f.detach()
 534         finally:
 535             if lock:
 536                 lock.release()
 537     return True
 538
 539
 540 def format_stdin_to_stdout(
 541     line_length: int,
 542     fast: bool,
 543     write_back: WriteBack = WriteBack.NO,
 544     mode: FileMode = FileMode.AUTO_DETECT,
 545 ) -> bool:
 546     """Format file on stdin. Return True if changed.
 547
 548     If `write_back` is YES, write reformatted code back to stdout. If it is DIFF,
 549     write a diff to stdout.
 550     `line_length`, `fast`, `is_pyi`, and `force_py36` arguments are passed to
 551     :func:`format_file_contents`.
 552     """
 553     then = datetime.utcnow()
 554     src, encoding, newline = decode_bytes(sys.stdin.buffer.read())
 555     dst = src
 556     try:
 557         dst = format_file_contents(src, line_length=line_length, fast=fast, mode=mode)
 558         return True
 559
 560     except NothingChanged:
 561         return False
 562
 563     finally:
 564         f = io.TextIOWrapper(
 565             sys.stdout.buffer, encoding=encoding, newline=newline, write_through=True
 566         )
 567         if write_back == WriteBack.YES:
 568             f.write(dst)
 569         elif write_back == WriteBack.DIFF:
 570             now = datetime.utcnow()
 571             src_name = f"STDIN\t{then} +0000"
 572             dst_name = f"STDOUT\t{now} +0000"
 573             f.write(diff(src, dst, src_name, dst_name))
 574         f.detach()
 575
 576
 577 def format_file_contents(
 578     src_contents: str,
 579     *,
 580     line_length: int,
 581     fast: bool,
 582     mode: FileMode = FileMode.AUTO_DETECT,
 583 ) -> FileContent:
 584     """Reformat contents a file and return new contents.
 585
 586     If `fast` is False, additionally confirm that the reformatted code is
 587     valid by calling :func:`assert_equivalent` and :func:`assert_stable` on it.
 588     `line_length` is passed to :func:`format_str`.
 589     """
 590     if src_contents.strip() == "":
 591         raise NothingChanged
 592
 593     dst_contents = format_str(src_contents, line_length=line_length, mode=mode)
 594     if src_contents == dst_contents:
 595         raise NothingChanged
 596
 597     if not fast:
 598         assert_equivalent(src_contents, dst_contents)
 599         assert_stable(src_contents, dst_contents, line_length=line_length, mode=mode)
 600     return dst_contents
 601
 602
 603 def format_str(
 604     src_contents: str, line_length: int, *, mode: FileMode = FileMode.AUTO_DETECT
 605 ) -> FileContent:
 606     """Reformat a string and return new contents.
 607
 608     `line_length` determines how many characters per line are allowed.
 609     """
 610     src_node = lib2to3_parse(src_contents)
 611     dst_contents = ""
 612     future_imports = get_future_imports(src_node)
 613     is_pyi = bool(mode & FileMode.PYI)
 614     py36 = bool(mode & FileMode.PYTHON36) or is_python36(src_node)
 615     normalize_strings = not bool(mode & FileMode.NO_STRING_NORMALIZATION)
 616     normalize_fmt_off(src_node)
 617     lines = LineGenerator(
 618         remove_u_prefix=py36 or "unicode_literals" in future_imports,
 619         is_pyi=is_pyi,
 620         normalize_strings=normalize_strings,
 621         allow_underscores=py36,
 622     )
 623     elt = EmptyLineTracker(is_pyi=is_pyi)
 624     empty_line = Line()
 625     after = 0
 626     for current_line in lines.visit(src_node):
 627         for _ in range(after):
 628             dst_contents += str(empty_line)
 629         before, after = elt.maybe_empty_lines(current_line)
 630         for _ in range(before):
 631             dst_contents += str(empty_line)
 632         for line in split_line(current_line, line_length=line_length, py36=py36):
 633             dst_contents += str(line)
 634     return dst_contents
 635
 636
 637 def decode_bytes(src: bytes) -> Tuple[FileContent, Encoding, NewLine]:
 638     """Return a tuple of (decoded_contents, encoding, newline).
 639
 640     `newline` is either CRLF or LF but `decoded_contents` is decoded with
 641     universal newlines (i.e. only contains LF).
 642     """
 643     srcbuf = io.BytesIO(src)
 644     encoding, lines = tokenize.detect_encoding(srcbuf.readline)
 645     if not lines:
 646         return "", encoding, "\n"
 647
 648     newline = "\r\n" if b"\r\n" == lines[0][-2:] else "\n"
 649     srcbuf.seek(0)
 650     with io.TextIOWrapper(srcbuf, encoding) as tiow:
 651         return tiow.read(), encoding, newline
 652
 653
# Grammars tried by lib2to3_parse(), in this order; the first one that parses
# the source without a ParseError is used.
GRAMMARS = [
    pygram.python_grammar_no_print_statement_no_exec_statement,
    pygram.python_grammar_no_print_statement,
    pygram.python_grammar,
]
 659
 660
 661 def lib2to3_parse(src_txt: str) -> Node:
 662     """Given a string with source, return the lib2to3 Node."""
 663     grammar = pygram.python_grammar_no_print_statement
 664     if src_txt[-1:] != "\n":
 665         src_txt += "\n"
 666     for grammar in GRAMMARS:
 667         drv = driver.Driver(grammar, pytree.convert)
 668         try:
 669             result = drv.parse_string(src_txt, True)
 670             break
 671
 672         except ParseError as pe:
 673             lineno, column = pe.context[1]
 674             lines = src_txt.splitlines()
 675             try:
 676                 faulty_line = lines[lineno - 1]
 677             except IndexError:
 678                 faulty_line = "<line number missing in source>"
 679             exc = ValueError(f"Cannot parse: {lineno}:{column}: {faulty_line}")
 680     else:
 681         raise exc from None
 682
 683     if isinstance(result, Leaf):
 684         result = Node(syms.file_input, [result])
 685     return result
 686
 687
 688 def lib2to3_unparse(node: Node) -> str:
 689     """Given a lib2to3 node, return its string representation."""
 690     code = str(node)
 691     return code
 692
 693
# Type of the objects yielded by a `Visitor`.
T = TypeVar("T")
 695
 696
 697 class Visitor(Generic[T]):
 698     """Basic lib2to3 visitor that yields things of type `T` on `visit()`."""
 699
 700     def visit(self, node: LN) -> Iterator[T]:
 701         """Main method to visit `node` and its children.
 702
 703         It tries to find a `visit_*()` method for the given `node.type`, like
 704         `visit_simple_stmt` for Node objects or `visit_INDENT` for Leaf objects.
 705         If no dedicated `visit_*()` method is found, chooses `visit_default()`
 706         instead.
 707
 708         Then yields objects of type `T` from the selected visitor.
 709         """
 710         if node.type < 256:
 711             name = token.tok_name[node.type]
 712         else:
 713             name = type_repr(node.type)
 714         yield from getattr(self, f"visit_{name}", self.visit_default)(node)
 715
 716     def visit_default(self, node: LN) -> Iterator[T]:
 717         """Default `visit_*()` implementation. Recurses to children of `node`."""
 718         if isinstance(node, Node):
 719             for child in node.children:
 720                 yield from self.visit(child)
 721
 722
 723 @dataclass
 724 class DebugVisitor(Visitor[T]):
 725     tree_depth: int = 0
 726
 727     def visit_default(self, node: LN) -> Iterator[T]:
 728         indent = " " * (2 * self.tree_depth)
 729         if isinstance(node, Node):
 730             _type = type_repr(node.type)
 731             out(f"{indent}{_type}", fg="yellow")
 732             self.tree_depth += 1
 733             for child in node.children:
 734                 yield from self.visit(child)
 735
 736             self.tree_depth -= 1
 737             out(f"{indent}/{_type}", fg="yellow", bold=False)
 738         else:
 739             _type = token.tok_name.get(node.type, str(node.type))
 740             out(f"{indent}{_type}", fg="blue", nl=False)
 741             if node.prefix:
 742                 # We don't have to handle prefixes for `Node` objects since
 743                 # that delegates to the first child anyway.
 744                 out(f" {node.prefix!r}", fg="green", bold=False, nl=False)
 745             out(f" {node.value!r}", fg="blue", bold=False)
 746
 747     @classmethod
 748     def show(cls, code: Union[str, Leaf, Node]) -> None:
 749         """Pretty-print the lib2to3 AST of a given string of `code`.
 750
 751         Convenience method for debugging.
 752         """
 753         v: DebugVisitor[None] = DebugVisitor()
 754         if isinstance(code, str):
 755             code = lib2to3_parse(code)
 756         list(v.visit(code))
 757
 758
# All Python keywords, as listed by the standard `keyword` module.
KEYWORDS = set(keyword.kwlist)
WHITESPACE = {token.DEDENT, token.INDENT, token.NEWLINE}
FLOW_CONTROL = {"return", "raise", "break", "continue"}
STATEMENT = {
    syms.if_stmt,
    syms.while_stmt,
    syms.for_stmt,
    syms.try_stmt,
    syms.except_clause,
    syms.with_stmt,
    syms.funcdef,
    syms.classdef,
}
# Additional token type for standalone comments.  It is registered in
# `token.tok_name` so it has a readable name there (Visitor.visit() builds
# method names from that table for types below 256).
STANDALONE_COMMENT = 153
token.tok_name[STANDALONE_COMMENT] = "STANDALONE_COMMENT"
LOGIC_OPERATORS = {"and", "or"}
COMPARATORS = {
    token.LESS,
    token.GREATER,
    token.EQEQUAL,
    token.NOTEQUAL,
    token.LESSEQUAL,
    token.GREATEREQUAL,
}
MATH_OPERATORS = {
    token.VBAR,
    token.CIRCUMFLEX,
    token.AMPER,
    token.LEFTSHIFT,
    token.RIGHTSHIFT,
    token.PLUS,
    token.MINUS,
    token.STAR,
    token.SLASH,
    token.DOUBLESLASH,
    token.PERCENT,
    token.AT,
    token.TILDE,
    token.DOUBLESTAR,
}
STARS = {token.STAR, token.DOUBLESTAR}
VARARGS_PARENTS = {
    syms.arglist,
    syms.argument,  # double star in arglist
    syms.trailer,  # single argument to call
    syms.typedargslist,
    syms.varargslist,  # lambdas
}
UNPACKING_PARENTS = {
    syms.atom,  # single element of a list or set literal
    syms.dictsetmaker,
    syms.listmaker,
    syms.testlist_gexp,
    syms.testlist_star_expr,
}
TEST_DESCENDANTS = {
    syms.test,
    syms.lambdef,
    syms.or_test,
    syms.and_test,
    syms.not_test,
    syms.comparison,
    syms.star_expr,
    syms.expr,
    syms.xor_expr,
    syms.and_expr,
    syms.shift_expr,
    syms.arith_expr,
    syms.trailer,
    syms.term,
    syms.power,
}
ASSIGNMENTS = {
    "=",
    "+=",
    "-=",
    "*=",
    "@=",
    "/=",
    "%=",
    "&=",
    "|=",
    "^=",
    "<<=",
    ">>=",
    "**=",
    "//=",
}
# Delimiter priorities.  BracketTracker stores one such value per delimiter
# and `max_delimiter_priority()` picks the largest one found on a line.
COMPREHENSION_PRIORITY = 20
COMMA_PRIORITY = 18
TERNARY_PRIORITY = 16
LOGIC_PRIORITY = 14
STRING_PRIORITY = 12
COMPARATOR_PRIORITY = 10
# Priority per operator token; every value is below COMPARATOR_PRIORITY.
MATH_PRIORITIES = {
    token.VBAR: 9,
    token.CIRCUMFLEX: 8,
    token.AMPER: 7,
    token.LEFTSHIFT: 6,
    token.RIGHTSHIFT: 6,
    token.PLUS: 5,
    token.MINUS: 5,
    token.STAR: 4,
    token.SLASH: 4,
    token.DOUBLESLASH: 4,
    token.PERCENT: 4,
    token.AT: 4,
    token.TILDE: 3,
    token.DOUBLESTAR: 2,
}
DOT_PRIORITY = 1
 870
 871
 872 @dataclass
 873 class BracketTracker:
 874     """Keeps track of brackets on a line."""
 875
 876     depth: int = 0
 877     bracket_match: Dict[Tuple[Depth, NodeType], Leaf] = Factory(dict)
 878     delimiters: Dict[LeafID, Priority] = Factory(dict)
 879     previous: Optional[Leaf] = None
 880     _for_loop_variable: int = 0
 881     _lambda_arguments: int = 0
 882
    def mark(self, leaf: Leaf) -> None:
        """Mark `leaf` with bracket-related metadata. Keep track of delimiters.

        All leaves receive an int `bracket_depth` field that stores how deep
        within brackets a given leaf is. 0 means there are no enclosing brackets
        that started on this line.

        If a leaf is itself a closing bracket, it receives an `opening_bracket`
        field that it forms a pair with. This is a one-directional link to
        avoid reference cycles.

        If a leaf is a delimiter (a token on which Black can split the line if
        needed) and it's on depth 0, its `id()` is stored in the tracker's
        `delimiters` field.
        """
        # Comments are not tracked at all.
        if leaf.type == token.COMMENT:
            return

        # Leave the artificial depth added after `for` / `lambda` before the
        # leaf itself is processed.
        self.maybe_decrement_after_for_loop_variable(leaf)
        self.maybe_decrement_after_lambda_arguments(leaf)
        if leaf.type in CLOSING_BRACKETS:
            # Decrement first, so the closing bracket gets the same depth as
            # its opening bracket and the lookup key matches the one stored
            # when that bracket was opened.
            self.depth -= 1
            opening_bracket = self.bracket_match.pop((self.depth, leaf.type))
            leaf.opening_bracket = opening_bracket
        leaf.bracket_depth = self.depth
        if self.depth == 0:
            # A split-before delimiter is recorded on the previous leaf, a
            # split-after delimiter on the leaf itself.
            delim = is_split_before_delimiter(leaf, self.previous)
            if delim and self.previous is not None:
                self.delimiters[id(self.previous)] = delim
            else:
                delim = is_split_after_delimiter(leaf, self.previous)
                if delim:
                    self.delimiters[id(leaf)] = delim
        if leaf.type in OPENING_BRACKETS:
            # Stored under the type of the matching closing bracket, which is
            # what the pop() above looks up.
            self.bracket_match[self.depth, BRACKET[leaf.type]] = leaf
            self.depth += 1
        self.previous = leaf
        self.maybe_increment_lambda_arguments(leaf)
        self.maybe_increment_for_loop_variable(leaf)
 922
 923     def any_open_brackets(self) -> bool:
 924         """Return True if there is an yet unmatched open bracket on the line."""
 925         return bool(self.bracket_match)
 926
 927     def max_delimiter_priority(self, exclude: Iterable[LeafID] = ()) -> int:
 928         """Return the highest priority of a delimiter found on the line.
 929
 930         Values are consistent with what `is_split_*_delimiter()` return.
 931         Raises ValueError on no delimiters.
 932         """
 933         return max(v for k, v in self.delimiters.items() if k not in exclude)
 934
 935     def delimiter_count_with_priority(self, priority: int = 0) -> int:
 936         """Return the number of delimiters with the given `priority`.
 937
 938         If no `priority` is passed, defaults to max priority on the line.
 939         """
 940         if not self.delimiters:
 941             return 0
 942
 943         priority = priority or self.max_delimiter_priority()
 944         return sum(1 for p in self.delimiters.values() if p == priority)
 945
 946     def maybe_increment_for_loop_variable(self, leaf: Leaf) -> bool:
 947         """In a for loop, or comprehension, the variables are often unpacks.
 948
 949         To avoid splitting on the comma in this situation, increase the depth of
 950         tokens between `for` and `in`.
 951         """
 952         if leaf.type == token.NAME and leaf.value == "for":
 953             self.depth += 1
 954             self._for_loop_variable += 1
 955             return True
 956
 957         return False
 958
 959     def maybe_decrement_after_for_loop_variable(self, leaf: Leaf) -> bool:
 960         """See `maybe_increment_for_loop_variable` above for explanation."""
 961         if self._for_loop_variable and leaf.type == token.NAME and leaf.value == "in":
 962             self.depth -= 1
 963             self._for_loop_variable -= 1
 964             return True
 965
 966         return False
 967
 968     def maybe_increment_lambda_arguments(self, leaf: Leaf) -> bool:
 969         """In a lambda expression, there might be more than one argument.
 970
 971         To avoid splitting on the comma in this situation, increase the depth of
 972         tokens between `lambda` and `:`.
 973         """
 974         if leaf.type == token.NAME and leaf.value == "lambda":
 975             self.depth += 1
 976             self._lambda_arguments += 1
 977             return True
 978
 979         return False
 980
 981     def maybe_decrement_after_lambda_arguments(self, leaf: Leaf) -> bool:
 982         """See `maybe_increment_lambda_arguments` above for explanation."""
 983         if self._lambda_arguments and leaf.type == token.COLON:
 984             self.depth -= 1
 985             self._lambda_arguments -= 1
 986             return True
 987
 988         return False
 989
 990     def get_open_lsqb(self) -> Optional[Leaf]:
 991         """Return the most recent opening square bracket (if any)."""
 992         return self.bracket_match.get((self.depth - 1, token.RSQB))
 993
 994
 995 @dataclass
 996 class Line:
 997     """Holds leaves and comments. Can be printed with `str(line)`."""
 998
 999     depth: int = 0
1000     leaves: List[Leaf] = Factory(list)
1001     comments: List[Tuple[Index, Leaf]] = Factory(list)
1002     bracket_tracker: BracketTracker = Factory(BracketTracker)
1003     inside_brackets: bool = False
1004     should_explode: bool = False
1005
1006     def append(self, leaf: Leaf, preformatted: bool = False) -> None:
1007         """Add a new `leaf` to the end of the line.
1008
1009         Unless `preformatted` is True, the `leaf` will receive a new consistent
1010         whitespace prefix and metadata applied by :class:`BracketTracker`.
1011         Trailing commas are maybe removed, unpacked for loop variables are
1012         demoted from being delimiters.
1013
1014         Inline comments are put aside.
1015         """
1016         has_value = leaf.type in BRACKETS or bool(leaf.value.strip())
1017         if not has_value:
1018             return
1019
1020         if token.COLON == leaf.type and self.is_class_paren_empty:
1021             del self.leaves[-2:]
1022         if self.leaves and not preformatted:
1023             # Note: at this point leaf.prefix should be empty except for
1024             # imports, for which we only preserve newlines.
1025             leaf.prefix += whitespace(
1026                 leaf, complex_subscript=self.is_complex_subscript(leaf)
1027             )
1028         if self.inside_brackets or not preformatted:
1029             self.bracket_tracker.mark(leaf)
1030             self.maybe_remove_trailing_comma(leaf)
1031         if not self.append_comment(leaf):
1032             self.leaves.append(leaf)
1033
1034     def append_safe(self, leaf: Leaf, preformatted: bool = False) -> None:
1035         """Like :func:`append()` but disallow invalid standalone comment structure.
1036
1037         Raises ValueError when any `leaf` is appended after a standalone comment
1038         or when a standalone comment is not the first leaf on the line.
1039         """
1040         if self.bracket_tracker.depth == 0:
1041             if self.is_comment:
1042                 raise ValueError("cannot append to standalone comments")
1043
1044             if self.leaves and leaf.type == STANDALONE_COMMENT:
1045                 raise ValueError(
1046                     "cannot append standalone comments to a populated line"
1047                 )
1048
1049         self.append(leaf, preformatted=preformatted)
1050
1051     @property
1052     def is_comment(self) -> bool:
1053         """Is this line a standalone comment?"""
1054         return len(self.leaves) == 1 and self.leaves[0].type == STANDALONE_COMMENT
1055
1056     @property
1057     def is_decorator(self) -> bool:
1058         """Is this line a decorator?"""
1059         return bool(self) and self.leaves[0].type == token.AT
1060
1061     @property
1062     def is_import(self) -> bool:
1063         """Is this an import line?"""
1064         return bool(self) and is_import(self.leaves[0])
1065
1066     @property
1067     def is_class(self) -> bool:
1068         """Is this line a class definition?"""
1069         return (
1070             bool(self)
1071             and self.leaves[0].type == token.NAME
1072             and self.leaves[0].value == "class"
1073         )
1074
1075     @property
1076     def is_stub_class(self) -> bool:
1077         """Is this line a class definition with a body consisting only of "..."?"""
1078         return self.is_class and self.leaves[-3:] == [
1079             Leaf(token.DOT, ".") for _ in range(3)
1080         ]
1081
1082     @property
1083     def is_def(self) -> bool:
1084         """Is this a function definition? (Also returns True for async defs.)"""
1085         try:
1086             first_leaf = self.leaves[0]
1087         except IndexError:
1088             return False
1089
1090         try:
1091             second_leaf: Optional[Leaf] = self.leaves[1]
1092         except IndexError:
1093             second_leaf = None
1094         return (first_leaf.type == token.NAME and first_leaf.value == "def") or (
1095             first_leaf.type == token.ASYNC
1096             and second_leaf is not None
1097             and second_leaf.type == token.NAME
1098             and second_leaf.value == "def"
1099         )
1100
1101     @property
1102     def is_class_paren_empty(self) -> bool:
1103         """Is this a class with no base classes but using parentheses?
1104
1105         Those are unnecessary and should be removed.
1106         """
1107         return (
1108             bool(self)
1109             and len(self.leaves) == 4
1110             and self.is_class
1111             and self.leaves[2].type == token.LPAR
1112             and self.leaves[2].value == "("
1113             and self.leaves[3].type == token.RPAR
1114             and self.leaves[3].value == ")"
1115         )
1116
1117     @property
1118     def is_triple_quoted_string(self) -> bool:
1119         """Is the line a triple quoted string?"""
1120         return (
1121             bool(self)
1122             and self.leaves[0].type == token.STRING
1123             and self.leaves[0].value.startswith(('"""', "'''"))
1124         )
1125
1126     def contains_standalone_comments(self, depth_limit: int = sys.maxsize) -> bool:
1127         """If so, needs to be split before emitting."""
1128         for leaf in self.leaves:
1129             if leaf.type == STANDALONE_COMMENT:
1130                 if leaf.bracket_depth <= depth_limit:
1131                     return True
1132
1133         return False
1134
1135     def contains_multiline_strings(self) -> bool:
1136         for leaf in self.leaves:
1137             if is_multiline_string(leaf):
1138                 return True
1139
1140         return False
1141
1142     def maybe_remove_trailing_comma(self, closing: Leaf) -> bool:
1143         """Remove trailing comma if there is one and it's safe."""
1144         if not (
1145             self.leaves
1146             and self.leaves[-1].type == token.COMMA
1147             and closing.type in CLOSING_BRACKETS
1148         ):
1149             return False
1150
1151         if closing.type == token.RBRACE:
1152             self.remove_trailing_comma()
1153             return True
1154
1155         if closing.type == token.RSQB:
1156             comma = self.leaves[-1]
1157             if comma.parent and comma.parent.type == syms.listmaker:
1158                 self.remove_trailing_comma()
1159                 return True
1160
1161         # For parens let's check if it's safe to remove the comma.
1162         # Imports are always safe.
1163         if self.is_import:
1164             self.remove_trailing_comma()
1165             return True
1166
1167         # Otheriwsse, if the trailing one is the only one, we might mistakenly
1168         # change a tuple into a different type by removing the comma.
1169         depth = closing.bracket_depth + 1
1170         commas = 0
1171         opening = closing.opening_bracket
1172         for _opening_index, leaf in enumerate(self.leaves):
1173             if leaf is opening:
1174                 break
1175
1176         else:
1177             return False
1178
1179         for leaf in self.leaves[_opening_index + 1 :]:
1180             if leaf is closing:
1181                 break
1182
1183             bracket_depth = leaf.bracket_depth
1184             if bracket_depth == depth and leaf.type == token.COMMA:
1185                 commas += 1
1186                 if leaf.parent and leaf.parent.type == syms.arglist:
1187                     commas += 1
1188                     break
1189
1190         if commas > 1:
1191             self.remove_trailing_comma()
1192             return True
1193
1194         return False
1195
1196     def append_comment(self, comment: Leaf) -> bool:
1197         """Add an inline or standalone comment to the line."""
1198         if (
1199             comment.type == STANDALONE_COMMENT
1200             and self.bracket_tracker.any_open_brackets()
1201         ):
1202             comment.prefix = ""
1203             return False
1204
1205         if comment.type != token.COMMENT:
1206             return False
1207
1208         after = len(self.leaves) - 1
1209         if after == -1:
1210             comment.type = STANDALONE_COMMENT
1211             comment.prefix = ""
1212             return False
1213
1214         else:
1215             self.comments.append((after, comment))
1216             return True
1217
1218     def comments_after(self, leaf: Leaf, _index: int = -1) -> Iterator[Leaf]:
1219         """Generate comments that should appear directly after `leaf`.
1220
1221         Provide a non-negative leaf `_index` to speed up the function.
1222         """
1223         if not self.comments:
1224             return
1225
1226         if _index == -1:
1227             for _index, _leaf in enumerate(self.leaves):
1228                 if leaf is _leaf:
1229                     break
1230
1231             else:
1232                 return
1233
1234         for index, comment_after in self.comments:
1235             if _index == index:
1236                 yield comment_after
1237
1238     def remove_trailing_comma(self) -> None:
1239         """Remove the trailing comma and moves the comments attached to it."""
1240         comma_index = len(self.leaves) - 1
1241         for i in range(len(self.comments)):
1242             comment_index, comment = self.comments[i]
1243             if comment_index == comma_index:
1244                 self.comments[i] = (comma_index - 1, comment)
1245         self.leaves.pop()
1246
1247     def is_complex_subscript(self, leaf: Leaf) -> bool:
1248         """Return True iff `leaf` is part of a slice with non-trivial exprs."""
1249         open_lsqb = self.bracket_tracker.get_open_lsqb()
1250         if open_lsqb is None:
1251             return False
1252
1253         subscript_start = open_lsqb.next_sibling
1254
1255         if isinstance(subscript_start, Node):
1256             if subscript_start.type == syms.listmaker:
1257                 return False
1258
1259             if subscript_start.type == syms.subscriptlist:
1260                 subscript_start = child_towards(subscript_start, leaf)
1261         return subscript_start is not None and any(
1262             n.type in TEST_DESCENDANTS for n in subscript_start.pre_order()
1263         )
1264
1265     def __str__(self) -> str:
1266         """Render the line."""
1267         if not self:
1268             return "\n"
1269
1270         indent = "    " * self.depth
1271         leaves = iter(self.leaves)
1272         first = next(leaves)
1273         res = f"{first.prefix}{indent}{first.value}"
1274         for leaf in leaves:
1275             res += str(leaf)
1276         for _, comment in self.comments:
1277             res += str(comment)
1278         return res + "\n"
1279
1280     def __bool__(self) -> bool:
1281         """Return True if the line has leaves or comments."""
1282         return bool(self.leaves or self.comments)
1283
1284
@dataclass
class EmptyLineTracker:
    """Stateful helper that computes the number of potential extra empty
    lines needed before and after the line currently being processed.

    Note: this tracker works on lines that haven't been split yet.  It assumes
    the prefix of the first leaf consists of optional newlines.  Those newlines
    are consumed by `maybe_empty_lines()` and included in the computation.
    """

    is_pyi: bool = False
    previous_line: Optional[Line] = None
    previous_after: int = 0
    previous_defs: List[int] = Factory(list)

    def maybe_empty_lines(self, current_line: Line) -> Tuple[int, int]:
        """Return the number of extra empty lines before and after the `current_line`.

        This is for separating `def`, `async def` and `class` with extra empty
        lines (two on module-level).  The lines already requested after the
        previous line are subtracted from the "before" count.
        """
        before, after = self._maybe_empty_lines(current_line)
        adjusted_before = before - self.previous_after
        self.previous_after = after
        self.previous_line = current_line
        return adjusted_before, after

    def _maybe_empty_lines(self, current_line: Line) -> Tuple[int, int]:
        """Compute the raw (before, after) counts for `current_line`."""
        depth = current_line.depth
        max_allowed = 2 if depth == 0 and not self.is_pyi else 1

        before = 0
        if current_line.leaves:
            # Consume the first leaf's extra newlines.
            first_leaf = current_line.leaves[0]
            before = min(first_leaf.prefix.count("\n"), max_allowed)
            first_leaf.prefix = ""

        # Leaving the body of one or more definitions forces a fixed amount of
        # separation, no matter how many newlines the source had.
        if self.is_pyi:
            separation = 0 if depth else 1
        else:
            separation = 1 if depth else 2
        while self.previous_defs and self.previous_defs[-1] >= depth:
            self.previous_defs.pop()
            before = separation

        if current_line.is_decorator or current_line.is_def or current_line.is_class:
            return self._maybe_empty_lines_for_class_or_def(current_line, before)

        previous = self.previous_line
        if previous:
            if (
                previous.is_import
                and not current_line.is_import
                and depth == previous.depth
            ):
                # At least one empty line after a block of imports.
                return (before or 1), 0

            if previous.is_class and current_line.is_triple_quoted_string:
                # One empty line after a triple-quoted string that directly
                # follows a class line.
                return before, 1

        return before, 0

    def _maybe_empty_lines_for_class_or_def(
        self, current_line: Line, before: int
    ) -> Tuple[int, int]:
        """Compute (before, after) for a decorator, `def` or `class` line."""
        if not current_line.is_decorator:
            self.previous_defs.append(current_line.depth)

        previous = self.previous_line
        if previous is None:
            # Don't insert empty lines before the first line in the file.
            return 0, 0

        if previous.is_decorator:
            return 0, 0

        if previous.depth < current_line.depth and (
            previous.is_class or previous.is_def
        ):
            # First definition nested directly under a class or function.
            return 0, 0

        if (
            previous.is_comment
            and previous.depth == current_line.depth
            and before == 0
        ):
            # Keep a standalone comment glued to the definition it precedes.
            return 0, 0

        if not self.is_pyi:
            newlines = 2
        elif previous.depth > current_line.depth:
            newlines = 1
        elif current_line.is_class or previous.is_class:
            # No blank line between classes with an empty body
            both_stubs = current_line.is_stub_class and previous.is_stub_class
            newlines = 0 if both_stubs else 1
        elif current_line.is_def and not previous.is_def:
            # Blank line between a block of functions and a block of non-functions
            newlines = 1
        else:
            newlines = 0

        if current_line.depth and newlines:
            newlines -= 1
        return newlines, 0
1394
1395
@dataclass
class LineGenerator(Visitor[Line]):
    """Generates reformatted Line objects.  Empty lines are not emitted.

    Leaves are accumulated on `current_line`; the `visit_*()` methods decide
    when that line is complete and hand it out through `line()`.

    Note: destroys the tree it's visiting by mutating prefixes of its leaves
    in ways that will no longer stringify to valid Python code on the tree.
    """

    # Enables the stub-specific branches in `visit_suite()` and
    # `visit_simple_stmt()`.
    is_pyi: bool = False
    # When True, STRING leaves get their prefix and quotes normalized.
    normalize_strings: bool = True
    # The line currently being filled with leaves.
    current_line: Line = Factory(Line)
    # Forwarded to `normalize_string_prefix()`.
    remove_u_prefix: bool = False
    # Forwarded to `normalize_numeric_literal()`.
    allow_underscores: bool = False

    def line(self, indent: int = 0) -> Iterator[Line]:
        """Generate a line.

        If the current line is empty, nothing is emitted; only its depth is
        adjusted by `indent`.

        Otherwise the current line is yielded and a new current_line is set
        up at the old depth plus `indent`.
        """
        if not self.current_line:
            self.current_line.depth += indent
            return  # Line is empty, don't emit. Creating a new one unnecessary.

        complete_line = self.current_line
        self.current_line = Line(depth=complete_line.depth + indent)
        yield complete_line

    def visit_default(self, node: LN) -> Iterator[Line]:
        """Default `visit_*()` implementation. Recurses to children of `node`.

        For a leaf, the comments produced by `generate_comments()` are placed
        first, then the leaf itself is normalized and appended to the current
        line unless its type is in WHITESPACE.
        """
        if isinstance(node, Leaf):
            # Captured once, before any comment of this leaf is appended.
            any_open_brackets = self.current_line.bracket_tracker.any_open_brackets()
            # NOTE(review): `generate_comments()` is defined elsewhere;
            # presumably it yields the comments found in the leaf's prefix.
            for comment in generate_comments(node):
                if any_open_brackets:
                    # any comment within brackets is subject to splitting
                    self.current_line.append(comment)
                elif comment.type == token.COMMENT:
                    # regular trailing comment
                    self.current_line.append(comment)
                    yield from self.line()

                else:
                    # regular standalone comment
                    yield from self.line()

                    self.current_line.append(comment)
                    yield from self.line()

            normalize_prefix(node, inside_brackets=any_open_brackets)
            if self.normalize_strings and node.type == token.STRING:
                normalize_string_prefix(node, remove_u_prefix=self.remove_u_prefix)
                normalize_string_quotes(node)
            if node.type == token.NUMBER:
                normalize_numeric_literal(node, self.allow_underscores)
            if node.type not in WHITESPACE:
                self.current_line.append(node)
        yield from super().visit_default(node)

    def visit_INDENT(self, node: Node) -> Iterator[Line]:
        """Increase indentation level, maybe yield a line."""
        # In blib2to3 INDENT never holds comments.
        yield from self.line(+1)
        yield from self.visit_default(node)

    def visit_DEDENT(self, node: Node) -> Iterator[Line]:
        """Decrease indentation level, maybe yield a line."""
        # The current line might still wait for trailing comments.  At DEDENT time
        # there won't be any (they would be prefixes on the preceding NEWLINE).
        # Emit the line then.
        yield from self.line()

        # While DEDENT has no value, its prefix may contain standalone comments
        # that belong to the current indentation level.  Get 'em.
        yield from self.visit_default(node)

        # Finally, emit the dedent.
        yield from self.line(-1)

    def visit_stmt(
        self, node: Node, keywords: Set[str], parens: Set[str]
    ) -> Iterator[Line]:
        """Visit a statement.

        This implementation is shared for `if`, `while`, `for`, `try`, `except`,
        `def`, `with`, `class`, `assert` and assignments.

        The relevant Python language `keywords` for a given statement will be
        NAME leaves within it. This method puts those on a separate line.

        `parens` holds a set of string leaf values immediately after which
        invisible parens should be put.
        """
        normalize_invisible_parens(node, parens_after=parens)
        for child in node.children:
            if child.type == token.NAME and child.value in keywords:  # type: ignore
                # A statement keyword starts a new line.
                yield from self.line()

            yield from self.visit(child)

    def visit_suite(self, node: Node) -> Iterator[Line]:
        """Visit a suite.

        In stub mode, when `is_stub_suite()` accepts the suite, only its third
        child is visited; otherwise the whole suite is visited as usual.
        """
        if self.is_pyi and is_stub_suite(node):
            yield from self.visit(node.children[2])
        else:
            yield from self.visit_default(node)

    def visit_simple_stmt(self, node: Node) -> Iterator[Line]:
        """Visit a statement without nested statements."""
        # True when the statement hangs directly off a node whose type is in
        # STATEMENT, i.e. it is used in place of a suite.
        is_suite_like = node.parent and node.parent.type in STATEMENT
        if is_suite_like:
            if self.is_pyi and is_stub_body(node):
                # Stub bodies stay on the line that is already in progress.
                yield from self.visit_default(node)
            else:
                # Emit the body on its own line, one level deeper.
                yield from self.line(+1)
                yield from self.visit_default(node)
                yield from self.line(-1)

        else:
            if not self.is_pyi or not node.parent or not is_stub_suite(node.parent):
                yield from self.line()
            yield from self.visit_default(node)

    def visit_async_stmt(self, node: Node) -> Iterator[Line]:
        """Visit `async def`, `async for`, `async with`."""
        yield from self.line()

        children = iter(node.children)
        # Visit everything up to and including the ASYNC token.
        for child in children:
            yield from self.visit(child)

            if child.type == token.ASYNC:
                break

        # The child right after ASYNC is the wrapped statement.  Its children
        # are visited directly instead of visiting the statement node itself.
        internal_stmt = next(children)
        for child in internal_stmt.children:
            yield from self.visit(child)

    def visit_decorators(self, node: Node) -> Iterator[Line]:
        """Visit decorators, starting a new line before each child."""
        for child in node.children:
            yield from self.line()
            yield from self.visit(child)

    def visit_SEMI(self, leaf: Leaf) -> Iterator[Line]:
        """Remove a semicolon and put the other statement on a separate line."""
        # The semicolon leaf itself is never appended to a line.
        yield from self.line()

    def visit_ENDMARKER(self, leaf: Leaf) -> Iterator[Line]:
        """End of file. Process outstanding comments and end with a newline."""
        yield from self.visit_default(leaf)
        yield from self.line()

    def visit_STANDALONE_COMMENT(self, leaf: Leaf) -> Iterator[Line]:
        """Visit a standalone comment leaf.

        Outside of brackets the line in progress is emitted first.
        """
        if not self.current_line.bracket_tracker.any_open_brackets():
            yield from self.line()
        yield from self.visit_default(leaf)

    def __attrs_post_init__(self) -> None:
        """You are in a twisty little maze of passages.

        Binds the statement-specific `visit_*` attributes as partials of
        `visit_stmt()`, each with its own `keywords` and `parens` sets, and
        aliases the async and decorated variants to existing methods.
        """
        v = self.visit_stmt
        # Shared empty set for statements without keywords or parens.
        Ø: Set[str] = set()
        self.visit_assert_stmt = partial(v, keywords={"assert"}, parens={"assert", ","})
        self.visit_if_stmt = partial(
            v, keywords={"if", "else", "elif"}, parens={"if", "elif"}
        )
        self.visit_while_stmt = partial(v, keywords={"while", "else"}, parens={"while"})
        self.visit_for_stmt = partial(v, keywords={"for", "else"}, parens={"for", "in"})
        self.visit_try_stmt = partial(
            v, keywords={"try", "except", "else", "finally"}, parens=Ø
        )
        self.visit_except_clause = partial(v, keywords={"except"}, parens=Ø)
        self.visit_with_stmt = partial(v, keywords={"with"}, parens=Ø)
        self.visit_funcdef = partial(v, keywords={"def"}, parens=Ø)
        self.visit_classdef = partial(v, keywords={"class"}, parens=Ø)
        self.visit_expr_stmt = partial(v, keywords=Ø, parens=ASSIGNMENTS)
        self.visit_return_stmt = partial(v, keywords={"return"}, parens={"return"})
        self.visit_import_from = partial(v, keywords=Ø, parens={"import"})
        self.visit_async_funcdef = self.visit_async_stmt
        self.visit_decorated = self.visit_decorators
1577
1578
IMPLICIT_TUPLE = {syms.testlist, syms.testlist_star_expr, syms.exprlist}
# Maps every opening bracket token type to the closing type that matches it.
BRACKET = {
    token.LPAR: token.RPAR,
    token.LSQB: token.RSQB,
    token.LBRACE: token.RBRACE,
}
OPENING_BRACKETS = set(BRACKET)
CLOSING_BRACKETS = set(BRACKET.values())
BRACKETS = OPENING_BRACKETS.union(CLOSING_BRACKETS)
# Leaf types for which `whitespace()` always returns an empty prefix.
ALWAYS_NO_SPACE = CLOSING_BRACKETS.union({token.COMMA, STANDALONE_COMMENT})
1585
1586
1587 def whitespace(leaf: Leaf, *, complex_subscript: bool) -> str:  # noqa C901
1588     """Return whitespace prefix if needed for the given `leaf`.
1589
1590     `complex_subscript` signals whether the given leaf is part of a subscription
1591     which has non-trivial arguments, like arithmetic expressions or function calls.
1592     """
1593     NO = ""
1594     SPACE = " "
1595     DOUBLESPACE = "  "
1596     t = leaf.type
1597     p = leaf.parent
1598     v = leaf.value
1599     if t in ALWAYS_NO_SPACE:
1600         return NO
1601
1602     if t == token.COMMENT:
1603         return DOUBLESPACE
1604
1605     assert p is not None, f"INTERNAL ERROR: hand-made leaf without parent: {leaf!r}"
1606     if t == token.COLON and p.type not in {
1607         syms.subscript,
1608         syms.subscriptlist,
1609         syms.sliceop,
1610     }:
1611         return NO
1612
1613     prev = leaf.prev_sibling
1614     if not prev:
1615         prevp = preceding_leaf(p)
1616         if not prevp or prevp.type in OPENING_BRACKETS:
1617             return NO
1618
1619         if t == token.COLON:
1620             if prevp.type == token.COLON:
1621                 return NO
1622
1623             elif prevp.type != token.COMMA and not complex_subscript:
1624                 return NO
1625
1626             return SPACE
1627
1628         if prevp.type == token.EQUAL:
1629             if prevp.parent:
1630                 if prevp.parent.type in {
1631                     syms.arglist,
1632                     syms.argument,
1633                     syms.parameters,
1634                     syms.varargslist,
1635                 }:
1636                     return NO
1637
1638                 elif prevp.parent.type == syms.typedargslist:
1639                     # A bit hacky: if the equal sign has whitespace, it means we
1640                     # previously found it's a typed argument.  So, we're using
1641                     # that, too.
1642                     return prevp.prefix
1643
1644         elif prevp.type in STARS:
1645             if is_vararg(prevp, within=VARARGS_PARENTS | UNPACKING_PARENTS):
1646                 return NO
1647
1648         elif prevp.type == token.COLON:
1649             if prevp.parent and prevp.parent.type in {syms.subscript, syms.sliceop}:
1650                 return SPACE if complex_subscript else NO
1651
1652         elif (
1653             prevp.parent
1654             and prevp.parent.type == syms.factor
1655             and prevp.type in MATH_OPERATORS
1656         ):
1657             return NO
1658
1659         elif (
1660             prevp.type == token.RIGHTSHIFT
1661             and prevp.parent
1662             and prevp.parent.type == syms.shift_expr
1663             and prevp.prev_sibling
1664             and prevp.prev_sibling.type == token.NAME
1665             and prevp.prev_sibling.value == "print"  # type: ignore
1666         ):
1667             # Python 2 print chevron
1668             return NO
1669
1670     elif prev.type in OPENING_BRACKETS:
1671         return NO
1672
1673     if p.type in {syms.parameters, syms.arglist}:
1674         # untyped function signatures or calls
1675         if not prev or prev.type != token.COMMA:
1676             return NO
1677
1678     elif p.type == syms.varargslist:
1679         # lambdas
1680         if prev and prev.type != token.COMMA:
1681             return NO
1682
1683     elif p.type == syms.typedargslist:
1684         # typed function signatures
1685         if not prev:
1686             return NO
1687
1688         if t == token.EQUAL:
1689             if prev.type != syms.tname:
1690                 return NO
1691
1692         elif prev.type == token.EQUAL:
1693             # A bit hacky: if the equal sign has whitespace, it means we
1694             # previously found it's a typed argument.  So, we're using that, too.
1695             return prev.prefix
1696
1697         elif prev.type != token.COMMA:
1698             return NO
1699
1700     elif p.type == syms.tname:
1701         # type names
1702         if not prev:
1703             prevp = preceding_leaf(p)
1704             if not prevp or prevp.type != token.COMMA:
1705                 return NO
1706
1707     elif p.type == syms.trailer:
1708         # attributes and calls
1709         if t == token.LPAR or t == token.RPAR:
1710             return NO
1711
1712         if not prev:
1713             if t == token.DOT:
1714                 prevp = preceding_leaf(p)
1715                 if not prevp or prevp.type != token.NUMBER:
1716                     return NO
1717
1718             elif t == token.LSQB:
1719                 return NO
1720
1721         elif prev.type != token.COMMA:
1722             return NO
1723
1724     elif p.type == syms.argument:
1725         # single argument
1726         if t == token.EQUAL:
1727             return NO
1728
1729         if not prev:
1730             prevp = preceding_leaf(p)
1731             if not prevp or prevp.type == token.LPAR:
1732                 return NO
1733
1734         elif prev.type in {token.EQUAL} | STARS:
1735             return NO
1736
1737     elif p.type == syms.decorator:
1738         # decorators
1739         return NO
1740
1741     elif p.type == syms.dotted_name:
1742         if prev:
1743             return NO
1744
1745         prevp = preceding_leaf(p)
1746         if not prevp or prevp.type == token.AT or prevp.type == token.DOT:
1747             return NO
1748
1749     elif p.type == syms.classdef:
1750         if t == token.LPAR:
1751             return NO
1752
1753         if prev and prev.type == token.LPAR:
1754             return NO
1755
1756     elif p.type in {syms.subscript, syms.sliceop}:
1757         # indexing
1758         if not prev:
1759             assert p.parent is not None, "subscripts are always parented"
1760             if p.parent.type == syms.subscriptlist:
1761                 return SPACE
1762
1763             return NO
1764
1765         elif not complex_subscript:
1766             return NO
1767
1768     elif p.type == syms.atom:
1769         if prev and t == token.DOT:
1770             # dots, but not the first one.
1771             return NO
1772
1773     elif p.type == syms.dictsetmaker:
1774         # dict unpacking
1775         if prev and prev.type == token.DOUBLESTAR:
1776             return NO
1777
1778     elif p.type in {syms.factor, syms.star_expr}:
1779         # unary ops
1780         if not prev:
1781             prevp = preceding_leaf(p)
1782             if not prevp or prevp.type in OPENING_BRACKETS:
1783                 return NO
1784
1785             prevp_parent = prevp.parent
1786             assert prevp_parent is not None
1787             if prevp.type == token.COLON and prevp_parent.type in {
1788                 syms.subscript,
1789                 syms.sliceop,
1790             }:
1791                 return NO
1792
1793             elif prevp.type == token.EQUAL and prevp_parent.type == syms.argument:
1794                 return NO
1795
1796         elif t in {token.NAME, token.NUMBER, token.STRING}:
1797             return NO
1798
1799     elif p.type == syms.import_from:
1800         if t == token.DOT:
1801             if prev and prev.type == token.DOT:
1802                 return NO
1803
1804         elif t == token.NAME:
1805             if v == "import":
1806                 return SPACE
1807
1808             if prev and prev.type == token.DOT:
1809                 return NO
1810
1811     elif p.type == syms.sliceop:
1812         return NO
1813
1814     return SPACE
1815
1816
def preceding_leaf(node: Optional[LN]) -> Optional[Leaf]:
    """Return the last leaf that comes before `node` in the tree, if any.

    Starting at `node`, climb through the ancestors until one of them has a
    previous sibling.  When that sibling is a leaf, it is the result.  When it
    is a subtree, the result is the subtree's last leaf, or None if the subtree
    yields no leaves.  None is also returned when no ancestor has a previous
    sibling.
    """
    current = node
    while current:
        sibling = current.prev_sibling
        if not sibling:
            # Nothing to the left on this level; retry one level up.
            current = current.parent
            continue

        if isinstance(sibling, Leaf):
            return sibling

        # `sibling` is a subtree; keep only the final leaf it yields.
        last_leaf: Optional[Leaf] = None
        for last_leaf in sibling.leaves():
            pass
        return last_leaf
    return None
1833
1834
def child_towards(ancestor: Node, descendant: LN) -> Optional[LN]:
    """Return the child of `ancestor` that contains `descendant`.

    The search climbs from `descendant` towards the root and stops at the first
    node whose parent is not different from `ancestor`; that node is returned
    (it may be `descendant` itself).  If the climb runs out of nodes first, the
    falsy value it ended on is returned, which is None once a node without a
    parent has been passed.
    """
    candidate: Optional[LN] = descendant
    while candidate:
        if candidate.parent != ancestor:
            candidate = candidate.parent
        else:
            break
    return candidate
1841
1842
def container_of(leaf: Leaf) -> LN:
    """Return `leaf` or the topmost ancestor that still starts with `leaf`.

    A "container" is a node whose very first child carries the same prefix as
    `leaf`.  The climb stops, and the node reached so far is returned, as soon
    as the next parent is missing, starts with a different prefix, is the
    `file_input` node, or directly follows a bracket.
    """
    prefix = leaf.prefix
    candidate: LN = leaf
    while candidate:
        enclosing = candidate.parent
        if (
            enclosing is None
            or enclosing.children[0].prefix != prefix
            or enclosing.type == syms.file_input
        ):
            break

        before = enclosing.prev_sibling
        if before is not None and before.type in BRACKETS:
            break

        candidate = enclosing
    return candidate
1866
1867
def is_split_after_delimiter(leaf: Leaf, previous: Leaf = None) -> int:
    """Return the priority of `leaf` as a delimiter that is followed by a line break.

    Only commas qualify: they yield COMMA_PRIORITY, every other leaf yields 0.
    Higher numbers are higher priority.  `previous` is accepted so the
    signature matches `is_split_before_delimiter`; it is not consulted here.
    """
    return COMMA_PRIORITY if leaf.type == token.COMMA else 0
1880
1881
def is_split_before_delimiter(leaf: Leaf, previous: Leaf = None) -> int:
    """Return the priority of `leaf` as a delimiter that is preceded by a line break.

    The priorities returned here belong to delimiters that would cause a line
    break before themselves: attribute dots, math operators, comparators,
    implicitly concatenated strings, and the keywords of comprehensions,
    ternaries, comparisons and boolean logic.  Anything else yields 0.

    `previous` is the leaf that comes right before `leaf` on the line, if known.

    Higher numbers are higher priority.
    """
    if is_vararg(leaf, within=VARARGS_PARENTS | UNPACKING_PARENTS):
        # * and ** might also be MATH_OPERATORS but in this case they are not.
        # Don't treat them as a delimiter.
        return 0

    kind = leaf.type
    parent = leaf.parent
    if (
        kind == token.DOT
        and parent
        and parent.type not in {syms.import_from, syms.dotted_name}
        and (previous is None or previous.type in CLOSING_BRACKETS)
    ):
        return DOT_PRIORITY

    if (
        kind in MATH_OPERATORS
        and parent
        and parent.type not in {syms.factor, syms.star_expr}
    ):
        return MATH_PRIORITIES[kind]

    if kind in COMPARATORS:
        return COMPARATOR_PRIORITY

    if kind == token.STRING and previous is not None and previous.type == token.STRING:
        return STRING_PRIORITY

    if kind != token.NAME:
        return 0

    # From here on `leaf` is a NAME, so only keywords can be delimiters.
    word = leaf.value
    parent_type = parent.type if parent else None
    # Text of the preceding leaf when it is a NAME too; used to recognize the
    # second word of "not in" and "is not".
    if previous is not None and previous.type == token.NAME:
        previous_word = previous.value
    else:
        previous_word = None

    if word == "for" and parent_type in {syms.comp_for, syms.old_comp_for}:
        return COMPREHENSION_PRIORITY

    if word == "if" and parent_type in {syms.comp_if, syms.old_comp_if}:
        return COMPREHENSION_PRIORITY

    if word in {"if", "else"} and parent_type == syms.test:
        return TERNARY_PRIORITY

    if word == "is":
        return COMPARATOR_PRIORITY

    if (
        word == "in"
        and parent_type in {syms.comp_op, syms.comparison}
        and previous_word != "not"
    ):
        return COMPARATOR_PRIORITY

    if word == "not" and parent_type == syms.comp_op and previous_word != "is":
        return COMPARATOR_PRIORITY

    if word in LOGIC_OPERATORS and parent:
        return LOGIC_PRIORITY

    return 0
1971
1972
# Comment texts recognized as "formatting off" markers; the yapf spelling is
# accepted next to the native ones.
FMT_OFF = {"# fmt: off", "# fmt:off", "# yapf: disable"}
# Counterparts of the FMT_OFF markers.  Presumably they switch formatting back
# on; the code consuming them is not next to this definition.
FMT_ON = {"# fmt: on", "# fmt:on", "# yapf: enable"}
1975
1976
def generate_comments(leaf: LN) -> Iterator[Leaf]:
    """Generate comment leaves from the prefix of `leaf`, if it holds any.

    lib2to3 stores comments in the whitespace prefix of the token that follows
    them (see `pgen2/driver.py:Driver.parse_tokens()`).  That keeps the grammar
    free of comment rules, but it also means comments have no place of their
    own in the tree.  This function therefore yields parentless Leaf objects:
    nothing here knows what the correct parent would be.

    Each yielded leaf takes its type and value from the corresponding entry of
    `list_comments()` and gets a prefix made of as many newlines as that entry
    recorded before the comment.  The type separates inline comments
    (token.COMMENT) from standalone ones, which don't share the line with any
    code and carry the fake STANDALONE_COMMENT token identifier.
    """
    at_endmarker = leaf.type == token.ENDMARKER
    for proto in list_comments(leaf.prefix, is_endmarker=at_endmarker):
        blank_lines = "\n" * proto.newlines
        yield Leaf(proto.type, proto.value, prefix=blank_lines)
1998
1999
@dataclass
class ProtoComment:
    """Plain description of one comment found in a leaf's prefix.

    Instances are built by `list_comments()`; `generate_comments()` turns them
    into real `Leaf` objects.
    """

    type: int  # token.COMMENT or STANDALONE_COMMENT
    value: str  # content of the comment
    newlines: int  # how many newlines before the comment
    consumed: int  # how many characters of the original leaf's prefix did we consume
2006
2007
@lru_cache(maxsize=4096)
def list_comments(prefix: str, *, is_endmarker: bool) -> List[ProtoComment]:
    """Return the comments contained in `prefix`, in order of appearance.

    `prefix` is split into lines.  Every line that, ignoring leading
    whitespace, starts with "#" becomes one `ProtoComment`:

    - a comment on the first line is a trailing comment (token.COMMENT) unless
      `is_endmarker` is set; all other comments are STANDALONE_COMMENT;
    - `value` is the text normalized by `make_comment()`;
    - `newlines` counts the blank lines seen since the previous comment;
    - `consumed` is the length of all lines up to and including this one,
      counting one character per line for the newline it was split on.

    Results are memoized, so callers share the returned list.
    """
    comments: List[ProtoComment] = []
    if not (prefix and "#" in prefix):
        return comments

    offset = 0
    blank_lines = 0
    for lineno, raw_line in enumerate(prefix.split("\n")):
        offset += len(raw_line) + 1  # adding the length of the split '\n'
        text = raw_line.lstrip()
        if not text:
            blank_lines += 1
            continue

        if not text.startswith("#"):
            continue

        is_trailing = lineno == 0 and not is_endmarker
        comments.append(
            ProtoComment(
                type=token.COMMENT if is_trailing else STANDALONE_COMMENT,
                value=make_comment(text),
                newlines=blank_lines,
                consumed=offset,
            )
        )
        blank_lines = 0
    return comments
2036
2037
def make_comment(content: str) -> str:
    """Return a consistently formatted comment built from `content`.

    Trailing whitespace is dropped.  A single space is put between the hash
    sign and the text, except when the text starts with a space, "!", ":" or
    "#" (which keeps "#!", "#:" and "##" comments intact).

    If `content` doesn't start with a hash sign, one is provided.  Empty or
    whitespace-only `content` gives a bare "#".
    """
    text = content.rstrip()
    if not text:
        return "#"

    body = text[1:] if text.startswith("#") else text
    needs_space = bool(body) and body[0] not in " !:#"
    return f"# {body}" if needs_space else f"#{body}"
2055
2056
def split_line(
    line: Line, line_length: int, inner: bool = False, py36: bool = False
) -> Iterator[Line]:
    """Split a `line` into potentially many lines.

    They should fit in the allotted `line_length` but might not be able to.
    `inner` signifies that there were a pair of brackets somewhere around the
    current `line`, possibly transitively.  It is passed as True on recursive
    calls; the body of this function does not consult it.

    If `py36` is True, splitting may generate syntax that is only compatible
    with Python 3.6 and later.

    Comment lines, and lines that already fit and must not be exploded, are
    yielded unchanged.  Otherwise the applicable split functions are tried in
    order; the first one that doesn't raise :exc:`CannotSplit` wins and each of
    its output lines is split again recursively.  If every split function
    fails, the original `line` is yielded as is.
    """
    if line.is_comment:
        yield line
        return

    line_str = str(line).strip("\n")
    if not line.should_explode and is_line_short_enough(
        line, line_length=line_length, line_str=line_str
    ):
        yield line
        return

    split_funcs: List[SplitFunc]
    if line.is_def:
        split_funcs = [left_hand_split]
    else:

        def rhs(line: Line, py36: bool = False) -> Iterator[Line]:
            """Right-hand split, trying progressively larger sets of omitted trailers."""
            for omit in generate_trailers_to_omit(line, line_length):
                lines = list(right_hand_split(line, line_length, py36, omit=omit))
                if is_line_short_enough(lines[0], line_length=line_length):
                    yield from lines
                    return

            # All splits failed, best effort split with no omits.
            # This mostly happens to multiline strings that are by definition
            # reported as not fitting a single line.
            # `line_length` has to be passed explicitly: the second positional
            # parameter of `right_hand_split` is the line length, not `py36`.
            yield from right_hand_split(line, line_length, py36=py36)

        if line.inside_brackets:
            split_funcs = [delimiter_split, standalone_comment_split, rhs]
        else:
            split_funcs = [rhs]
    for split_func in split_funcs:
        # We are accumulating lines in `result` because we might want to abort
        # mission and return the original line in the end, or attempt a different
        # split altogether.
        result: List[Line] = []
        try:
            for piece in split_func(line, py36):
                if str(piece).strip("\n") == line_str:
                    raise CannotSplit("Split function returned an unchanged result")

                result.extend(
                    split_line(piece, line_length=line_length, inner=True, py36=py36)
                )
        except CannotSplit:
            # This strategy didn't work out; discard `result` and try the next.
            continue

        else:
            yield from result
            break

    else:
        # No split function succeeded.
        yield line
2124
2125
def left_hand_split(line: Line, py36: bool = False) -> Iterator[Line]:
    """Split line into many lines, starting with the first matching bracket pair.

    Leaves up to and including the first opening bracket form the head, the
    leaves between that bracket and its matching closing bracket form the
    body (one level deeper), and the closing bracket with everything after it
    forms the tail.  Comments attached to a leaf travel with that leaf.

    Raises :exc:`CannotSplit` (via `bracket_split_succeeded_or_raise`) when the
    result isn't a worthwhile split.  `py36` is not used by this function.

    Note: this usually looks weird, only use this for function definitions.
    Prefer RHS otherwise.  This is why this function is not symmetrical with
    :func:`right_hand_split` which also handles optional parentheses.
    """
    before: List[Leaf] = []
    inside: List[Leaf] = []
    after: List[Leaf] = []
    bucket = before
    opener = None
    for leaf in line.leaves:
        closes_body = (
            bucket is inside
            and leaf.type in CLOSING_BRACKETS
            and leaf.opening_bracket is opener
        )
        if closes_body:
            # With nothing between the brackets, the closing one stays with the head.
            bucket = after if inside else before
        bucket.append(leaf)
        if bucket is before and leaf.type in OPENING_BRACKETS:
            opener = leaf
            bucket = inside
    # Since body is a new indent level, remove spurious leading whitespace.
    if inside:
        normalize_prefix(inside[0], inside_brackets=True)
    # Build the new lines.
    head = Line(depth=line.depth)
    body = Line(depth=line.depth + 1, inside_brackets=True)
    tail = Line(depth=line.depth)
    parts = ((head, before), (body, inside), (tail, after))
    for target, leaves in parts:
        for leaf in leaves:
            target.append(leaf, preformatted=True)
            for comment in line.comments_after(leaf):
                target.append(comment, preformatted=True)
    bracket_split_succeeded_or_raise(head, body, tail)
    for target, _ in parts:
        if target:
            yield target
2166
2167
def right_hand_split(
    line: Line, line_length: int, py36: bool = False, omit: Collection[LeafID] = ()
) -> Iterator[Line]:
    """Split line into many lines, starting with the last matching bracket pair.

    If the split was by optional parentheses, attempt splitting without them, too.
    `omit` is a collection of closing bracket IDs that shouldn't be considered for
    this split.

    `line_length` is forwarded to the checks that decide whether the optional
    parentheses can be dropped and whether the body fits; `py36` is only passed
    along to the recursive attempt.

    Yields the non-empty lines among head, body and tail, in that order.
    Raises :exc:`CannotSplit` when no usable bracket pair is found or when the
    resulting split is rejected.

    Note: running this function modifies `bracket_depth` on the leaves of `line`.
    """
    head = Line(depth=line.depth)
    body = Line(depth=line.depth + 1, inside_brackets=True)
    tail = Line(depth=line.depth)
    tail_leaves: List[Leaf] = []
    body_leaves: List[Leaf] = []
    head_leaves: List[Leaf] = []
    current_leaves = tail_leaves
    opening_bracket = None
    closing_bracket = None
    # Walk the leaves backwards: everything up to (and including) the last
    # non-omitted closing bracket is tail, then body until the matching opening
    # bracket, and the opening bracket plus all that precedes it is head.
    for leaf in reversed(line.leaves):
        if current_leaves is body_leaves:
            if leaf is opening_bracket:
                # With an empty body the opening bracket joins the tail instead.
                current_leaves = head_leaves if body_leaves else tail_leaves
        current_leaves.append(leaf)
        if current_leaves is tail_leaves:
            if leaf.type in CLOSING_BRACKETS and id(leaf) not in omit:
                opening_bracket = leaf.opening_bracket
                closing_bracket = leaf
                current_leaves = body_leaves
    # The lists were filled back to front; restore source order.
    tail_leaves.reverse()
    body_leaves.reverse()
    head_leaves.reverse()
    # Since body is a new indent level, remove spurious leading whitespace.
    if body_leaves:
        normalize_prefix(body_leaves[0], inside_brackets=True)
    if not head_leaves:
        # No `head` means the split failed. Either `tail` has all content or
        # the matching `opening_bracket` wasn't available on `line` anymore.
        raise CannotSplit("No brackets found")

    # Build the new lines.
    for result, leaves in (head, head_leaves), (body, body_leaves), (tail, tail_leaves):
        for leaf in leaves:
            result.append(leaf, preformatted=True)
            for comment_after in line.comments_after(leaf):
                result.append(comment_after, preformatted=True)
    assert opening_bracket and closing_bracket
    body.should_explode = should_explode(body, opening_bracket)
    bracket_split_succeeded_or_raise(head, body, tail)
    if (
        # the body shouldn't be exploded
        not body.should_explode
        # the opening bracket is an optional paren
        and opening_bracket.type == token.LPAR
        and not opening_bracket.value
        # the closing bracket is an optional paren
        and closing_bracket.type == token.RPAR
        and not closing_bracket.value
        # it's not an import (optional parens are the only thing we can split on
        # in this case; attempting a split without them is a waste of time)
        and not line.is_import
        # there are no standalone comments in the body
        and not body.contains_standalone_comments(0)
        # and we can actually remove the parens
        and can_omit_invisible_parens(body, line_length)
    ):
        # Retry with this closing bracket excluded, i.e. split on an earlier
        # bracket pair and leave the optional parentheses invisible.
        omit = {id(closing_bracket), *omit}
        try:
            yield from right_hand_split(line, line_length, py36=py36, omit=omit)
            return

        except CannotSplit:
            # The retry failed.  Either give up entirely (the two cases below)
            # or fall through and split on the optional parentheses after all.
            if not (
                can_be_split(body)
                or is_line_short_enough(body, line_length=line_length)
            ):
                raise CannotSplit(
                    "Splitting failed, body is still too long and can't be split."
                )

            elif head.contains_multiline_strings() or tail.contains_multiline_strings():
                raise CannotSplit(
                    "The current optional pair of parentheses is bound to fail to "
                    "satisfy the splitting algorithm because the head or the tail "
                    "contains multiline strings which by definition never fit one "
                    "line."
                )

    # The split happens on this bracket pair; ensure both brackets are visible.
    ensure_visible(opening_bracket)
    ensure_visible(closing_bracket)
    for result in (head, body, tail):
        if result:
            yield result
2262
2263
2264 def bracket_split_succeeded_or_raise(head: Line, body: Line, tail: Line) -> None:
2265     """Raise :exc:`CannotSplit` if the last left- or right-hand split failed.
2266
2267     Do nothing otherwise.
2268
2269     A left- or right-hand split is based on a pair of brackets. Content before
2270     (and including) the opening bracket is left on one line, content inside the
2271     brackets is put on a separate line, and finally content starting with and
2272     following the closing bracket is put on a separate line.
2273
2274     Those are called `head`, `body`, and `tail`, respectively. If the split
2275     produced the same line (all content in `head`) or ended up with an empty `body`
2276     and the `tail` is just the closing bracket, then it's considered failed.
2277     """
2278     tail_len = len(str(tail).strip())
2279     if not body:
2280         if tail_len == 0:
2281             raise CannotSplit("Splitting brackets produced the same line")
2282
2283         elif tail_len < 3:
2284             raise CannotSplit(
2285                 f"Splitting brackets on an empty body to save "
2286                 f"{tail_len} characters is not worth it"
2287             )
2288
2289
def dont_increase_indentation(split_func: SplitFunc) -> SplitFunc:
    """Decorate `split_func` so that every line it yields starts with a normalized prefix.

    The wrapper calls `normalize_prefix(..., inside_brackets=True)` on the first
    leaf of each produced line before passing the line on.
    """

    @wraps(split_func)
    def split_wrapper(line: Line, py36: bool = False) -> Iterator[Line]:
        for produced in split_func(line, py36):
            first_leaf = produced.leaves[0]
            normalize_prefix(first_leaf, inside_brackets=True)
            yield produced

    return split_wrapper
2303
2304
@dont_increase_indentation
def delimiter_split(line: Line, py36: bool = False) -> Iterator[Line]:
    """Split according to delimiters of the highest priority.

    A new line is started after every leaf registered with the highest
    delimiter priority found on `line` (the last leaf is excluded when looking
    for that priority).  When splitting on commas, a trailing comma is added to
    the final line if it is safe to do so.

    If `py36` is True, the split will add trailing commas also in function
    signatures that contain `*` and `**`.

    Raises :exc:`CannotSplit` for an empty line, a line without delimiters, or
    a line whose only top-priority delimiter is a single attribute dot.
    """
    try:
        final_leaf = line.leaves[-1]
    except IndexError:
        raise CannotSplit("Line empty")

    tracker = line.bracket_tracker
    try:
        split_priority = tracker.max_delimiter_priority(exclude={id(final_leaf)})
    except ValueError:
        raise CannotSplit("No delimiters found")

    if (
        split_priority == DOT_PRIORITY
        and tracker.delimiter_count_with_priority(split_priority) == 1
    ):
        raise CannotSplit("Splitting a single attribute from its owner looks wrong")

    def fresh_line() -> Line:
        """Return an empty line with the depth and bracket state of `line`."""
        return Line(depth=line.depth, inside_brackets=line.inside_brackets)

    pending = fresh_line()
    shallowest_depth = sys.maxsize
    comma_is_safe = True

    def place(leaf: Leaf) -> Iterator[Line]:
        """Put `leaf` on the pending line, or on a new one if that is refused."""
        nonlocal pending
        try:
            pending.append_safe(leaf, preformatted=True)
        except ValueError:
            yield pending

            pending = fresh_line()
            pending.append(leaf)

    for index, leaf in enumerate(line.leaves):
        yield from place(leaf)

        for trailing_comment in line.comments_after(leaf, index):
            yield from place(trailing_comment)

        shallowest_depth = min(shallowest_depth, leaf.bracket_depth)
        if leaf.bracket_depth == shallowest_depth and is_vararg(
            leaf, within=VARARGS_PARENTS
        ):
            # A vararg at the shallowest depth seen so far: a trailing comma
            # is then only added when `py36` allows it.
            comma_is_safe = comma_is_safe and py36
        if tracker.delimiters.get(id(leaf)) == split_priority:
            yield pending

            pending = fresh_line()
    if pending:
        if (
            comma_is_safe
            and split_priority == COMMA_PRIORITY
            and pending.leaves[-1].type not in {token.COMMA, STANDALONE_COMMENT}
        ):
            pending.append(Leaf(token.COMMA, ","))
        yield pending
2367
2368
@dont_increase_indentation
def standalone_comment_split(line: Line, py36: bool = False) -> Iterator[Line]:
    """Split standalone comments from the rest of the line.

    Leaves and their comments are appended to one line for as long as
    `append_safe` accepts them; each refusal (a ValueError) closes the line
    built so far and opens a new one starting with the refused leaf.

    Raises :exc:`CannotSplit` if `line` has no standalone comments.  `py36` is
    not used by this function.
    """
    if not line.contains_standalone_comments(0):
        raise CannotSplit("Line does not have any standalone comments")

    def fresh_line() -> Line:
        """Return an empty line with the depth and bracket state of `line`."""
        return Line(depth=line.depth, inside_brackets=line.inside_brackets)

    pending = fresh_line()

    def place(leaf: Leaf) -> Iterator[Line]:
        """Put `leaf` on the pending line, or on a new one if that is refused."""
        nonlocal pending
        try:
            pending.append_safe(leaf, preformatted=True)
        except ValueError:
            yield pending

            pending = fresh_line()
            pending.append(leaf)

    for index, leaf in enumerate(line.leaves):
        yield from place(leaf)

        for trailing_comment in line.comments_after(leaf, index):
            yield from place(trailing_comment)

    if pending:
        yield pending
2396
2397
def is_import(leaf: Leaf) -> bool:
    """Return True if the given leaf starts an import statement.

    That is the case for the name `import` directly under an `import_name`
    node and for the name `from` directly under an `import_from` node.
    """
    if leaf.type != token.NAME:
        return False

    parent = leaf.parent
    if not parent:
        return False

    keyword_text = leaf.value
    if keyword_text == "import":
        return parent.type == syms.import_name

    if keyword_text == "from":
        return parent.type == syms.import_from

    return False
2410
2411
def normalize_prefix(leaf: Leaf, *, inside_brackets: bool) -> None:
    """Reduce the prefix of `leaf` to newlines only, or to nothing at all.

    Inside brackets the prefix is always emptied.  Outside of them the newlines
    that follow the last "#" in the prefix are kept, minus one; without any "#"
    all newlines are kept.  A backslash before the first "#" empties the prefix
    as well.

    Note: don't use backslashes for formatting or you'll lose your voting rights.
    Mutates its argument.
    """
    if inside_brackets:
        leaf.prefix = ""
        return

    before_hash, *after_hash = leaf.prefix.split("#")
    if "\\" in before_hash:
        leaf.prefix = ""
        return

    if after_hash:
        # One newline fewer than what follows the last "#".
        newline_count = after_hash[-1].count("\n") - 1
    else:
        newline_count = before_hash.count("\n")
    leaf.prefix = "\n" * newline_count
2428
2429
def normalize_string_prefix(leaf: Leaf, remove_u_prefix: bool = False) -> None:
    """Lowercase the prefix letters (f, u, r, b) of a string literal.

    With `remove_u_prefix` set, any "u" is dropped from the prefix as well.
    The rest of the literal is left untouched.

    Note: Mutates its argument.
    """
    match = re.match(r"^([furbFURB]*)(.*)$", leaf.value, re.DOTALL)
    assert match is not None, f"failed to match string {leaf.value!r}"
    old_prefix, remainder = match.groups()
    lowered = old_prefix.lower()
    if remove_u_prefix:
        lowered = lowered.replace("u", "")
    leaf.value = lowered + remainder
2444
2445
def normalize_string_quotes(leaf: Leaf) -> None:
    """Prefer double quotes but only if it doesn't cause more escaping.

    Adds or removes backslashes as appropriate. Doesn't parse and fix
    strings nested in f-strings (yet).

    The literal is left as it is when it already uses triple double quotes,
    when it is a raw string containing an unescaped target quote, when an
    f-string replacement field would end up containing a backslash, or when
    switching quotes would not reduce escaping (ties go to double quotes).

    Note: Mutates its argument.
    """
    # Look at the literal without its prefix letters to find the quote style.
    value = leaf.value.lstrip("furbFURB")
    if value[:3] == '"""':
        return

    elif value[:3] == "'''":
        orig_quote = "'''"
        new_quote = '"""'
    elif value[0] == '"':
        # Already double-quoted: single quotes are only chosen further down if
        # they need strictly fewer backslashes.
        orig_quote = '"'
        new_quote = "'"
    else:
        orig_quote = "'"
        new_quote = '"'
    first_quote_pos = leaf.value.find(orig_quote)
    if first_quote_pos == -1:
        return  # There's an internal error

    prefix = leaf.value[:first_quote_pos]
    # A target quote preceded by an even number of backslashes, i.e. unescaped.
    unescaped_new_quote = re.compile(rf"(([^\\]|^)(\\\\)*){new_quote}")
    # A target / original quote preceded by an odd number of backslashes.
    escaped_new_quote = re.compile(rf"([^\\]|^)\\((?:\\\\)*){new_quote}")
    escaped_orig_quote = re.compile(rf"([^\\]|^)\\((?:\\\\)*){orig_quote}")
    body = leaf.value[first_quote_pos + len(orig_quote) : -len(orig_quote)]
    if "r" in prefix.casefold():
        if unescaped_new_quote.search(body):
            # There's at least one unescaped new_quote in this raw string
            # so converting is impossible
            return

        # Do not introduce or remove backslashes in raw strings
        new_body = body
    else:
        # remove unnecessary escapes
        new_body = sub_twice(escaped_new_quote, rf"\1\2{new_quote}", body)
        if body != new_body:
            # Consider the string without unnecessary escapes as the original
            body = new_body
            leaf.value = f"{prefix}{orig_quote}{body}{orig_quote}"
        # Original quotes no longer need a backslash; target quotes now do.
        new_body = sub_twice(escaped_orig_quote, rf"\1\2{orig_quote}", new_body)
        new_body = sub_twice(unescaped_new_quote, rf"\1\\{new_quote}", new_body)
    if "f" in prefix.casefold():
        matches = re.findall(r"[^{]\{(.*?)\}[^}]", new_body)
        for m in matches:
            if "\\" in str(m):
                # Do not introduce backslashes in interpolated expressions
                return
    if new_quote == '"""' and new_body[-1:] == '"':
        # edge case:
        # a body ending in a double quote would run into the closing triple
        # quote, so that last quote gets escaped.
        new_body = new_body[:-1] + '\\"'
    orig_escape_count = body.count("\\")
    new_escape_count = new_body.count("\\")
    if new_escape_count > orig_escape_count:
        return  # Do not introduce more escaping

    if new_escape_count == orig_escape_count and orig_quote == '"':
        return  # Prefer double quotes

    leaf.value = f"{prefix}{new_quote}{new_body}{new_quote}"
2511
2512
def normalize_numeric_literal(leaf: Leaf, allow_underscores: bool) -> None:
    """Normalize a numeric (float, int, and complex) literal in place.

    All letters (e in exponents, j in complex literals, a-f in hex literals,
    base prefixes) are lowercased.  Octal, hex and binary literals receive no
    further treatment.  For the remaining literals the digit groups are passed
    through `format_float_or_int_string` / `format_int_string` together with
    `allow_underscores`, and a "+" sign in an exponent is dropped.

    Note: Mutates its argument.
    """
    lowered = leaf.value.lower()
    if lowered.startswith(("0o", "0x", "0b")):
        # Leave octal, hex, and binary literals alone for now.
        normalized = lowered
    elif "e" in lowered:
        mantissa, exponent = lowered.split("e")
        sign = "-" if exponent.startswith("-") else ""
        if exponent.startswith(("-", "+")):
            exponent = exponent[1:]
        mantissa = format_float_or_int_string(mantissa, allow_underscores)
        exponent = format_int_string(exponent, allow_underscores)
        normalized = f"{mantissa}e{sign}{exponent}"
    elif "j" in lowered or "l" in lowered:
        # Complex numbers and Python 2 longs
        digits, suffix = lowered[:-1], lowered[-1]
        normalized = f"{format_float_or_int_string(digits, allow_underscores)}{suffix}"
    else:
        normalized = format_float_or_int_string(lowered, allow_underscores)
    leaf.value = normalized
2542
2543
def format_float_or_int_string(text: str, allow_underscores: bool) -> str:
    """Format the digits of a float string like "1.0" or of a plain integer.

    Text without a dot is handed to `format_int_string` as a whole.  Otherwise
    both sides of the dot are formatted separately, and a missing side is
    filled in with "0" (so "1." becomes "1.0" and ".5" becomes "0.5").
    """
    if "." not in text:
        return format_int_string(text, allow_underscores)

    whole, fraction = text.split(".")
    sides = [
        format_int_string(side, allow_underscores) if side else "0"
        for side in (whole, fraction)
    ]
    return ".".join(sides)
2553
2554
def format_int_string(text: str, allow_underscores: bool) -> str:
    """Normalize underscores in a string of digits to e.g. 1_000_000.

    Input must be a string consisting only of digits and underscores.

    When `allow_underscores` is false, `text` is returned untouched.  Otherwise
    existing underscores are dropped and, if more than six digits remain, the
    digits are regrouped in threes counting from the right.  Every digit is
    kept, including leading zeros, so a fractional part such as the "0000001"
    of "1.0000001" keeps its value.
    """
    if not allow_underscores:
        return text

    digits = text.replace("_", "")
    if len(digits) <= 6:
        # No underscores for numbers <= 6 digits long.
        return digits

    # Group the string itself instead of round-tripping through `int()`: the
    # conversion would drop leading zeros and `format()` would then pad the
    # result with spaces.
    head = len(digits) % 3 or 3
    groups = [digits[:head]]
    groups.extend(digits[start : start + 3] for start in range(head, len(digits), 3))
    return "_".join(groups)
2569
2570
def normalize_invisible_parens(node: Node, parens_after: Set[str]) -> None:
    """Make existing optional parentheses invisible or create new ones.

    `parens_after` is a set of string leaf values immediately after which parens
    should be put.

    Standardizes on visible parentheses for single-element tuples, and keeps
    existing visible parentheses for other tuples and generator expressions.

    The tree under `node` is modified in place.  Nothing is changed when the
    prefix of `node` carries a `# fmt: off` comment.
    """
    for pc in list_comments(node.prefix, is_endmarker=False):
        if pc.value in FMT_OFF:
            # This `node` has a prefix with `# fmt: off`, don't mess with parens.
            return

    # True while the child being visited directly follows a leaf whose value is
    # in `parens_after`.
    check_lpar = False
    # Iterate over a copy: the loop body replaces and inserts children of `node`.
    for index, child in enumerate(list(node.children)):
        if check_lpar:
            if child.type == syms.atom:
                maybe_make_parens_invisible_in_atom(child)
            elif is_one_tuple(child):
                # wrap child in visible parentheses
                lpar = Leaf(token.LPAR, "(")
                rpar = Leaf(token.RPAR, ")")
                child.remove()
                node.insert_child(index, Node(syms.atom, [lpar, child, rpar]))
            elif node.type == syms.import_from:
                # "import from" nodes store parentheses directly as part of
                # the statement
                if child.type == token.LPAR:
                    # make parentheses invisible
                    child.value = ""  # type: ignore
                    # The last child is assumed to be the matching RPAR.
                    node.children[-1].value = ""  # type: ignore
                elif child.type != token.STAR:
                    # insert invisible parentheses
                    node.insert_child(index, Leaf(token.LPAR, ""))
                    node.append_child(Leaf(token.RPAR, ""))
                # Everything after the `import` keyword was handled above, so
                # the remaining children are not visited.
                break

            elif not (isinstance(child, Leaf) and is_multiline_string(child)):
                # wrap child in invisible parentheses
                lpar = Leaf(token.LPAR, "")
                rpar = Leaf(token.RPAR, "")
                # `remove()` presumably returns the child's former position (or
                # None); fall back to 0 in that case.
                index = child.remove() or 0
                node.insert_child(index, Node(syms.atom, [lpar, child, rpar]))

        check_lpar = isinstance(child, Leaf) and child.value in parens_after
2617
2618
def normalize_fmt_off(node: Node) -> None:
    """Turn every `# fmt: off`/`# fmt: on` region under `node` into a standalone comment."""
    # Each call converts at most one pair; keep going until a pass finds none.
    while convert_one_fmt_off_pair(node):
        pass
2624
2625
def convert_one_fmt_off_pair(node: Node) -> bool:
    """Convert content of a single `# fmt: off`/`# fmt: on` into a standalone comment.

    Walks the leaves of `node` looking for a `# fmt: off` comment in a leaf's
    prefix.  For the first usable one, the nodes produced by
    `generate_ignored_nodes()` are removed from the tree and replaced by one
    STANDALONE_COMMENT leaf whose value is the comment followed by the verbatim
    text of those nodes.

    Returns True if a pair was converted.
    """
    for leaf in node.leaves():
        # How much of the prefix was consumed by the comments preceding the
        # current one; that part stays in front of the replacement leaf.
        previous_consumed = 0
        for comment in list_comments(leaf.prefix, is_endmarker=False):
            if comment.value in FMT_OFF:
                # We only want standalone comments. If there's no previous leaf or
                # the previous leaf is indentation, it's a standalone comment in
                # disguise.
                if comment.type != STANDALONE_COMMENT:
                    prev = preceding_leaf(leaf)
                    if prev and prev.type not in WHITESPACE:
                        continue

                ignored_nodes = list(generate_ignored_nodes(leaf))
                if not ignored_nodes:
                    continue

                first = ignored_nodes[0]  # Can be a container node with the `leaf`.
                parent = first.parent
                prefix = first.prefix
                # Strip the part of the prefix up to and including this comment
                # so it is not repeated when `first` is rendered below.
                first.prefix = prefix[comment.consumed :]
                hidden_value = (
                    comment.value + "\n" + "".join(str(n) for n in ignored_nodes)
                )
                if hidden_value.endswith("\n"):
                    # That happens when one of the `ignored_nodes` ended with a NEWLINE
                    # leaf (possibly followed by a DEDENT).
                    hidden_value = hidden_value[:-1]
                # Detach the ignored nodes, remembering where the first one was
                # so the replacement can take its place.
                first_idx = None
                for ignored in ignored_nodes:
                    index = ignored.remove()
                    if first_idx is None:
                        first_idx = index
                assert parent is not None, "INTERNAL ERROR: fmt: on/off handling (1)"
                assert first_idx is not None, "INTERNAL ERROR: fmt: on/off handling (2)"
                parent.insert_child(
                    first_idx,
                    Leaf(
                        STANDALONE_COMMENT,
                        hidden_value,
                        prefix=prefix[:previous_consumed] + "\n" * comment.newlines,
                    ),
                )
                # The tree changed under the iteration; report success and let
                # the caller start over.
                return True

            # NOTE(review): the `continue` statements above skip this update.
            previous_consumed = comment.consumed

    return False
2678
2679
def generate_ignored_nodes(leaf: Leaf) -> Iterator[LN]:
    """Yield `container_of(leaf)` and its following siblings until `# fmt: on`.

    Generation stops at the first sibling whose prefix holds a `# fmt: on`
    comment, at the ENDMARKER, or when there are no more siblings (the end of
    the block).
    """
    current: Optional[LN] = container_of(leaf)
    while current is not None:
        if current.type == token.ENDMARKER:
            break

        comments = list_comments(current.prefix, is_endmarker=False)
        if any(comment.value in FMT_ON for comment in comments):
            return

        yield current

        current = current.next_sibling
2694
2695
def maybe_make_parens_invisible_in_atom(node: LN) -> bool:
    """Blank out the parentheses of atom `node` when that is safe, recursively.

    Returns True when the parentheses of `node` itself were made invisible.
    Empty tuples, one-tuples, yield expressions and atoms containing a
    delimiter of at least comma priority are left untouched.
    """
    if node.type != syms.atom:
        return False

    if is_empty_tuple(node) or is_one_tuple(node) or is_yield(node):
        return False

    if max_delimiter_priority_in_atom(node) >= COMMA_PRIORITY:
        return False

    opener, closer = node.children[0], node.children[-1]
    if opener.type != token.LPAR or closer.type != token.RPAR:
        return False

    # An empty value is what makes a parenthesis "invisible".
    opener.value = ""  # type: ignore
    closer.value = ""  # type: ignore
    if len(node.children) > 1:
        # Redundant nested parentheses are handled the same way.
        maybe_make_parens_invisible_in_atom(node.children[1])
    return True
2718
2719
def is_empty_tuple(node: LN) -> bool:
    """Return True if `node` is an atom made of just `(` and `)`."""
    if node.type != syms.atom:
        return False

    if len(node.children) != 2:
        return False

    lpar, rpar = node.children
    return lpar.type == token.LPAR and rpar.type == token.RPAR
2728
2729
def is_one_tuple(node: LN) -> bool:
    """Return True if `node` is a single-element tuple, parenthesized or not.

    Either way the tuple body must consist of exactly two children, the second
    being a comma.
    """
    if node.type != syms.atom:
        # Bare form: the node itself is the tuple body.
        if node.type not in IMPLICIT_TUPLE:
            return False

        body = node
    else:
        # Parenthesized form: `(` testlist_gexp `)`.
        if len(node.children) != 3:
            return False

        lpar, gexp, rpar = node.children
        if (
            lpar.type != token.LPAR
            or gexp.type != syms.testlist_gexp
            or rpar.type != token.RPAR
        ):
            return False

        body = gexp

    return len(body.children) == 2 and body.children[1].type == token.COMMA
2751
2752
def is_yield(node: LN) -> bool:
    """Return True if `node` holds a `yield` or `yield from` expression.

    Any number of enclosing parenthesized atoms is looked through.
    """
    current = node
    while True:
        if current.type == syms.yield_expr:
            return True

        if current.type == token.NAME and current.value == "yield":  # type: ignore
            return True

        if current.type != syms.atom or len(current.children) != 3:
            return False

        lpar, inner, rpar = current.children
        if lpar.type != token.LPAR or rpar.type != token.RPAR:
            return False

        # Peel one layer of parentheses and look again.
        current = inner
2772
2773
def is_vararg(leaf: Leaf, within: Set[NodeType]) -> bool:
    """Return True if `leaf` is a star or double star in a vararg or kwarg.

    `within` holds the node types that count as a match for the construct
    owning the star.  If it includes VARARGS_PARENTS, this applies to function
    signatures.  If it includes UNPACKING_PARENTS, it applies to right hand-side
    extended iterable unpacking (PEP 3132) and additional unpacking
    generalizations (PEP 448).
    """
    if leaf.type not in STARS:
        return False

    owner = leaf.parent
    if not owner:
        return False

    if owner.type == syms.star_expr:
        # Star expressions are also used as assignment targets in extended
        # iterable unpacking (PEP 3132), so judge by the enclosing node instead.
        owner = owner.parent
        if not owner:
            return False

    return owner.type in within
2795
2796
def is_multiline_string(leaf: Leaf) -> bool:
    """Return True if `leaf` is a triple-quoted string containing a newline."""
    # Drop any combination of string prefix letters before looking at the quotes.
    unprefixed = leaf.value.lstrip("furbFURB")
    if not unprefixed.startswith(('"""', "'''")):
        return False

    return "\n" in unprefixed
2801
2802
def is_stub_suite(node: Node) -> bool:
    """Return True if `node` is a suite whose only statement is a stub body.

    Such a suite has exactly four children: NEWLINE, INDENT, the statement, and
    DEDENT.
    """
    if len(node.children) != 4:
        return False

    newline, indent, body, dedent = node.children
    well_formed = (
        newline.type == token.NEWLINE
        and indent.type == token.INDENT
        and dedent.type == token.DEDENT
    )
    return well_formed and is_stub_body(body)
2814
2815
def is_stub_body(node: LN) -> bool:
    """Return True if `node` is a simple statement consisting of an ellipsis.

    The ellipsis is recognized as an atom made of exactly three `.` leaves.
    """
    if not (
        isinstance(node, Node)
        and node.type == syms.simple_stmt
        and len(node.children) == 2
    ):
        return False

    statement = node.children[0]
    if statement.type != syms.atom or len(statement.children) != 3:
        return False

    dot = Leaf(token.DOT, ".")
    return all(piece == dot for piece in statement.children)
2830
2831
def max_delimiter_priority_in_atom(node: LN) -> int:
    """Return the highest delimiter priority found inside atom `node`.

    Only atoms whose contents sit between a pair of parentheses are inspected.
    Returns 0 if `node` isn't an atom, isn't enclosed in parentheses, or when
    the bracket tracker raises ValueError while computing the maximum.
    """
    if node.type != syms.atom:
        return 0

    opener, closer = node.children[0], node.children[-1]
    if opener.type != token.LPAR or closer.type != token.RPAR:
        return 0

    tracker = BracketTracker()
    for inner in node.children[1:-1]:
        # Feed the tracker every leaf between the parentheses, in order.
        leaves = [inner] if isinstance(inner, Leaf) else inner.leaves()
        for leaf in leaves:
            tracker.mark(leaf)

    try:
        return tracker.max_delimiter_priority()

    except ValueError:
        return 0
2858
2859
def ensure_visible(leaf: Leaf) -> None:
    """Give a parenthesis leaf its visible value back.

    Parentheses may have been made invisible (empty value) as part of some
    statements (see :func:`normalize_invisible_parens` and
    :func:`visit_import_from`).  Leaves of any other type are left alone.
    """
    visible = {token.LPAR: "(", token.RPAR: ")"}.get(leaf.type)
    if visible is not None:
        leaf.value = visible
2870
2871
def should_explode(line: Line, opening_bracket: Leaf) -> bool:
    """Should `line` immediately be split with `delimiter_split()` after RHS?

    That is the case when `opening_bracket` belongs to an atom or an import
    statement and the highest delimiter priority in `line` (a trailing comma
    aside) is the comma priority.
    """
    owner = opening_bracket.parent
    if not owner:
        return False

    if owner.type not in {syms.atom, syms.import_from}:
        return False

    # Substring test: an empty value (invisible parenthesis) passes as well.
    if opening_bracket.value not in "[{(":
        return False

    try:
        trailing = line.leaves[-1]
        ignored: Set[LeafID] = set()
        if trailing.type == token.COMMA:
            # The trailing comma itself must not count as a delimiter.
            ignored.add(id(trailing))
        max_priority = line.bracket_tracker.max_delimiter_priority(exclude=ignored)
    except (IndexError, ValueError):
        # Empty line, or a failure to compute a maximum priority.
        return False

    return max_priority == COMMA_PRIORITY
2889
2890
def is_python36(node: Node) -> bool:
    """Return True if the current file is using Python 3.6+ features.

    Currently looking for:
    - f-strings (with any capitalization of the `f`/`rf`/`fr` prefix); and
    - trailing commas after * or ** in function signatures and calls.
    """
    for n in node.pre_order():
        if n.type == token.STRING:
            # Prefix letters are case-insensitive, so `Rf"..."` or `fR'...'` are
            # f-strings just like `rf"..."`; compare the lowercased head.
            value_head = n.value[:2].lower()  # type: ignore
            if value_head in {'f"', "f'", "rf", "fr"}:
                return True

        elif (
            n.type in {syms.typedargslist, syms.arglist}
            and n.children
            and n.children[-1].type == token.COMMA
        ):
            # The argument list ends with a trailing comma; look for a star
            # either directly in the list or inside one of its arguments.
            for ch in n.children:
                if ch.type in STARS:
                    return True

                if ch.type == syms.argument:
                    for argch in ch.children:
                        if argch.type in STARS:
                            return True

    return False
2919
2920
def generate_trailers_to_omit(line: Line, line_length: int) -> Iterator[Set[LeafID]]:
    """Generate sets of closing bracket IDs that should be omitted in a RHS.

    Brackets can be omitted if the entire trailer up to and including
    a preceding closing bracket fits in one line.

    Yielded sets are cumulative (contain results of previous yields, too).  First
    set is empty.  The very same set object is yielded every time and grows in
    place, so callers that need a snapshot have to copy it.

    The leaves of `line` are scanned from the end.  Scanning stops as soon as
    the accumulated length exceeds `line_length`, or a standalone or inline
    comment is met.
    """

    omit: Set[LeafID] = set()
    yield omit

    # Indentation counts toward the available width.
    length = 4 * line.depth
    # The opener matching the trailer currently being crossed, if any.
    opening_bracket = None
    # The closer of the most recently seen trailer.
    closing_bracket = None
    # Closers nested in a trailer (or belonging to empty bracket pairs); they
    # are only added to `omit` together with an enclosing trailer.
    inner_brackets: Set[LeafID] = set()
    for index, leaf, leaf_length in enumerate_with_length(line, reversed=True):
        length += leaf_length
        if length > line_length:
            break

        # `leaf_length` includes trailing comments; any excess over the leaf's
        # own text means there is one.
        has_inline_comment = leaf_length > len(leaf.value) + len(leaf.prefix)
        if leaf.type == STANDALONE_COMMENT or has_inline_comment:
            break

        if opening_bracket:
            if leaf is opening_bracket:
                opening_bracket = None
            elif leaf.type in CLOSING_BRACKETS:
                inner_brackets.add(id(leaf))
        elif leaf.type in CLOSING_BRACKETS:
            if not leaf.value:
                # Invisible parentheses never start a trailer.
                continue

            if index > 0 and line.leaves[index - 1].type in OPENING_BRACKETS:
                # Empty brackets would fail a split so treat them as "inner"
                # brackets (e.g. only add them to the `omit` set if another
                # pair of brackets was good enough.
                inner_brackets.add(id(leaf))
                continue

            opening_bracket = leaf.opening_bracket
            if closing_bracket:
                omit.add(id(closing_bracket))
                omit.update(inner_brackets)
                inner_brackets.clear()
                yield omit
            closing_bracket = leaf
2973
2974
def get_future_imports(node: Node) -> Set[str]:
    """Return the names imported from `__future__` at the top of the file.

    Only the leading run of simple statements is examined: docstring-like
    string statements are skipped, `from __future__ import ...` statements are
    collected, and anything else ends the search.
    """

    def names_in(children: List[LN]) -> Generator[str, None, None]:
        """Yield the original (un-aliased) names imported by `children`."""
        for item in children:
            if isinstance(item, Leaf):
                # Punctuation and keywords are leaves too; only names count.
                if item.type == token.NAME:
                    yield item.value
                continue

            if item.type == syms.import_as_names:
                yield from names_in(item.children)
                continue

            if item.type == syms.import_as_name:
                original = item.children[0]
                assert isinstance(original, Leaf), "Invalid syntax parsing imports"
                assert original.type == token.NAME, "Invalid syntax parsing imports"
                yield original.value
                continue

            assert False, "Invalid syntax parsing imports"

    found: Set[str] = set()
    for statement in node.children:
        if statement.type != syms.simple_stmt:
            break

        head = statement.children[0]
        if isinstance(head, Leaf):
            # Continue looking if we see a docstring; otherwise stop.
            is_docstring = (
                len(statement.children) == 2
                and head.type == token.STRING
                and statement.children[1].type == token.NEWLINE
            )
            if is_docstring:
                continue

            break

        if head.type != syms.import_from:
            break

        module_name = head.children[1]
        if not isinstance(module_name, Leaf) or module_name.value != "__future__":
            break

        # Children from index 3 on follow `from <module> import`.
        found.update(names_in(head.children[3:]))

    return found
3016
3017
def gen_python_files_in_dir(
    path: Path,
    root: Path,
    include: Pattern[str],
    exclude: Pattern[str],
    report: "Report",
) -> Iterator[Path]:
    """Recursively yield the files under `path` selected by `include`.

    Both regexes are searched in the entry's resolved path relative to `root`,
    spelled POSIX-style with a leading "/" (and a trailing "/" for
    directories).  Entries with a non-empty `exclude` match are skipped along
    with everything below them.

    Symbolic links pointing outside of the `root` directory are ignored.

    `report` is where output about exclusions goes.
    """
    assert root.is_absolute(), f"INTERNAL ERROR: `root` must be absolute but is {root}"
    for entry in path.iterdir():
        try:
            relative = entry.resolve().relative_to(root)
        except ValueError:
            if not entry.is_symlink():
                raise

            report.path_ignored(
                entry, f"is a symbolic link that points outside {root}"
            )
            continue

        is_directory = entry.is_dir()
        normalized_path = "/" + relative.as_posix() + ("/" if is_directory else "")
        excluded = exclude.search(normalized_path)
        # An empty match does not count as an exclusion.
        if excluded and excluded.group(0):
            report.path_ignored(entry, f"matches the --exclude regular expression")
            continue

        if is_directory:
            yield from gen_python_files_in_dir(entry, root, include, exclude, report)

        elif entry.is_file():
            if include.search(normalized_path):
                yield entry
3059
3060
@lru_cache()
def find_project_root(srcs: Iterable[str]) -> Path:
    """Return a directory containing .git, .hg, or pyproject.toml.

    That directory can be one of the directories passed in `srcs` or their
    common parent.

    If no directory in the tree contains a marker that would specify it's the
    project root, the root of the file system is returned.

    `srcs` has to be hashable (e.g. a tuple) because results are cached with
    `lru_cache`.
    """
    if not srcs:
        return Path("/").resolve()

    # For every source collect the directories that contain it; a source that
    # is a directory itself is a candidate, too.
    candidates = []
    for src in srcs:
        resolved = Path(src).resolve()
        ancestors = set(resolved.parents)
        if resolved.is_dir():
            ancestors.add(resolved)
        candidates.append(ancestors)

    # Only a directory shared by *all* sources may be the project root.  The
    # shared directories lie on one chain, so the deepest one is the common base.
    shared = set.intersection(*candidates)
    if not shared:
        # Nothing in common (e.g. sources on different drives).
        return Path("/").resolve()

    common_base = max(shared, key=lambda candidate: len(candidate.parts))
    for directory in (common_base, *common_base.parents):
        if (directory / ".git").is_dir():
            return directory

        if (directory / ".hg").is_dir():
            return directory

        if (directory / "pyproject.toml").is_file():
            return directory

    # No marker found: `directory` is now the topmost ancestor.
    return directory
3089
3090
@dataclass
class Report:
    """Tally of per-file outcomes. `str(report)` renders the summary line."""

    # Selects the "would ..." wording and makes changed files affect the
    # return code.
    check: bool = False
    # Suppresses the per-file "reformatted" messages unless `verbose` is set.
    quiet: bool = False
    # Enables messages about unchanged and ignored paths.
    verbose: bool = False
    change_count: int = 0
    same_count: int = 0
    failure_count: int = 0

    def done(self, src: Path, changed: Changed) -> None:
        """Record that `src` was processed successfully. Write out a message."""
        if changed is Changed.YES:
            if self.verbose or not self.quiet:
                verb = "would reformat" if self.check else "reformatted"
                out(f"{verb} {src}")
            self.change_count += 1
            return

        if self.verbose:
            reason = (
                "already well formatted, good job."
                if changed is Changed.NO
                else "wasn't modified on disk since last run."
            )
            out(f"{src} {reason}", bold=False)
        self.same_count += 1

    def failed(self, src: Path, message: str) -> None:
        """Record that `src` could not be reformatted. Write out a message."""
        err(f"error: cannot format {src}: {message}")
        self.failure_count += 1

    def path_ignored(self, path: Path, message: str) -> None:
        """Mention, in verbose mode only, that `path` was skipped and why."""
        if self.verbose:
            out(f"{path} ignored: {message}", bold=False)

    @property
    def return_code(self) -> int:
        """Return the exit code that the app should use.

        This considers the current state of changed files and failures:
        - if there were any failures, return 123;
        - if any files were changed and --check is being used, return 1;
        - otherwise return 0.
        """
        # According to http://tldp.org/LDP/abs/html/exitcodes.html starting with
        # 126 we have special returncodes reserved by the shell.
        if self.failure_count:
            return 123

        return 1 if (self.change_count and self.check) else 0

    def __str__(self) -> str:
        """Render a color report of the current state.

        Use `click.unstyle` to remove colors.
        """
        if self.check:
            reformatted, unchanged, failed = (
                "would be reformatted",
                "would be left unchanged",
                "would fail to reformat",
            )
        else:
            reformatted, unchanged, failed = (
                "reformatted",
                "left unchanged",
                "failed to reformat",
            )

        def counted(count: int, label: str) -> str:
            """Render e.g. "3 files reformatted", pluralizing as needed."""
            plural = "s" if count > 1 else ""
            return f"{count} file{plural} {label}"

        parts: List[str] = []
        if self.change_count:
            parts.append(
                click.style(counted(self.change_count, reformatted), bold=True)
            )
        if self.same_count:
            parts.append(counted(self.same_count, unchanged))
        if self.failure_count:
            parts.append(click.style(counted(self.failure_count, failed), fg="red"))
        return ", ".join(parts) + "."
3174
3175
def assert_equivalent(src: str, dst: str) -> None:
    """Raise AssertionError if `src` and `dst` don't parse to the same AST.

    Both strings are parsed with the running interpreter's `ast` module and
    their trees compared through a textual rendering.  A failure to parse
    either of them is reported as an AssertionError as well.
    """

    import ast
    import traceback

    absent = object()

    def _render(tree: ast.AST, level: int = 0) -> Iterator[str]:
        """Yield one line per node and field so that ASTs compare by content."""
        pad = "  " * level
        kind = tree.__class__.__name__
        yield f"{pad}{kind}("

        for name in sorted(tree._fields):
            value = getattr(tree, name, absent)
            if value is absent:
                continue

            yield f"{pad}  {name}="

            if isinstance(value, list):
                # Only AST nodes are rendered; other list items are skipped.
                for item in value:
                    if isinstance(item, ast.AST):
                        yield from _render(item, level + 2)

            elif isinstance(value, ast.AST):
                yield from _render(value, level + 2)

            else:
                yield f"{pad}    {value!r},  # {value.__class__.__name__}"

        yield f"{pad})  # /{kind}"

    try:
        src_ast = ast.parse(src)
    except Exception as exc:
        major, minor = sys.version_info[:2]
        raise AssertionError(
            f"cannot use --safe with this file; failed to parse source file "
            f"with Python {major}.{minor}'s builtin AST. Re-run with --fast "
            f"or stop using deprecated Python 2 syntax. AST error message: {exc}"
        )

    try:
        dst_ast = ast.parse(dst)
    except Exception as exc:
        # Keep the traceback and the offending output around for the bug report.
        log = dump_to_file("".join(traceback.format_tb(exc.__traceback__)), dst)
        raise AssertionError(
            f"INTERNAL ERROR: Black produced invalid code: {exc}. "
            f"Please report a bug on https://github.com/ambv/black/issues.  "
            f"This invalid output might be helpful: {log}"
        ) from None

    src_dump = "\n".join(_render(src_ast))
    dst_dump = "\n".join(_render(dst_ast))
    if src_dump == dst_dump:
        return

    log = dump_to_file(diff(src_dump, dst_dump, "src", "dst"))
    raise AssertionError(
        f"INTERNAL ERROR: Black produced code that is not equivalent to "
        f"the source.  "
        f"Please report a bug on https://github.com/ambv/black/issues.  "
        f"This diff might be helpful: {log}"
    ) from None
3237
3238
def assert_stable(
    src: str, dst: str, line_length: int, mode: FileMode = FileMode.AUTO_DETECT
) -> None:
    """Raise AssertionError if formatting `dst` again changes it.

    `dst` is run through `format_str()` with the given `line_length` and
    `mode`.  On a mismatch, the diffs source -> first pass and first pass ->
    second pass are dumped to a log file named in the error.
    """
    newdst = format_str(dst, line_length=line_length, mode=mode)
    if dst == newdst:
        return

    first_pass = diff(src, dst, "source", "first pass")
    second_pass = diff(dst, newdst, "first pass", "second pass")
    log = dump_to_file(first_pass, second_pass)
    raise AssertionError(
        f"INTERNAL ERROR: Black produced different code on the second pass "
        f"of the formatter.  "
        f"Please report a bug on https://github.com/ambv/black/issues.  "
        f"This diff might be helpful: {log}"
    ) from None
3255
3256
def dump_to_file(*output: str) -> str:
    """Write every string in `output` to a new temporary file and return its path.

    Each non-empty string is terminated with a newline if it doesn't already
    end with one.  The file (`blk_*.log`, UTF-8) is not deleted on close.
    """
    import tempfile

    log_file = tempfile.NamedTemporaryFile(
        mode="w", prefix="blk_", suffix=".log", delete=False, encoding="utf8"
    )
    with log_file:
        for chunk in output:
            if chunk and not chunk.endswith("\n"):
                chunk += "\n"
            log_file.write(chunk)
    return log_file.name
3269
3270
def diff(a: str, b: str, a_name: str, b_name: str) -> str:
    """Return a unified diff (5 lines of context) between strings `a` and `b`.

    `a_name` and `b_name` label the two sides in the diff header.
    """
    import difflib

    def as_lines(text: str) -> List[str]:
        # `unified_diff()` wants every line to carry its own line ending.
        return [line + "\n" for line in text.split("\n")]

    delta = difflib.unified_diff(
        as_lines(a), as_lines(b), fromfile=a_name, tofile=b_name, n=5
    )
    return "".join(delta)
3280
3281
def cancel(tasks: Iterable[asyncio.Task]) -> None:
    """asyncio signal handler: report the abort on stderr, then cancel `tasks`."""
    err("Aborted!")
    for pending in tasks:
        pending.cancel()
3287
3288
def shutdown(loop: BaseEventLoop) -> None:
    """Cancel all pending tasks on `loop`, wait for them, and close the loop.

    The loop is closed even when there is nothing to cancel or when waiting for
    the cancelled tasks raises.
    """
    try:
        # This part is borrowed from asyncio/runners.py in Python 3.7b2.
        # `asyncio.Task.all_tasks()` was removed in Python 3.9; the module-level
        # `asyncio.all_tasks()` replaces it from Python 3.7 on.
        all_tasks = getattr(asyncio, "all_tasks", None)
        if all_tasks is None:
            all_tasks = asyncio.Task.all_tasks  # type: ignore  # Python 3.6
        to_cancel = [task for task in all_tasks(loop) if not task.done()]
        if not to_cancel:
            return

        for task in to_cancel:
            task.cancel()
        # No `loop=` argument here: it was removed in Python 3.10, and
        # `gather()` takes the loop from the tasks it is given.
        loop.run_until_complete(asyncio.gather(*to_cancel, return_exceptions=True))
    finally:
        # `concurrent.futures.Future` objects cannot be cancelled once they
        # are already running. There might be some when the `shutdown()` happened.
        # Silence their logger's spew about the event loop being closed.
        cf_logger = logging.getLogger("concurrent.futures")
        cf_logger.setLevel(logging.CRITICAL)
        loop.close()
3309
3310
def sub_twice(regex: Pattern[str], replacement: str, original: str) -> str:
    """Apply `regex.sub(replacement, ...)` to `original` two times in a row.

    String normalization relies on the second pass to catch matches that
    overlapped with a match replaced during the first one.
    """
    first_pass = regex.sub(replacement, original)
    return regex.sub(replacement, first_pass)
3318
3319
def re_compile_maybe_verbose(regex: str) -> Pattern[str]:
    """Compile `regex`, switching to verbose mode when it spans several lines.

    Verbose mode is requested by prepending the inline `(?x)` flag.
    """
    pattern = "(?x)" + regex if "\n" in regex else regex
    return re.compile(pattern)
3328
3329
def enumerate_reversed(sequence: Sequence[T]) -> Iterator[Tuple[Index, T]]:
    """Yield `(index, element)` pairs of `sequence` from the last to the first.

    The indices are the elements' real positions, i.e. what
    `reversed(enumerate(sequence))` would give if that were possible.
    """
    descending = range(len(sequence) - 1, -1, -1)
    yield from zip(descending, reversed(sequence))
3336
3337
def enumerate_with_length(
    line: Line, reversed: bool = False
) -> Iterator[Tuple[Index, Leaf, int]]:
    """Yield `(index, leaf, length)` for the leaves of `line`.

    `length` covers the leaf's prefix and value plus the values of the comments
    `line.comments_after()` reports for it.  With `reversed` set, leaves come
    last to first.

    Stops prematurely at the first leaf whose value contains a newline
    (multiline strings).
    """
    indexed: Iterator[Tuple[Index, Leaf]]
    if reversed:
        indexed = enumerate_reversed(line.leaves)
    else:
        indexed = enumerate(line.leaves)

    for index, leaf in indexed:
        if "\n" in leaf.value:
            return  # Multiline strings, we can't continue.

        comment_length = sum(
            len(comment.value) for comment in line.comments_after(leaf, index)
        )
        yield index, leaf, len(leaf.prefix) + len(leaf.value) + comment_length
3359
3360
def is_line_short_enough(line: Line, *, line_length: int, line_str: str = "") -> bool:
    """Tell whether `line` fits within `line_length` characters.

    When `line_str` is given it is used as the rendering of `line`; otherwise
    the line is rendered here.  A rendering that contains a newline, or a line
    holding standalone comments, never counts as short enough.
    """
    rendered = line_str or str(line).strip("\n")
    if len(rendered) > line_length:
        return False

    if "\n" in rendered:
        # Multiline strings.
        return False

    return not line.contains_standalone_comments()
3373
3374
def can_be_split(line: Line) -> bool:
    """Return False when `line` *certainly* cannot be split.

    This is a cheap heuristic, not an exhaustive search.  It exists to avoid
    some unfortunate formattings, mostly unsplittable code getting wrapped in
    unnecessary parentheses.
    """
    leaves = line.leaves
    if len(leaves) < 2:
        return False

    starts_with_string_attribute = (
        leaves[0].type == token.STRING and leaves[1].type == token.DOT
    )
    if not starts_with_string_attribute:
        return True

    # NOTE(review): the reference leaf is never advanced while scanning, so
    # every check below compares against the final leaf of the line.  Kept as
    # is, since changing it would change formatting decisions.
    final_leaf = leaves[-1]
    calls = 0
    dots = 0
    for current in reversed(leaves[:-1]):
        kind = current.type
        if kind in OPENING_BRACKETS:
            if final_leaf.type not in CLOSING_BRACKETS:
                return False

            calls += 1
        elif kind == token.DOT:
            dots += 1
        elif kind == token.NAME:
            if (
                final_leaf.type != token.DOT
                and final_leaf.type not in OPENING_BRACKETS
            ):
                return False

        elif kind not in CLOSING_BRACKETS:
            return False

        if dots > 1 and calls > 1:
            return False

    return True
3409
3410
def can_omit_invisible_parens(line: Line, line_length: int) -> bool:
    """Decide whether `line` is safe to reformat without optional parentheses.

    True is returned only for a subset of the shapes that would look fine.  The
    point is to avoid false positives, which would end up producing lines that
    are too long.
    """
    tracker = line.bracket_tracker
    if not tracker.delimiters:
        # No delimiters at all: optional parentheses would serve no purpose.
        return True

    top_priority = tracker.max_delimiter_priority()
    if tracker.delimiter_count_with_priority(top_priority) > 1:
        # Several delimiters of the same kind read better inside parentheses.
        return False

    if top_priority == DOT_PRIORITY:
        # A single stranded method call doesn't need optional parentheses.
        return True

    leaves = line.leaves
    assert len(leaves) >= 2, "Stranded delimiter"

    first, second = leaves[0], leaves[1]
    penultimate, last = leaves[-2], leaves[-1]

    # Exactly one delimiter from here on: the parentheses may go if the
    # expression starts or ends with a bracket.
    if first.type in OPENING_BRACKETS and second.type not in CLOSING_BRACKETS:
        measuring = False
        width = 4 * line.depth
        for _index, leaf, leaf_width in enumerate_with_length(line):
            if leaf.type in CLOSING_BRACKETS and leaf.opening_bracket is first:
                # Start measuring at the bracket that closes the leading one.
                measuring = True
            if not measuring:
                continue

            width += leaf_width
            if width > line_length:
                break

            if leaf.type in OPENING_BRACKETS:
                # Another bracket pair we could split on; stop measuring.
                measuring = False

        else:
            # The loop ran out without exceeding the limit; accept only if it
            # actually reached the last leaf.
            if len(leaves) == _index + 1:
                return True

        # No `return False` here on purpose: the line may have *both* a leading
        # opening bracket and a trailing closing bracket, and the trailing one
        # may still satisfy the rule below.

    if last.type not in (token.RPAR, token.RBRACE):
        # A closing square bracket only qualifies when it is not indexing
        # (its parent is not a trailer); omitting the parentheses around
        # indexing looks weird.
        non_indexing_rsqb = (
            last.type == token.RSQB
            and last.parent
            and last.parent.type != syms.trailer
        )
        if not non_indexing_rsqb:
            return False

    if penultimate.type in OPENING_BRACKETS:
        # Empty brackets don't help.
        return False

    if is_multiline_string(first):
        # Wrapping a multiline string any further is unnecessary here.
        return True

    width = 4 * line.depth
    seen_other_brackets = False
    for _index, leaf, leaf_width in enumerate_with_length(line):
        width += leaf_width
        if leaf is last.opening_bracket:
            if seen_other_brackets or width <= line_length:
                return True

        elif leaf.type in OPENING_BRACKETS:
            # There are brackets we can further split on.
            seen_other_brackets = True

    return False
3498
3499
def get_cache_file(line_length: int, mode: FileMode) -> Path:
    """Return the path of the cache file used for `line_length` and `mode`."""
    file_name = f"cache.{line_length}.{mode.value}.pickle"
    return CACHE_DIR / file_name
3502
3503
def read_cache(line_length: int, mode: FileMode) -> Cache:
    """Read the cache if it exists and is well formed.

    Returns an empty cache when the cache file is missing, cannot be unpickled
    (corrupted, truncated, empty, or written by an incompatible version), or
    does not contain a dictionary.  In those cases the call to write_cache
    later should resolve the issue.
    """
    cache_file = get_cache_file(line_length, mode)
    if not cache_file.exists():
        return {}

    # NOTE: unpickling executes whatever the file describes, so the cache is
    # only as trustworthy as the cache directory it lives in.
    with cache_file.open("rb") as fobj:
        try:
            cache: Cache = pickle.load(fobj)
        except (
            pickle.UnpicklingError,
            EOFError,  # empty or truncated file
            ValueError,
            IndexError,
            AttributeError,  # pickled names that no longer exist
            ImportError,
        ):
            return {}

    if not isinstance(cache, dict):
        # A valid pickle of the wrong shape is as useless as a corrupted one.
        return {}

    return cache
3520
3521
def get_cache_info(path: Path) -> CacheInfo:
    """Return the `(mtime, size)` pair used to tell if `path` changed on disk."""
    file_stat = path.stat()
    modified_at, size = file_stat.st_mtime, file_stat.st_size
    return modified_at, size
3526
3527
def filter_cached(cache: Cache, sources: Iterable[Path]) -> Tuple[Set[Path], Set[Path]]:
    """Partition the paths in `sources` into two sets of resolved paths.

    The first set holds files whose current cache info differs from the entry
    in `cache`, or that have no entry at all.  The second set holds files whose
    cache info matches, i.e. files that were not modified.
    """
    changed: Set[Path] = set()
    unchanged: Set[Path] = set()
    for source in sources:
        resolved = source.resolve()
        is_current = cache.get(resolved) == get_cache_info(resolved)
        bucket = unchanged if is_current else changed
        bucket.add(resolved)
    return changed, unchanged
3542
3543
def write_cache(
    cache: Cache, sources: Iterable[Path], line_length: int, mode: FileMode
) -> None:
    """Update the cache file.

    The entries of `cache` are merged with fresh cache info for every path in
    `sources` and pickled to the cache file for `line_length` and `mode`.

    The data is first written to a temporary file in the same directory and
    then moved over the cache file, so an interrupted or concurrent run never
    leaves a half-written cache behind.  Writing is best effort: any OSError is
    ignored because a missing cache only costs a re-check later.
    """
    import tempfile

    cache_file = get_cache_file(line_length, mode)
    tmp_path: Optional[str] = None
    try:
        # `exist_ok` avoids failing when another process creates the directory
        # between a check and the creation.
        CACHE_DIR.mkdir(parents=True, exist_ok=True)
        new_cache = {**cache, **{src.resolve(): get_cache_info(src) for src in sources}}
        with tempfile.NamedTemporaryFile(
            dir=str(cache_file.parent), delete=False
        ) as fobj:
            tmp_path = fobj.name
            pickle.dump(new_cache, fobj, protocol=pickle.HIGHEST_PROTOCOL)
        os.replace(tmp_path, str(cache_file))
        tmp_path = None  # The temporary file is now the cache file.
    except OSError:
        pass
    finally:
        if tmp_path is not None:
            # Something failed after the temporary file was created; don't
            # leave it lying around in the cache directory.
            try:
                os.unlink(tmp_path)
            except OSError:
                pass
3557
3558
def patch_click() -> None:
    """Make Click not crash.

    On certain misconfigured environments, Python 3 selects the ASCII encoding as the
    default which restricts paths that it can access during the lifetime of the
    application.  Click refuses to work in this scenario by raising a RuntimeError.

    In case of Black the likelihood that non-ASCII characters are going to be used in
    file paths is minimal since it's Python source code.  Moreover, this crash was
    spurious on Python 3.7 thanks to PEP 538 and PEP 540.

    Every Click module that exposes `_verify_python3_env` gets it replaced with a
    no-op.  The modules are imported independently and any ImportError is tolerated:
    they are private to Click, so an installed Click may lack one of them, and that
    must not prevent patching the other or crash Black at startup.
    """
    modules: List[Any] = []
    try:
        from click import core
    except ImportError:
        pass
    else:
        modules.append(core)

    try:
        # `from package import missing_name` raises a plain ImportError, not
        # ModuleNotFoundError, when the package itself is importable.
        from click import _unicodefun  # type: ignore
    except ImportError:
        pass
    else:
        modules.append(_unicodefun)

    for module in modules:
        if hasattr(module, "_verify_python3_env"):
            module._verify_python3_env = lambda: None
3579
3580
if __name__ == "__main__":
    # Executed as a script: neutralize Click's Python 3 environment check first,
    # then hand control to `main()`.
    patch_click()
    main()