Action: Support running in a docker container (#2748)

[etc/vim.git] / src / black_primer / lib.py
diff --git a/src/black_primer/lib.py b/src/black_primer/lib.py

index 3ce383f17ce2b1b6ef7d2509b66e3c364e784f9e..13724f431ce81c9ad0651dc9f715e38b0c4057fe 100644 (file)
--- a/src/black_primer/lib.py
+++ b/src/black_primer/lib.py
@@ -12,12 +12,23 @@ from shutil import rmtree, which
  from subprocess import CalledProcessError
  from sys import version_info
  from tempfile import TemporaryDirectory
-from typing import Any, Callable, Dict, NamedTuple, Optional, Sequence, Tuple
+from typing import (
+    Any,
+    Callable,
+    Dict,
+    List,
+    NamedTuple,
+    Optional,
+    Sequence,
+    Tuple,
+    Union,
+)
  from urllib.parse import urlparse
  
  import click
  
  
+TEN_MINUTES_SECONDS = 600
  WINDOWS = system() == "Windows"
  BLACK_BINARY = "black.exe" if WINDOWS else "black"
  GIT_BINARY = "git.exe" if WINDOWS else "git"
@@ -39,19 +50,21 @@ class Results(NamedTuple):
  
  async def _gen_check_output(
      cmd: Sequence[str],
-    timeout: float = 300,
+    timeout: float = TEN_MINUTES_SECONDS,
      env: Optional[Dict[str, str]] = None,
      cwd: Optional[Path] = None,
+    stdin: Optional[bytes] = None,
  ) -> Tuple[bytes, bytes]:
      process = await asyncio.create_subprocess_exec(
          *cmd,
+        stdin=asyncio.subprocess.PIPE,
          stdout=asyncio.subprocess.PIPE,
          stderr=asyncio.subprocess.STDOUT,
          env=env,
          cwd=cwd,
      )
      try:
-        (stdout, stderr) = await asyncio.wait_for(process.communicate(), timeout)
+        (stdout, stderr) = await asyncio.wait_for(process.communicate(stdin), timeout)
      except asyncio.TimeoutError:
          process.kill()
          await process.wait()
@@ -75,6 +88,18 @@ def analyze_results(project_count: int, results: Results) -> int:
      failed_pct = round(((results.stats["failed"] / project_count) * 100), 2)
      success_pct = round(((results.stats["success"] / project_count) * 100), 2)
  
+    if results.failed_projects:
+        click.secho("\nFailed projects:\n", bold=True)
+
+    for project_name, project_cpe in results.failed_projects.items():
+        print(f"## {project_name}:")
+        print(f" - Returned {project_cpe.returncode}")
+        if project_cpe.stderr:
+            print(f" - stderr:\n{project_cpe.stderr.decode('utf8')}")
+        if project_cpe.stdout:
+            print(f" - stdout:\n{project_cpe.stdout.decode('utf8')}")
+        print("")
+
      click.secho("-- primer results 📊 --\n", bold=True)
      click.secho(
          f"{results.stats['success']} / {project_count} succeeded ({success_pct}%) ✅",
@@ -97,46 +122,79 @@ def analyze_results(project_count: int, results: Results) -> int:
      )
  
      if results.failed_projects:
-        click.secho("\nFailed projects:\n", bold=True)
-
-    for project_name, project_cpe in results.failed_projects.items():
-        print(f"## {project_name}:")
-        print(f" - Returned {project_cpe.returncode}")
-        if project_cpe.stderr:
-            print(f" - stderr:\n{project_cpe.stderr.decode('utf8')}")
-        if project_cpe.stdout:
-            print(f" - stdout:\n{project_cpe.stdout.decode('utf8')}")
-        print("")
+        failed = ", ".join(results.failed_projects.keys())
+        click.secho(f"\nFailed projects: {failed}\n", bold=True)
  
      return results.stats["failed"]
  
  
+def _flatten_cli_args(cli_args: List[Union[Sequence[str], str]]) -> List[str]:
+    """Allow a user to split long arguments into a list of strs,
+    which are joined back into one argument, to keep the JSON human readable"""
+    flat_args = []
+    for arg in cli_args:
+        if isinstance(arg, str):
+            flat_args.append(arg)
+            continue
+
+        args_as_str = "".join(arg)
+        flat_args.append(args_as_str)
+
+    return flat_args
+
+
  async def black_run(
-    repo_path: Path,
+    project_name: str,
+    repo_path: Optional[Path],
      project_config: Dict[str, Any],
      results: Results,
      no_diff: bool = False,
  ) -> None:
      """Run Black and record failures"""
+    if not repo_path:
+        results.stats["failed"] += 1
+        results.failed_projects[project_name] = CalledProcessError(
+            69, [], f"{project_name} has no repo_path: {repo_path}".encode(), b""
+        )
+        return
+
+    stdin_test = project_name.upper() == "STDIN"
      cmd = [str(which(BLACK_BINARY))]
      if "cli_arguments" in project_config and project_config["cli_arguments"]:
-        cmd.extend(project_config["cli_arguments"])
+        cmd.extend(_flatten_cli_args(project_config["cli_arguments"]))
      cmd.append("--check")
-    if no_diff:
-        cmd.append(".")
+    if not no_diff:
+        cmd.append("--diff")
+
+    # Work out if we should read in a Python file or search from cwd
+    stdin = None
+    if stdin_test:
+        cmd.append("-")
+        stdin = repo_path.read_bytes()
+    elif "base_path" in project_config:
+        cmd.append(project_config["base_path"])
      else:
-        cmd.extend(["--diff", "."])
+        cmd.append(".")
  
+    timeout = (
+        project_config["timeout_seconds"]
+        if "timeout_seconds" in project_config
+        else TEN_MINUTES_SECONDS
+    )
      with TemporaryDirectory() as tmp_path:
-        # Prevent reading top-level user configs by manipulating envionment variables
+        # Prevent reading top-level user configs by manipulating environment variables
          env = {
              **os.environ,
              "XDG_CONFIG_HOME": tmp_path,  # Unix-like
              "USERPROFILE": tmp_path,  # Windows (changes `Path.home()` output)
          }
  
+        cwd_path = repo_path.parent if stdin_test else repo_path
          try:
-            _stdout, _stderr = await _gen_check_output(cmd, cwd=repo_path, env=env)
+            LOG.debug(f"Running black for {project_name}: {' '.join(cmd)}")
+            _stdout, _stderr = await _gen_check_output(
+                cmd, cwd=cwd_path, env=env, stdin=stdin, timeout=timeout
+            )
          except asyncio.TimeoutError:
              results.stats["failed"] += 1
              LOG.error(f"Running black for {repo_path} timed out ({cmd})")
@@ -204,7 +262,7 @@ async def git_checkout_or_rebase(
  
  
  def handle_PermissionError(
-    func: Callable, path: Path, exc: Tuple[Any, Any, Any]
+    func: Callable[..., None], path: Path, exc: Tuple[Any, Any, Any]
  ) -> None:
      """
      Handle PermissionError during shutil.rmtree.
@@ -229,16 +287,16 @@ def handle_PermissionError(
  
  async def load_projects_queue(
      config_path: Path,
+    projects_to_run: List[str],
  ) -> Tuple[Dict[str, Any], asyncio.Queue]:
      """Load project config and fill queue with all the project names"""
      with config_path.open("r") as cfp:
          config = json.load(cfp)
  
      # TODO: Offer more options here
-    # e.g. Run on X random packages or specific sub list etc.
-    project_names = sorted(config["projects"].keys())
-    queue: asyncio.Queue = asyncio.Queue(maxsize=len(project_names))
-    for project in project_names:
+    # e.g. Run on X random packages etc.
+    queue: asyncio.Queue = asyncio.Queue(maxsize=len(projects_to_run))
+    for project in projects_to_run:
          await queue.put(project)
  
      return config, queue
@@ -289,12 +347,15 @@ async def project_runner(
              LOG.debug(f"Skipping {project_name} as it's configured as a long checkout")
              continue
  
-        repo_path = await git_checkout_or_rebase(work_path, project_config, rebase)
-        if not repo_path:
-            continue
-        await black_run(repo_path, project_config, results, no_diff)
+        repo_path: Optional[Path] = Path(__file__)
+        stdin_project = project_name.upper() == "STDIN"
+        if not stdin_project:
+            repo_path = await git_checkout_or_rebase(work_path, project_config, rebase)
+            if not repo_path:
+                continue
+        await black_run(project_name, repo_path, project_config, results, no_diff)
  
-        if not keep:
+        if not keep and not stdin_project:
              LOG.debug(f"Removing {repo_path}")
              rmtree_partial = partial(
                  rmtree, path=repo_path, onerror=handle_PermissionError
@@ -308,6 +369,7 @@ async def process_queue(
      config_file: str,
      work_path: Path,
      workers: int,
+    projects_to_run: List[str],
      keep: bool = False,
      long_checkouts: bool = False,
      rebase: bool = False,
@@ -326,7 +388,7 @@ async def process_queue(
      results.stats["success"] = 0
      results.stats["wrong_py_ver"] = 0
  
-    config, queue = await load_projects_queue(Path(config_file))
+    config, queue = await load_projects_queue(Path(config_file), projects_to_run)
      project_count = queue.qsize()
      s = "" if project_count == 1 else "s"
      LOG.info(f"{project_count} project{s} to run Black over")