crosvm/tools/impl/command.py
Dennis Kempin 11a48d4cca tools: refactoring: Split common.py into multiple files
This is a refactoring with no functionality change. The common.py
file is split up so we will be able to use the parts that have no
third party dependencies separately.

For now, keep common.py and re-export everything, so we do not
introduce issues in other tools.

BUG=b:267499599
TEST=presubmit

Change-Id: Idf6d45bd90f5cf448fb9dd88df540af3da0f7f88
Reviewed-on: https://chromium-review.googlesource.com/c/crosvm/crosvm/+/4482141
Reviewed-by: Zihan Chen <zihanchen@google.com>
Commit-Queue: Dennis Kempin <denniskempin@google.com>
2023-05-02 17:04:27 +00:00

612 lines
18 KiB
Python

#!/usr/bin/env python3
# Copyright 2023 The ChromiumOS Authors
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
"""
Provides helpers for writing shell-like scripts in Python.
It provides tools to execute commands with similar flexibility as shell scripts.
"""
import contextlib
import json
import os
import re
import shlex
import subprocess
import sys
from copy import deepcopy
from math import ceil
from multiprocessing.pool import ThreadPool
from pathlib import Path
from subprocess import DEVNULL, PIPE, STDOUT # type: ignore
from typing import (
Any,
Callable,
Dict,
Iterable,
List,
NamedTuple,
Optional,
TypeVar,
Union,
)
from .util import verbose, very_verbose, color_enabled
PathLike = Union[Path, str]
# Regex that matches ANSI escape sequences
ANSI_ESCAPE = re.compile(r"\x1B(?:[@-Z\\-_]|\[[0-?]*[ -/]*[@-~])")
class CommandResult(NamedTuple):
"""Results of a command execution as returned by Command.run()"""
stdout: str
stderr: str
returncode: int
class Command(object):
"""
Simplified subprocess handling for shell-like scripts.
## Example Usage
To run a program on behalf of the user:
>> cmd("cargo build").fg()
This will run the program with stdio passed to the user. Developer tools usually run a set of
actions on behalf of the user. These should be executed with fg().
To make calls in the background to gather information use success/stdout/lines:
>> cmd("git branch").lines()
>> cmd("git rev-parse foo").success()
These will capture all program output. Try to avoid using these to run mutating commands,
as they will remain hidden to the user even when using --verbose.
## Arguments
Arguments are provided as a list similar to subprocess.run():
>>> Command('cargo', 'build', '--workspace')
Command('cargo', 'build', '--workspace')
In contrast to subprocess.run, all strings are split by whitespaces similar to bash:
>>> Command('cargo build --workspace', '--features foo')
Command('cargo', 'build', '--workspace', '--features', 'foo')
In contrast to bash, globs are *not* evaluated, but can easily be provided using Path:
>>> Command('ls -l', *Path(CROSVM_ROOT).glob('*.toml'))
Command('ls', '-l', ...)
None or False are ignored to make it easy to include conditional arguments:
>>> all = False
>>> Command('cargo build', '--workspace' if all else None)
Command('cargo', 'build')
## Nesting
Commands can be nested, similar to $() subshells in bash. The sub-commands will be executed
right away and their output will undergo the usual splitting:
>>> Command('printf "(%s)"', Command('echo foo bar')).stdout()
'(foo)(bar)'
Arguments can be explicitly quoted to prevent splitting, it applies to both sub-commands
as well as strings:
>>> Command('printf "(%s)"', quoted(Command('echo foo bar'))).stdout()
'(foo bar)'
Commands can also be piped into one another:
>>> wc = Command('wc')
>>> Command('echo "abcd"').pipe(wc('-c')).stdout()
'5'
## Verbosity
The --verbose flag is intended for users and will show all command lines executed in the
foreground with fg(), it'll also include output of programs run with fg(quiet=True). Commands
executed in the background are not shown.
For script developers, the --very-verbose flag will print full details and output of all
executed command lines, including those run hidden from the user.
"""
def __init__(
self,
*args: Any,
stdin_cmd: Optional["Command"] = None,
env_vars: Dict[str, str] = {},
cwd: Optional[Path] = None,
):
self.args = Command.__parse_cmd(args)
self.stdin_cmd = stdin_cmd
self.env_vars = env_vars
self.cwd = cwd
### Builder API to construct commands
def with_args(self, *args: Any):
"""Returns a new Command with added arguments.
>>> cargo = Command('cargo')
>>> cargo.with_args('clippy')
Command('cargo', 'clippy')
"""
cmd = deepcopy(self)
cmd.args = [*self.args, *Command.__parse_cmd(args)]
return cmd
def with_cwd(self, cwd: Optional[Path]):
"""Changes the working directory the command is executed in.
>>> cargo = Command('pwd')
>>> cargo.with_cwd('/tmp').stdout()
'/tmp'
"""
cmd = deepcopy(self)
cmd.cwd = cwd
return cmd
def __call__(self, *args: Any):
"""Shorthand for Command.with_args"""
return self.with_args(*args)
def with_env(self, key: str, value: Optional[str]):
"""
Returns a command with an added env variable.
The variable is removed if value is None.
"""
return self.with_envs({key: value})
def with_envs(self, envs: Union[Dict[str, Optional[str]], Dict[str, str]]):
"""
Returns a command with an added env variable.
The variable is removed if value is None.
"""
cmd = deepcopy(self)
for key, value in envs.items():
if value is not None:
cmd.env_vars[key] = value
else:
if key in cmd.env_vars:
del cmd.env_vars[key]
return cmd
def with_path_env(self, new_path: str):
"""Returns a command with a path added to the PATH variable."""
path_var = self.env_vars.get("PATH", os.environ.get("PATH", ""))
return self.with_env("PATH", f"{path_var}:{new_path}")
def with_color_arg(
self,
always: Optional[str] = None,
never: Optional[str] = None,
):
"""Returns a command with an argument added to pass through enabled/disabled colors."""
new_cmd = self
if color_enabled():
if always:
new_cmd = new_cmd(always)
else:
if never:
new_cmd = new_cmd(never)
return new_cmd
def with_color_env(self, var_name: str):
"""Returns a command with an env var added to pass through enabled/disabled colors."""
return self.with_env(var_name, "1" if color_enabled() else "0")
def with_color_flag(self, flag: str = "--color"):
"""Returns a command with an added --color=always/never/auto flag."""
return self.with_color_arg(always=f"{flag}=always", never=f"{flag}=never")
def foreach(self, arguments: Iterable[Any], batch_size: int = 1):
"""
Yields a new command for each entry in `arguments`.
The argument is appended to each command and is intended to be used in
conjunction with `parallel()` to execute a command on a list of arguments in
parallel.
>>> parallel(*cmd('echo').foreach((1, 2, 3))).stdout()
['1', '2', '3']
Arguments can also be batched by setting batch_size > 1, which will append multiple
arguments to each command.
>>> parallel(*cmd('echo').foreach((1, 2, 3), batch_size=2)).stdout()
['1 2', '3']
"""
for batch in batched(arguments, batch_size):
yield self(*batch)
def pipe(self, *args: Any):
"""
Pipes the output of this command into another process.
The target can either be another Command or the argument list to build a new command.
"""
if len(args) == 1 and isinstance(args[0], Command):
cmd = Command(stdin_cmd=self)
cmd.args = args[0].args
cmd.env_vars = self.env_vars.copy()
return cmd
else:
return Command(*args, stdin_cmd=self, env_vars=self.env_vars)
### Executing programs in the foreground
def run_foreground(
self,
quiet: bool = False,
check: bool = True,
dry_run: bool = False,
style: Optional[Callable[["subprocess.Popen[str]"], None]] = None,
):
"""
Runs a program in the foreground with output streamed to the user.
>>> Command('true').fg()
0
Non-zero exit codes will trigger an Exception
>>> Command('false').fg()
Traceback (most recent call last):
...
subprocess.CalledProcessError...
But can be disabled:
>>> Command('false').fg(check=False)
1
Output can be hidden by setting quiet=True:
>>> Command("echo foo").fg(quiet=True)
0
This will hide the programs stdout and stderr unless the program fails.
More sophisticated means of outputting stdout/err are available via `Styles`:
>>> Command("echo foo").fg(style=Styles.live_truncated())
foo
0
Will output the results of the command but truncate output after a few lines. See `Styles`
for more options.
Arguments:
quiet: Do not show stdout/stderr unless the program failed.
check: Raise an exception if the program returned an error code.
style: A function to present the output of the program. See `Styles`
Returns: The return code of the program.
"""
if dry_run:
print(f"Not running: {self}")
return 0
if quiet:
def quiet_style(process: "subprocess.Popen[str]"):
"Won't print anything unless the command failed."
assert process.stdout
stdout = process.stdout.read()
if process.wait() != 0:
print(stdout, end="")
style = quiet_style
if verbose():
print(f"$ {self}")
if style is None or verbose():
return self.__run(stdout=None, stderr=None, check=check).returncode
else:
process = self.popen(stdout=PIPE, stderr=STDOUT)
style(process)
returncode = process.wait()
if returncode != 0 and check:
assert process.stdout
raise subprocess.CalledProcessError(returncode, process.args)
return returncode
def fg(
self,
quiet: bool = False,
check: bool = True,
dry_run: bool = False,
style: Optional[Callable[["subprocess.Popen[str]"], None]] = None,
):
"""
Shorthand for Command.run_foreground()
"""
return self.run_foreground(quiet, check, dry_run, style)
def write_to(self, filename: Path):
"""
Writes stdout to the provided file.
"""
if verbose():
print(f"$ {self} > {filename}")
with open(filename, "w") as file:
file.write(self.__run(stdout=PIPE, stderr=PIPE).stdout)
def append_to(self, filename: Path):
"""
Appends stdout to the provided file.
"""
if verbose():
print(f"$ {self} >> {filename}")
with open(filename, "a") as file:
file.write(self.__run(stdout=PIPE, stderr=PIPE).stdout)
### API for executing commands hidden from the user
def success(self):
"""
Returns True if the program succeeded (i.e. returned 0).
The program will not be visible to the user unless --very-verbose is specified.
"""
if very_verbose():
print(f"$ {self}")
return self.__run(stdout=PIPE, stderr=PIPE, check=False).returncode == 0
def stdout(self, check: bool = True, stderr: int = PIPE):
"""
Runs a program and returns stdout.
The program will not be visible to the user unless --very-verbose is specified.
"""
if very_verbose():
print(f"$ {self}")
return self.__run(stdout=PIPE, stderr=stderr, check=check).stdout.strip()
def json(self, check: bool = True) -> Any:
"""
Runs a program and returns stdout parsed as json.
The program will not be visible to the user unless --very-verbose is specified.
"""
stdout = self.stdout(check=check)
if stdout:
return json.loads(stdout)
else:
return None
def lines(self, check: bool = True, stderr: int = PIPE):
"""
Runs a program and returns stdout line by line.
The program will not be visible to the user unless --very-verbose is specified.
"""
return self.stdout(check=check, stderr=stderr).splitlines()
### Utilities
def __str__(self):
stdin = ""
if self.stdin_cmd:
stdin = str(self.stdin_cmd) + " | "
return stdin + shlex.join(self.args)
def __repr__(self):
stdin = ""
if self.stdin_cmd:
stdin = ", stdin_cmd=" + repr(self.stdin_cmd)
return f"Command({', '.join(repr(a) for a in self.args)}{stdin})"
### Private implementation details
def __run(
self,
stdout: Optional[int],
stderr: Optional[int],
check: bool = True,
) -> CommandResult:
"Run this command in subprocess.run()"
if very_verbose():
print(f"cwd: {Path().resolve()}")
for k, v in self.env_vars.items():
print(f"env: {k}={v}")
result = subprocess.run(
self.args,
cwd=self.cwd,
stdout=stdout,
stderr=stderr,
stdin=self.__stdin_stream(),
env={**os.environ, **self.env_vars},
check=check,
text=True,
)
if very_verbose():
if result.stdout:
for line in result.stdout.splitlines():
print("stdout:", line)
if result.stderr:
for line in result.stderr.splitlines():
print("stderr:", line)
print("returncode:", result.returncode)
if check and result.returncode != 0:
raise subprocess.CalledProcessError(result.returncode, str(self), result.stdout)
return CommandResult(result.stdout, result.stderr, result.returncode)
def __stdin_stream(self):
if self.stdin_cmd:
return self.stdin_cmd.popen(stdout=PIPE, stderr=PIPE).stdout
return None
def popen(self, **kwargs: Any) -> "subprocess.Popen[str]":
"""
Runs a program and returns the Popen object of the running process.
"""
return subprocess.Popen(
self.args,
cwd=self.cwd,
stdin=self.__stdin_stream(),
env={**os.environ, **self.env_vars},
text=True,
**kwargs,
)
@staticmethod
def __parse_cmd(args: Iterable[Any]) -> List[str]:
"""Parses command line arguments for Command."""
res = [parsed for arg in args for parsed in Command.__parse_cmd_args(arg)]
return res
@staticmethod
def __parse_cmd_args(arg: Any) -> List[str]:
"""Parses a mixed type command line argument into a list of strings."""
if isinstance(arg, Path):
return [str(arg)]
elif isinstance(arg, QuotedString):
return [arg.value]
elif isinstance(arg, Command):
return [*shlex.split(arg.stdout())]
elif arg is None or arg is False:
return []
else:
return [*shlex.split(str(arg))]
class ParallelCommands(object):
"""
Allows commands to be run in parallel.
>>> parallel(cmd('true'), cmd('false')).fg(check=False)
[0, 1]
>>> parallel(cmd('echo a'), cmd('echo b')).stdout()
['a', 'b']
"""
def __init__(self, *commands: Command):
self.commands = commands
def fg(self, quiet: bool = False, check: bool = True):
with ThreadPool(1 if very_verbose() else os.cpu_count()) as pool:
return pool.map(lambda command: command.fg(quiet=quiet, check=check), self.commands)
def stdout(self):
with ThreadPool(1 if very_verbose() else os.cpu_count()) as pool:
return pool.map(lambda command: command.stdout(), self.commands)
def success(self):
results = self.fg(check=False, quiet=True)
return all(result == 0 for result in results)
class Remote(object):
"""
Wrapper around the cmd() API and allow execution of commands via SSH."
"""
def __init__(self, host: str, opts: Dict[str, str]):
self.host = host
ssh_opts = [f"-o{k}={v}" for k, v in opts.items()]
self.ssh_cmd = cmd("ssh", host, "-T", *ssh_opts)
self.scp_cmd = cmd("scp", *ssh_opts)
def ssh(self, cmd: Command, remote_cwd: Optional[Path] = None):
# Use huponexit to ensure the process is killed if the connection is lost.
# Use shlex to properly quote the command.
wrapped_cmd = f"bash -O huponexit -c {shlex.quote(str(cmd))}"
if remote_cwd is not None:
wrapped_cmd = f"cd {remote_cwd} && {wrapped_cmd}"
# The whole command to pass it to SSH for remote execution.
return self.ssh_cmd.with_args(quoted(wrapped_cmd))
def scp(self, sources: List[Path], target: str, quiet: bool = False):
return self.scp_cmd.with_args(*sources, f"{self.host}:{target}").fg(quiet=quiet)
@contextlib.contextmanager
def cwd_context(path: PathLike):
"""Context for temporarily changing the cwd.
>>> with cwd('/tmp'):
... os.getcwd()
'/tmp'
"""
cwd = os.getcwd()
try:
chdir(path)
yield
finally:
chdir(cwd)
def chdir(path: PathLike):
if very_verbose():
print("cd", path)
os.chdir(path)
class QuotedString(object):
"""
Prevents the provided string from being split.
Commands will be executed and their stdout is quoted.
"""
def __init__(self, value: Any):
if isinstance(value, Command):
self.value = value.stdout()
else:
self.value = str(value)
def __str__(self):
return f'"{self.value}"'
T = TypeVar("T")
def batched(source: Iterable[T], max_batch_size: int) -> Iterable[List[T]]:
"""
Returns an iterator over batches of elements from source_list.
>>> list(batched([1, 2, 3, 4, 5], 2))
[[1, 2], [3, 4], [5]]
"""
source_list = list(source)
# Calculate batch size that spreads elements evenly across all batches
batch_count = ceil(len(source_list) / max_batch_size)
batch_size = ceil(len(source_list) / batch_count)
for index in range(0, len(source_list), batch_size):
yield source_list[index : min(index + batch_size, len(source_list))]
# Shorthands
quoted = QuotedString
cmd = Command
cwd = cwd_context
parallel = ParallelCommands
if __name__ == "__main__":
import doctest
(failures, num_tests) = doctest.testmod(optionflags=doctest.ELLIPSIS)
sys.exit(1 if failures > 0 else 0)