Add a benchmark for the Azure CLI. #90

Open. Wants to merge 13 commits into main.

11 changes: 11 additions & 0 deletions doc/benchmarks.rst
@@ -54,6 +54,17 @@ depending on the Python version.
them, and more generally to not modify them.


azure_cli
---------

Exercise the `Azure CLI <https://github.com/Azure/azure-cli>`_ in a very
rough approximation of a regular usage workload. (At the moment we run
a small subset of the azure-cli test suite.)

Note that the related ``azure_cli_tests`` and ``azure_cli_verify`` benchmarks
are similar to ``azure_cli`` but take much longer to run (on the order of
10-20 minutes).
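
For example (assuming pyperformance's usual benchmark selection interface),
the benchmark can be run on its own with
``pyperformance run --benchmarks azure_cli``.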


chameleon
---------

2 changes: 2 additions & 0 deletions pyperformance/.gitignore
@@ -0,0 +1,2 @@

azure-cli
48 changes: 46 additions & 2 deletions pyperformance/benchmarks/__init__.py
@@ -1,12 +1,15 @@
import logging

from pyperformance.cli import fast_requested
from pyperformance.run import run_perf_script


# Benchmark groups. The "default" group is what's run if no -b option is
# specified.
DEFAULT_GROUP = [
'2to3',
'azure_cli',
# Note that azure_cli_tests and azure_cli_verify are left out. (They're really slow.)
'chameleon',
'chaos',
'crypto_pyaes',
@@ -73,16 +76,55 @@
"pickle", "unpickle",
"xml_etree",
"json_dumps", "json_loads"],
"apps": ["2to3", "chameleon", "html5lib", "tornado_http"],
"apps": ["2to3", "chameleon", "html5lib", "tornado_http", "azure_cli"],
"math": ["float", "nbody", "pidigits"],
"template": ["django_template", "mako"],
"slow": [],
}


def slow(func):
"""A decorator to mark a benchmark as slow."""
if not func.__name__.startswith("BM_"):
raise NotImplementedError(func)
name = func.__name__[3:].lower()
BENCH_GROUPS["slow"].append(name)
return func


def maybe_slow(func):
return func if fast_requested() else slow(func)
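

# For example, decorating BM_azure_cli_tests below adds "azure_cli_tests" to
# BENCH_GROUPS["slow"] (unless --fast was requested), which in turn keeps it
# out of the "fast" group assembled in get_benchmarks().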


def BM_2to3(python, options):
return run_perf_script(python, options, "2to3")


def BM_azure_cli(python, options):
return run_perf_script(python, options, "azure_cli",
extra_args=[
"--install",
])


@maybe_slow
def BM_azure_cli_tests(python, options):
return run_perf_script(python, options, "azure_cli",
extra_args=[
"--install",
"--kind", "tests",
])


@maybe_slow
def BM_azure_cli_verify(python, options):
return run_perf_script(python, options, "azure_cli",
extra_args=[
"--install",
"--kind", "verify",
])
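

# Note: the azure_cli benchmarks above delegate to benchmarks/bm_azure_cli.py
# via run_perf_script(); the extra_args are assumed to be passed through to
# that script's own argument parser (see its --install and --kind options).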


# def BM_hg_startup(python, options):
# return run_perf_script(python, options, "hg_startup")

@@ -127,7 +169,6 @@ def BM_unpickle(python, options):
def BM_pickle_list(python, options):
return pickle_benchmark(python, options, "pickle_list")


def BM_pickle_dict(python, options):
return pickle_benchmark(python, options, "pickle_dict")

@@ -296,6 +337,9 @@ def get_benchmarks():

# create the 'all' group
bench_groups["all"] = sorted(bench_funcs)
bench_groups["fast"] = [name
for name in bench_groups["all"]
if name not in bench_groups["slow"]]

return (bench_funcs, bench_groups)

282 changes: 282 additions & 0 deletions pyperformance/benchmarks/bm_azure_cli.py
@@ -0,0 +1,282 @@
"""Test the performance of the Azure CLI.

Running a subset of the azure-cli test suite serves as a rough proxy for
regular usage of the CLI.
"""

# The code for this benchmark is based on the manual steps defined
# for the azure-cli repo.

# See:
# - azure-pipelines.yml
# - https://github.com/Azure/azure-cli-dev-tools
#
# sudo apt install python3.8
# sudo apt install python3.8-venv
# sudo apt install python3.8-dev
# git clone https://github.com/Azure/azure-cli
# cd azure-cli
# python3.8 -m venv .venv
# source .venv/bin/activate
# python3 -m pip install azdev
# azdev setup --cli .
#
# azdev test
# (PYTHONPATH=tools python3 -m automation test --cli .)
# PYTHONPATH=tools python3 -m automation verify commands
# (./scripts/ci/unittest.sh)
# (./scripts/ci/test_automation.sh)
# (./scripts/ci/test_integration.sh)
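#
# The _install() helper below automates part of these steps: it clones the
# repo into data/azure-cli next to this file and runs "azdev setup --cli"
# against the checkout.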

import os
import os.path
import shlex
import subprocess
import sys

import pyperf

import pyperformance.venv


AZURE_CLI_UPSTREAM = "https://github.com/Azure/azure-cli"
AZURE_CLI_REPO = os.path.join(os.path.dirname(__file__), 'data', 'azure-cli')


def _run_bench_command_env(runner, name, command, env):
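# Export the variables in this process and also list their names in pyperf's
# --inherit-environ, so that the worker processes (and thus the benchmarked
# command) see them; os.environ is restored once bench_command() returns.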
if runner.args.inherit_environ:
runner.args.inherit_environ.extend(env)
else:
runner.args.inherit_environ = list(env)

env_before = dict(os.environ)
os.environ.update(env)
try:
return runner.bench_command(name, command)
finally:
os.environ.clear()
os.environ.update(env_before)


def _resolve_virtual_env(pypath=None):
# This is roughly equivalent to ensuring the env is activated.
env = pyperformance.venv.resolve_env_vars()

if pypath:
if not isinstance(pypath, str):
pypath = os.pathsep.join(pypath)
env["PYTHONPATH"] = pypath

return env


def _run(argv, **kwargs):
cmd_str = ' '.join(map(shlex.quote, argv))
print("Execute: %s" % cmd_str)
sys.stdout.flush()
sys.stderr.flush()
proc = subprocess.run(argv, **kwargs)
proc.check_returncode()


###################
# azure-cli helpers

# This global allows us to only check the install once per proc.
INSTALL_ENSURED = False


def install(force=False):
global INSTALL_ENSURED

print("=========================================")
print("installing for the azure_cli benchmark...")
if force:
_install()
elif INSTALL_ENSURED:
print("already checked")
elif _already_installed():
print("already installed")
else:
_install()
print("...done")
print("=========================================")

INSTALL_ENSURED = True


def _already_installed():
try:
import azure.cli
except ImportError:
return False
else:
return True


def _install():
if os.path.exists(AZURE_CLI_REPO):
print("local repo already exists (skipping)")
else:
_run(["git", "clone", AZURE_CLI_UPSTREAM, AZURE_CLI_REPO])

print("...setting up...")
env = _resolve_virtual_env()
env['PYTHONHASHSEED'] = '0'
# XXX Do not run this again if already done.
_run(
[sys.executable, "-m", "azdev", "setup", "--cli", AZURE_CLI_REPO],
env=env,
)


TESTS_FAST = [
# XXX Is this a good sample of tests (to roughly represent the workload)?
("src/azure-cli/azure/cli/command_modules/ams/tests/latest/test_ams_account_scenarios.py",
"AmsAccountTests.test_ams_check_name"),
]
TESTS_MEDIUM = [
]


def _get_tests_cmd(tests='<fast>'):
if not tests:
tests = '<all>'
if isinstance(tests, str):
if tests == '<all>':
tests = []  # an empty selection makes azdev run the full suite (slow)
elif tests == '<slow>':
tests = []  # currently the same as '<all>' (slow)
elif tests == '<medium>':
tests = TESTS_MEDIUM
elif tests == '<fast>':
tests = TESTS_FAST
else:
if tests.startswith('<'):
raise ValueError('unsupported "test" ({!r})'.format(tests))
raise NotImplementedError
else:
raise NotImplementedError
testargs = [file + ":" + name for file, name in tests]

cmd = ["azdev", "test"] + testargs
return cmd
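

# For illustration, with the default '<fast>' selection the command built by
# _get_tests_cmd() is "azdev test <path>:<test>" for the single entry in
# TESTS_FAST above.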


###################
# benchmarks

def run_sample(runner):
# For now we run just a small subset of azure-cli test suite.
env = _resolve_virtual_env()
cmd = _get_tests_cmd(tests='<fast>')
return _run_bench_command_env(
runner,
"azure_cli",
cmd,
env,
)

# XXX It may make sense for this test to instead manually invoke
# the Azure CLI in 3-5 different ways.
#def func():
# raise NotImplementedError
#return runner.bench_func("azure_cli", func)


def run_tests(runner):
env = _resolve_virtual_env()
tests = '<fast>' if runner.args.fast else '<all>'
cmd = _get_tests_cmd(tests)
return _run_bench_command_env(
runner,
"azure_cli",
cmd,
env,
)


def run_verify(runner):
pypath = os.path.join(AZURE_CLI_REPO, 'tools')
env = _resolve_virtual_env(pypath)
cmd = [
sys.executable,
"-m", "automation",
"verify",
"commands",
]
if runner.args.fast:
cmd.extend([
# XXX Is this a good enough proxy?
"--prefix", "account",
])
return _run_bench_command_env(
runner,
"azure_cli_verify",
cmd,
env,
)


###################
# the script

def get_runner():
def add_cmdline_args(cmd, args):
# Preserve --kind.
kind = getattr(args, 'kind', 'sample')
cmd.extend(["--kind", kind])
# Note that we do not preserve --install. We don't need
# the worker to duplicate the work.
if args.fast:
cmd.append('--fast')

runner = pyperf.Runner(
add_cmdline_args=add_cmdline_args,
metadata={
"description": "Performance of the Azure CLI",
},
)

runner.argparser.add_argument("--kind",
choices=["sample", "tests", "verify", "install"],
default="sample")
runner.argparser.add_argument("--install",
action="store_const", const="<ensure>",
default="<ensure>")
runner.argparser.add_argument("--force-install", dest="install",
action="store_const", const="<force>")
runner.argparser.add_argument("--no-install", dest="install",
action="store_const", const=None)

return runner


def main():
runner = get_runner()
args = runner.parse_args()

if args.install == "<ensure>":
install(force=False)
elif args.install == "<force>":
install(force=True)
elif args.install:
raise NotImplementedError(args.install)

if args.kind == "sample":
# fast(er)
run_sample(runner)
elif args.kind == "tests":
# slow
#runner.values = 1
run_tests(runner)
elif args.kind == "verify":
# slow
#runner.values = 1
run_verify(runner)
elif args.kind == "install":
return
else:
raise NotImplementedError(args.kind)


if __name__ == '__main__':
main()