azdev/operations/performance.py

# -----------------------------------------------------------------------------
# Copyright (c) Microsoft Corporation. All rights reserved.
# Licensed under the MIT License. See License.txt in the project root for
# license information.
# -----------------------------------------------------------------------------

"""Performance checks: module load-time thresholds and command benchmarking."""

import re
import timeit

from knack.log import get_logger
from knack.util import CLIError

from azdev.utilities import (
    display, heading, subheading, cmd, py_cmd, require_azure_cli)

logger = get_logger(__name__)

TOTAL = 'ALL'
TOTAL_THRESHOLD = 300
DEFAULT_THRESHOLD = 10
THRESHOLDS = {
    # threshold value: num of exceptions allowed
    50: 2,
    40: 3
}

# Extracts the quoted module name and the first number following it from a
# 'DEBUG: Loaded module' line of the CLI debug output.
_LOAD_TIME_PATTERN = re.compile(r"[^']*'(?P<mod>[^']*)'[\D]*(?P<val>[\d\.]*)")


def _parse_load_time(line):
    """Return ``(module, milliseconds)`` parsed from a debug line, or ``None``.

    ``None`` is returned when the line does not match the expected layout or
    when the captured number cannot be converted to a float.
    """
    matches = _LOAD_TIME_PATTERN.match(line)
    if matches is None:
        return None
    try:
        # The captured value is multiplied by 1000; the final report labels
        # the figures as ms.
        return matches.group('mod'), float(matches.group('val')) * 1000
    except ValueError:
        # The value group may legally match '' or something like '1.2.3'.
        return None


# pylint: disable=too-many-statements
def check_load_time(runs=3):
    """Measure per-module load times of ``az -h --debug`` and enforce thresholds.

    The command is executed ``runs + 1`` times; the first execution is a
    warm-up and its output is discarded. For every module reported on a
    'DEBUG: Loaded module' line the average and population standard deviation
    over the measured runs are computed and compared with DEFAULT_THRESHOLD
    (TOTAL_THRESHOLD for the summed total). A module exceeding its threshold
    may claim one of the limited higher thresholds listed in THRESHOLDS.

    :param runs: number of measured executions (must be at least 1).
    :raises CLIError: if ``runs`` is less than 1 or if any module fails.
    """
    if runs < 1:
        raise CLIError("Number of runs must be greater than 0.")

    require_azure_cli()

    heading('Module Load Performance')

    results = {TOTAL: []}
    # Time the module loading X times
    for i in range(runs + 1):
        lines = cmd('az -h --debug', show_stderr=True).result
        if i == 0:
            # Ignore the first run since it can be longer due to *.pyc file compilation
            continue

        try:
            lines = lines.decode().splitlines()
        except AttributeError:
            # The result is already text, so there is nothing to decode.
            lines = lines.splitlines()

        total_time = 0
        for line in lines:
            if not line.startswith('DEBUG: Loaded module'):
                continue
            parsed = _parse_load_time(line)
            if parsed is None:
                logger.warning("Skipping unparsable load time line: %s", line)
                continue
            mod, val = parsed
            total_time = total_time + val
            results.setdefault(mod, []).append(val)
        results[TOTAL].append(total_time)

    passed_mods = {}
    failed_mods = {}

    # Claim exceptions from a per-call copy so that repeated invocations in
    # the same process always start with the full allowance.
    remaining_exceptions = dict(THRESHOLDS)

    def _claim_higher_threshold(val):
        """Consume and return the lowest still-available threshold above val."""
        for threshold in sorted(remaining_exceptions):
            if remaining_exceptions[threshold] and val < threshold:
                remaining_exceptions[threshold] -= 1
                return threshold
        return None

    for mod in sorted(results):
        val = results[mod]
        mean_val = mean(val)
        stdev_val = pstdev(val)
        threshold = TOTAL_THRESHOLD if mod == TOTAL else DEFAULT_THRESHOLD
        stats = {
            'average': mean_val,
            'stdev': stdev_val,
            'threshold': threshold,
            'values': val
        }
        if mean_val > threshold:
            # claim a threshold exception if available
            new_threshold = _claim_higher_threshold(mean_val)
            if new_threshold:
                stats['threshold'] = new_threshold
                passed_mods[mod] = stats
            else:
                failed_mods[mod] = stats
        else:
            passed_mods[mod] = stats

    subheading('Results')
    if failed_mods:
        display('== PASSED MODULES ==')
        display_table(passed_mods)
        display('\nFAILED MODULES')
        display_table(failed_mods)
        raise CLIError("""
FAILED: Some modules failed. If values are close to the threshold, rerun. If values
are large, check that you do not have top-level imports like azure.mgmt or msrestazure
in any modified files.
""")

    display("== PASSED MODULES ==")
    display_table(passed_mods)
    display(
        "\nPASSED: Average load time all modules: {} ms".format(
            int(passed_mods[TOTAL]["average"])
        )
    )


def mean(data):
    """Return the sample arithmetic mean of data.

    :raises ValueError: if data is empty.
    """
    n = len(data)
    if n < 1:
        raise ValueError("len < 1")
    return sum(data) / float(n)


def sq_deviation(data):
    """Return sum of square deviations of sequence data."""
    c = mean(data)
    return sum((x - c) ** 2 for x in data)


def pstdev(data):
    """Calculates the population standard deviation.

    A single data point is accepted and yields 0.0, so a one-run measurement
    can still be reported.

    :raises ValueError: if data is empty.
    """
    n = len(data)
    if n < 1:
        raise ValueError('len < 1')
    ss = sq_deviation(data)
    return (ss / n) ** 0.5


def display_table(data):
    """Display one aligned row of statistics per module.

    :param data: mapping of module name to a dict holding the keys
        'average', 'threshold', 'stdev' and 'values'.
    """
    display('{:<20} {:>12} {:>12} {:>12} {:>25}'.format('Module', 'Average', 'Threshold', 'Stdev', 'Values'))
    for key, val in data.items():
        display('{:<20} {:>12.0f} {:>12.0f} {:>12.0f} {:>25}'.format(
            key, val['average'], val['threshold'], val['stdev'], str(val['values'])))


# require azdev setup
def benchmark(commands=None, runs=20):
    """Time each command ``runs`` times and return summary statistics.

    Every command is measured in a fresh process pool sized to the CPU count.
    If measuring a command takes longer than the timeout, measurement stops
    and the statistics collected for the preceding commands are returned.

    :param commands: iterable of raw command strings; when empty or None,
        every loaded command is measured with ' --help' appended.
    :param runs: number of executions per command (must be greater than 0).
    :returns: list of dicts, one per measured command, holding the timing
        statistics plus the "Command" and "Runs" keys.
    :raises CLIError: if ``runs`` is not positive.
    """
    if runs <= 0:
        raise CLIError("Number of runs must be greater than 0.")

    if not commands:
        commands = _benchmark_load_all_commands()

    result = []

    import multiprocessing

    # Upper bound, in seconds, for collecting all runs of a single command.
    timeout_seconds = 1000

    # Measure every wanted commands
    for raw_command in commands:
        logger.info("Measuring %s...", raw_command)

        # The context manager terminates the workers on every exit path,
        # including KeyboardInterrupt, so no worker process is left behind.
        with multiprocessing.Pool(multiprocessing.cpu_count(), _benchmark_process_pool_init) as pool:
            # map_async(...).get(timeout) is used because of a bug of Python
            # multiprocessing.Pool (https://bugs.python.org/issue8296)
            # Discussion on StackOverflow:
            # https://stackoverflow.com/questions/1408356/keyboard-interrupts-with-pythons-multiprocessing-pool/1408476
            try:
                time_series = pool.map_async(_benchmark_cmd_timer, [raw_command] * runs).get(timeout_seconds)
            except multiprocessing.TimeoutError:
                logger.warning(
                    "Timed out after %s seconds measuring %s; returning the results collected so far.",
                    timeout_seconds, raw_command)
                break
            pool.close()
            pool.join()

        staticstic = _benchmark_cmd_staticstic(time_series)
        staticstic.update({
            "Command": raw_command,
            "Runs": runs,
        })

        logger.info(staticstic)

        result.append(staticstic)

    return result


def _benchmark_load_all_commands():
    """Return the sorted list of all loaded commands, each suffixed with ' --help'.

    :raises CLIError: if the Azure CLI core package cannot be imported.
    """
    try:
        from azure.cli.core import get_default_cli
        from azure.cli.core.file_util import create_invoker_and_load_cmds_and_args
    except ImportError as ex:
        raise CLIError("Azure CLI is not installed") from ex

    az_cli = get_default_cli()
    create_invoker_and_load_cmds_and_args(az_cli)
    command_names = az_cli.invocation.commands_loader.command_table.keys()
    return sorted(name + " --help" for name in command_names)


def _benchmark_process_pool_init():
    """Pool initializer: make the worker process ignore SIGINT."""
    import signal

    signal.signal(signal.SIGINT, signal.SIG_IGN)


def _benchmark_cmd_timer(raw_command):
    """Return the elapsed time, rounded to 4 decimals, of one command run."""
    s = timeit.default_timer()
    # NOTE(review): presumably runs the command through the azure.cli module
    # in a subprocess -- confirm against py_cmd.
    py_cmd("azure.cli {}".format(raw_command), is_module=True)
    e = timeit.default_timer()
    return round(e - s, 4)


def _benchmark_cmd_staticstic(time_series: list):
    """Summarize a series of timings.

    The input list is left unmodified.

    :param time_series: non-empty list of numeric timings.
    :returns: dict with the keys "Min", "Max", "Media" (the median; the
        spelling is kept so existing consumers of the output keep working),
        "Avg" and "Std" (population standard deviation), each rounded to
        4 decimals.
    :raises ValueError: if time_series is empty.
    """
    from math import sqrt

    if not time_series:
        raise ValueError("time_series must not be empty")

    ordered = sorted(time_series)
    size = len(ordered)

    if size % 2 == 0:
        mid_time = (ordered[size // 2 - 1] + ordered[size // 2]) / 2
    else:
        mid_time = ordered[(size - 1) // 2]

    min_time = ordered[0]
    max_time = ordered[-1]
    avg_time = sum(ordered) / size

    std_deviation = sqrt(
        sum((t - avg_time) * (t - avg_time) for t in ordered) / size
    )

    return {
        "Min": round(min_time, 4),
        "Max": round(max_time, 4),
        "Media": round(mid_time, 4),
        "Avg": round(avg_time, 4),
        "Std": round(std_deviation, 4),
    }

azdev/operations/performance.py (171 lines of code) (raw):