compare_perf_metrics

#!/usr/bin/env python3
import argparse
import json
import pathlib
import sys

def parse_args():
    parser = argparse.ArgumentParser(
        description="Automate the process of calculating relative change in "
        "perf_metrics. This makes catching regressions much easier."
    )
    parser.add_argument(
        "old_dir_name",
        type=str,
        help="The name of the directory containing the last release "
        "performance logs, e.g. 2.2.0",
    )
    parser.add_argument(
        "new_dir_name",
        type=str,
        help="The name of the directory containing the new release "
        "performance logs, e.g. 2.3.0",
    )
    args = parser.parse_args()
    return args

def main(old_dir_name, new_dir_name):
    old_paths = paths_without_root_dir(walk(old_dir_name))
    new_paths = paths_without_root_dir(walk(new_dir_name))
    to_compare, missing_in_new, missing_in_old = get_compare_list(old_paths, new_paths)
    # Report log files that exist in only one of the two release directories.
    for path in missing_in_new:
        print(new_dir_name, "does not have", path)
    for path in missing_in_old:
        print(old_dir_name, "does not have", path)
    throughput_regressions = []
    latency_regressions = []
    missing_metrics_in_new = []
    missing_metrics_in_old = []
    for path in to_compare:
        old_path = pathlib.Path(old_dir_name, *path.parts)
        new_path = pathlib.Path(new_dir_name, *path.parts)
        throughput, latency, new_missing, old_missing = get_regressions(old_path, new_path)
        throughput_regressions.extend(throughput)
        latency_regressions.extend(latency)
        # Keep the file path with each missing metric so the report below
        # names the log file the metric was missing from.
        missing_metrics_in_new.extend((new_path, m) for m in new_missing)
        missing_metrics_in_old.extend((old_path, m) for m in old_missing)
    for path, perf_metric in missing_metrics_in_new:
        print(f"{path} does not have {perf_metric}")
    for path, perf_metric in missing_metrics_in_old:
        print(f"{path} does not have {perf_metric}")
    # Print the worst regressions first: lowest throughput ratios,
    # highest latency ratios.
    throughput_regressions.sort()
    for _, regression in throughput_regressions:
        print(regression)
    latency_regressions.sort(reverse=True)
    for _, regression in latency_regressions:
        print(regression)

def walk(dir_name):
    # Iterative depth-first traversal that yields every file under dir_name.
    stack = [pathlib.Path(dir_name)]
    while stack:
        root = stack.pop()
        if not root.is_dir():
            yield root
        else:
            stack.extend(root.iterdir())

def paths_without_root_dir(paths):
    # Drop the leading directory component so paths from the old and new
    # release trees can be compared against each other.
    for p in paths:
        yield pathlib.Path(*p.parts[1:])

def get_compare_list(old, new):
    # Returns (present in both, only in old i.e. missing from new,
    # only in new i.e. missing from old).
    old_set = set(old)
    new_set = set(new)
    return (
        old_set.intersection(new_set),
        old_set.difference(new_set),
        new_set.difference(old_set),
    )

def get_regressions(old_path, new_path):
    with open(old_path, "r") as f:
        old = json.load(f)
    with open(new_path, "r") as f:
        new = json.load(f)

    def perf_metrics(root):
        return root["perf_metrics"]

    def types(perf_metric):
        return perf_metric["perf_metric_type"]

    def values(perf_metric):
        return perf_metric["perf_metric_value"]

    def names(perf_metric):
        return perf_metric["perf_metric_name"]

    def list_to_dict(input_list, key_selector, value_selector):
        return {key_selector(e): value_selector(e) for e in input_list}

    old_values = list_to_dict(perf_metrics(old), names, values)
    new_values = list_to_dict(perf_metrics(new), names, values)
    perf_metric_types = {
        **list_to_dict(perf_metrics(old), names, types),
        **list_to_dict(perf_metrics(new), names, types),
    }
    to_compare, missing_in_new, missing_in_old = get_compare_list(
        old_values.keys(),
        new_values.keys(),
    )
    throughput_regressions = []
    latency_regressions = []
    for perf_metric_name in to_compare:
        perf_type = perf_metric_types[perf_metric_name]
        old_value = old_values[perf_metric_name]
        new_value = new_values[perf_metric_name]
        ratio = new_value / old_value
        ratio_str = f"{100 * abs(ratio - 1):.02f}%"
        regression_message = (
            f"REGRESSION {ratio_str}: {perf_metric_name} ({perf_type}) "
            f"regresses from {old_value} to {new_value} in {new_path}"
        )
        if perf_type == "THROUGHPUT":
            # Lower throughput in the new release is a regression.
            if ratio < 1.0:
                throughput_regressions.append((ratio, regression_message))
        elif perf_type == "LATENCY":
            # Higher latency in the new release is a regression.
            if ratio > 1.0:
                latency_regressions.append((ratio, regression_message))
        else:
            raise ValueError(
                f"{perf_metric_name} has unexpected perf_metric_type {perf_type}"
            )
    return throughput_regressions, latency_regressions, missing_in_new, missing_in_old

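# A performance log consumed by get_regressions() is, as inferred from the
# lookups above, a JSON file with a top-level "perf_metrics" list whose entries
# carry perf_metric_name, perf_metric_type (THROUGHPUT or LATENCY), and
# perf_metric_value. A minimal sketch of such a file; the metric names and
# values are made-up examples, not real data:
#
# {
#   "perf_metrics": [
#     {"perf_metric_name": "example_requests_per_sec",
#      "perf_metric_type": "THROUGHPUT",
#      "perf_metric_value": 1234.5},
#     {"perf_metric_name": "example_p99_latency_ms",
#      "perf_metric_type": "LATENCY",
#      "perf_metric_value": 42.0}
#   ]
# }
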
if __name__ == "__main__":
    args = parse_args()
    sys.exit(main(args.old_dir_name, args.new_dir_name))
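
# Example invocation, assuming two directories of JSON performance logs with
# matching relative paths (the release numbers mirror the argparse help and
# are illustrative only):
#
#   ./compare_perf_metrics 2.2.0 2.3.0
#
# Files present in only one directory, metrics present in only one file, and
# any regressions (sorted worst first) are printed to stdout.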