toolchain-utils/crosperf/generate_report.py

*760c253cSXin Li#!/usr/bin/env python3
*760c253cSXin Li# -*- coding: utf-8 -*-
*760c253cSXin Li# Copyright 2016 The ChromiumOS Authors
*760c253cSXin Li# Use of this source code is governed by a BSD-style license that can be
*760c253cSXin Li# found in the LICENSE file.
*760c253cSXin Li
*760c253cSXin Li"""Given a specially-formatted JSON object, generates results report(s).
*760c253cSXin Li
*760c253cSXin LiThe JSON object should look like:
*760c253cSXin Li{"data": BenchmarkData, "platforms": BenchmarkPlatforms}
*760c253cSXin Li
*760c253cSXin LiBenchmarkPlatforms is a [str], each of which names a platform the benchmark
*760c253cSXin Li  was run on (e.g. peppy, shamu, ...). Note that the order of this list is
*760c253cSXin Li  related with the order of items in BenchmarkData.
*760c253cSXin Li
*760c253cSXin LiBenchmarkData is a {str: [PlatformData]}. The str is the name of the benchmark,
*760c253cSXin Liand a PlatformData is a set of data for a given platform. There must be one
*760c253cSXin LiPlatformData for each benchmark, for each element in BenchmarkPlatforms.
*760c253cSXin Li
*760c253cSXin LiA PlatformData is a [{str: float}], where each str names a metric we recorded,
*760c253cSXin Liand the float is the value for that metric. Each element is considered to be
*760c253cSXin Lithe metrics collected from an independent run of this benchmark. NOTE: Each
*760c253cSXin LiPlatformData is expected to have a "retval" key, with the return value of
*760c253cSXin Lithe benchmark. If the benchmark is successful, said return value should be 0.
*760c253cSXin LiOtherwise, this will break some of our JSON functionality.
*760c253cSXin Li
*760c253cSXin LiPutting it all together, a JSON object will end up looking like:
*760c253cSXin Li  { "platforms": ["peppy", "peppy-new-crosstool"],
*760c253cSXin Li    "data": {
*760c253cSXin Li      "bench_draw_line": [
*760c253cSXin Li        [{"time (ms)": 1.321, "memory (mb)": 128.1, "retval": 0},
*760c253cSXin Li         {"time (ms)": 1.920, "memory (mb)": 128.4, "retval": 0}],
*760c253cSXin Li        [{"time (ms)": 1.221, "memory (mb)": 124.3, "retval": 0},
*760c253cSXin Li         {"time (ms)": 1.423, "memory (mb)": 123.9, "retval": 0}]
*760c253cSXin Li      ]
*760c253cSXin Li    }
*760c253cSXin Li  }
*760c253cSXin Li
*760c253cSXin LiWhich says that we ran a benchmark on platforms named peppy, and
*760c253cSXin Li  peppy-new-crosstool.
*760c253cSXin LiWe ran one benchmark, named bench_draw_line.
*760c253cSXin LiIt was run twice on each platform.
*760c253cSXin LiPeppy's runs took 1.321ms and 1.920ms, while peppy-new-crosstool's took 1.221ms
*760c253cSXin Li  and 1.423ms. None of the runs failed to complete.
*760c253cSXin Li"""
*760c253cSXin Li
*760c253cSXin Li
*760c253cSXin Liimport argparse
*760c253cSXin Liimport functools
*760c253cSXin Liimport json
*760c253cSXin Liimport os
*760c253cSXin Liimport sys
*760c253cSXin Liimport traceback
*760c253cSXin Li
*760c253cSXin Lifrom results_report import BenchmarkResults
*760c253cSXin Lifrom results_report import HTMLResultsReport
*760c253cSXin Lifrom results_report import JSONResultsReport
*760c253cSXin Lifrom results_report import TextResultsReport
*760c253cSXin Li
*760c253cSXin Li
*760c253cSXin Lidef CountBenchmarks(benchmark_runs):
*760c253cSXin Li    """Counts the number of iterations for each benchmark in benchmark_runs."""
*760c253cSXin Li
*760c253cSXin Li    # Example input for benchmark_runs:
*760c253cSXin Li    # {"bench": [[run1, run2, run3], [run1, run2, run3, run4]]}
*760c253cSXin Li    def _MaxLen(results):
*760c253cSXin Li        return 0 if not results else max(len(r) for r in results)
*760c253cSXin Li
*760c253cSXin Li    return [
*760c253cSXin Li        (name, _MaxLen(results)) for name, results in benchmark_runs.items()
*760c253cSXin Li    ]
*760c253cSXin Li
*760c253cSXin Li
*760c253cSXin Lidef CutResultsInPlace(results, max_keys=50, complain_on_update=True):
*760c253cSXin Li    """Limits the given benchmark results to max_keys keys in-place.
*760c253cSXin Li
*760c253cSXin Li    This takes the `data` field from the benchmark input, and mutates each
*760c253cSXin Li    benchmark run to contain `max_keys` elements (ignoring special elements, like
*760c253cSXin Li    "retval"). At the moment, it just selects the first `max_keys` keyvals,
*760c253cSXin Li    alphabetically.
*760c253cSXin Li
*760c253cSXin Li    If complain_on_update is true, this will print a message noting that a
*760c253cSXin Li    truncation occurred.
*760c253cSXin Li
*760c253cSXin Li    This returns the `results` object that was passed in, for convenience.
*760c253cSXin Li
*760c253cSXin Li    e.g.
*760c253cSXin Li    >>> benchmark_data = {
*760c253cSXin Li    ...   "bench_draw_line": [
*760c253cSXin Li    ...     [{"time (ms)": 1.321, "memory (mb)": 128.1, "retval": 0},
*760c253cSXin Li    ...      {"time (ms)": 1.920, "memory (mb)": 128.4, "retval": 0}],
*760c253cSXin Li    ...     [{"time (ms)": 1.221, "memory (mb)": 124.3, "retval": 0},
*760c253cSXin Li    ...      {"time (ms)": 1.423, "memory (mb)": 123.9, "retval": 0}]
*760c253cSXin Li    ...   ]
*760c253cSXin Li    ... }
*760c253cSXin Li    >>> CutResultsInPlace(benchmark_data, max_keys=1, complain_on_update=False)
*760c253cSXin Li    {
*760c253cSXin Li      'bench_draw_line': [
*760c253cSXin Li        [{'memory (mb)': 128.1, 'retval': 0},
*760c253cSXin Li         {'memory (mb)': 128.4, 'retval': 0}],
*760c253cSXin Li        [{'memory (mb)': 124.3, 'retval': 0},
*760c253cSXin Li         {'memory (mb)': 123.9, 'retval': 0}]
*760c253cSXin Li      ]
*760c253cSXin Li    }
*760c253cSXin Li    """
*760c253cSXin Li    actually_updated = False
*760c253cSXin Li    for bench_results in results.values():
*760c253cSXin Li        for platform_results in bench_results:
*760c253cSXin Li            for i, result in enumerate(platform_results):
*760c253cSXin Li                # Keep the keys that come earliest when sorted alphabetically.
*760c253cSXin Li                # Forcing alphabetical order is arbitrary, but necessary; otherwise,
*760c253cSXin Li                # the keyvals we'd emit would depend on our iteration order through a
*760c253cSXin Li                # map.
*760c253cSXin Li                removable_keys = sorted(k for k in result if k != "retval")
*760c253cSXin Li                retained_keys = removable_keys[:max_keys]
*760c253cSXin Li                platform_results[i] = {k: result[k] for k in retained_keys}
*760c253cSXin Li                # retval needs to be passed through all of the time.
*760c253cSXin Li                retval = result.get("retval")
*760c253cSXin Li                if retval is not None:
*760c253cSXin Li                    platform_results[i]["retval"] = retval
*760c253cSXin Li                actually_updated = actually_updated or len(
*760c253cSXin Li                    retained_keys
*760c253cSXin Li                ) != len(removable_keys)
*760c253cSXin Li
*760c253cSXin Li    if actually_updated and complain_on_update:
*760c253cSXin Li        print(
*760c253cSXin Li            "Warning: Some benchmark keyvals have been truncated.",
*760c253cSXin Li            file=sys.stderr,
*760c253cSXin Li        )
*760c253cSXin Li    return results
*760c253cSXin Li
*760c253cSXin Li
*760c253cSXin Lidef _PositiveInt(s):
*760c253cSXin Li    i = int(s)
*760c253cSXin Li    if i < 0:
*760c253cSXin Li        raise argparse.ArgumentTypeError("%d is not a positive integer." % (i,))
*760c253cSXin Li    return i
*760c253cSXin Li
*760c253cSXin Li
*760c253cSXin Lidef _AccumulateActions(args):
*760c253cSXin Li    """Given program arguments, determines what actions we want to run.
*760c253cSXin Li
*760c253cSXin Li    Returns [(ResultsReportCtor, str)], where ResultsReportCtor can construct a
*760c253cSXin Li    ResultsReport, and the str is the file extension for the given report.
*760c253cSXin Li    """
*760c253cSXin Li    results = []
*760c253cSXin Li    # The order of these is arbitrary.
*760c253cSXin Li    if args.json:
*760c253cSXin Li        results.append((JSONResultsReport, "json"))
*760c253cSXin Li    if args.text:
*760c253cSXin Li        results.append((TextResultsReport, "txt"))
*760c253cSXin Li    if args.email:
*760c253cSXin Li        email_ctor = functools.partial(TextResultsReport, email=True)
*760c253cSXin Li        results.append((email_ctor, "email"))
*760c253cSXin Li    # We emit HTML if nothing else was specified.
*760c253cSXin Li    if args.html or not results:
*760c253cSXin Li        results.append((HTMLResultsReport, "html"))
*760c253cSXin Li    return results
*760c253cSXin Li
*760c253cSXin Li
*760c253cSXin Li# Note: get_contents is a function, because it may be expensive (generating some
*760c253cSXin Li# HTML reports takes O(seconds) on my machine, depending on the size of the
*760c253cSXin Li# input data).
*760c253cSXin Lidef WriteFile(output_prefix, extension, get_contents, overwrite, verbose):
*760c253cSXin Li    """Writes `contents` to a file named "${output_prefix}.${extension}".
*760c253cSXin Li
*760c253cSXin Li    get_contents should be a zero-args function that returns a string (of the
*760c253cSXin Li    contents to write).
*760c253cSXin Li    If output_prefix == '-', this writes to stdout.
*760c253cSXin Li    If overwrite is False, this will not overwrite files.
*760c253cSXin Li    """
*760c253cSXin Li    if output_prefix == "-":
*760c253cSXin Li        if verbose:
*760c253cSXin Li            print("Writing %s report to stdout" % (extension,), file=sys.stderr)
*760c253cSXin Li        sys.stdout.write(get_contents())
*760c253cSXin Li        return
*760c253cSXin Li
*760c253cSXin Li    file_name = "%s.%s" % (output_prefix, extension)
*760c253cSXin Li    if not overwrite and os.path.exists(file_name):
*760c253cSXin Li        raise IOError(
*760c253cSXin Li            "Refusing to write %s -- it already exists" % (file_name,)
*760c253cSXin Li        )
*760c253cSXin Li
*760c253cSXin Li    with open(file_name, "w") as out_file:
*760c253cSXin Li        if verbose:
*760c253cSXin Li            print(
*760c253cSXin Li                "Writing %s report to %s" % (extension, file_name),
*760c253cSXin Li                file=sys.stderr,
*760c253cSXin Li            )
*760c253cSXin Li        out_file.write(get_contents())
*760c253cSXin Li
*760c253cSXin Li
*760c253cSXin Lidef RunActions(actions, benchmark_results, output_prefix, overwrite, verbose):
*760c253cSXin Li    """Runs `actions`, returning True if all succeeded."""
*760c253cSXin Li    failed = False
*760c253cSXin Li
*760c253cSXin Li    report_ctor = None  # Make the linter happy
*760c253cSXin Li    for report_ctor, extension in actions:
*760c253cSXin Li        try:
*760c253cSXin Li            get_contents = lambda: report_ctor(benchmark_results).GetReport()
*760c253cSXin Li            WriteFile(
*760c253cSXin Li                output_prefix, extension, get_contents, overwrite, verbose
*760c253cSXin Li            )
*760c253cSXin Li        except Exception:
*760c253cSXin Li            # Complain and move along; we may have more actions that might complete
*760c253cSXin Li            # successfully.
*760c253cSXin Li            failed = True
*760c253cSXin Li            traceback.print_exc()
*760c253cSXin Li    return not failed
*760c253cSXin Li
*760c253cSXin Li
*760c253cSXin Lidef PickInputFile(input_name):
*760c253cSXin Li    """Given program arguments, returns file to read for benchmark input."""
*760c253cSXin Li    return sys.stdin if input_name == "-" else open(input_name)
*760c253cSXin Li
*760c253cSXin Li
*760c253cSXin Lidef _NoPerfReport(_label_name, _benchmark_name, _benchmark_iteration):
*760c253cSXin Li    return {}
*760c253cSXin Li
*760c253cSXin Li
*760c253cSXin Lidef _ParseArgs(argv):
*760c253cSXin Li    parser = argparse.ArgumentParser(
*760c253cSXin Li        description="Turns JSON into results " "report(s)."
*760c253cSXin Li    )
*760c253cSXin Li    parser.add_argument(
*760c253cSXin Li        "-v",
*760c253cSXin Li        "--verbose",
*760c253cSXin Li        action="store_true",
*760c253cSXin Li        help="Be a tiny bit more verbose.",
*760c253cSXin Li    )
*760c253cSXin Li    parser.add_argument(
*760c253cSXin Li        "-f",
*760c253cSXin Li        "--force",
*760c253cSXin Li        action="store_true",
*760c253cSXin Li        help="Overwrite existing results files.",
*760c253cSXin Li    )
*760c253cSXin Li    parser.add_argument(
*760c253cSXin Li        "-o",
*760c253cSXin Li        "--output",
*760c253cSXin Li        default="report",
*760c253cSXin Li        type=str,
*760c253cSXin Li        help="Prefix of the output filename (default: report). "
*760c253cSXin Li        "- means stdout.",
*760c253cSXin Li    )
*760c253cSXin Li    parser.add_argument(
*760c253cSXin Li        "-i",
*760c253cSXin Li        "--input",
*760c253cSXin Li        required=True,
*760c253cSXin Li        type=str,
*760c253cSXin Li        help="Where to read the JSON from. - means stdin.",
*760c253cSXin Li    )
*760c253cSXin Li    parser.add_argument(
*760c253cSXin Li        "-l",
*760c253cSXin Li        "--statistic-limit",
*760c253cSXin Li        default=0,
*760c253cSXin Li        type=_PositiveInt,
*760c253cSXin Li        help="The maximum number of benchmark statistics to "
*760c253cSXin Li        "display from a single run. 0 implies unlimited.",
*760c253cSXin Li    )
*760c253cSXin Li    parser.add_argument(
*760c253cSXin Li        "--json", action="store_true", help="Output a JSON report."
*760c253cSXin Li    )
*760c253cSXin Li    parser.add_argument(
*760c253cSXin Li        "--text", action="store_true", help="Output a text report."
*760c253cSXin Li    )
*760c253cSXin Li    parser.add_argument(
*760c253cSXin Li        "--email",
*760c253cSXin Li        action="store_true",
*760c253cSXin Li        help="Output a text report suitable for email.",
*760c253cSXin Li    )
*760c253cSXin Li    parser.add_argument(
*760c253cSXin Li        "--html",
*760c253cSXin Li        action="store_true",
*760c253cSXin Li        help="Output an HTML report (this is the default if no "
*760c253cSXin Li        "other output format is specified).",
*760c253cSXin Li    )
*760c253cSXin Li    return parser.parse_args(argv)
*760c253cSXin Li
*760c253cSXin Li
*760c253cSXin Lidef Main(argv):
*760c253cSXin Li    args = _ParseArgs(argv)
*760c253cSXin Li    with PickInputFile(args.input) as in_file:
*760c253cSXin Li        raw_results = json.load(in_file)
*760c253cSXin Li
*760c253cSXin Li    platform_names = raw_results["platforms"]
*760c253cSXin Li    results = raw_results["data"]
*760c253cSXin Li    if args.statistic_limit:
*760c253cSXin Li        results = CutResultsInPlace(results, max_keys=args.statistic_limit)
*760c253cSXin Li    benches = CountBenchmarks(results)
*760c253cSXin Li    # In crosperf, a label is essentially a platform+configuration. So, a name of
*760c253cSXin Li    # a label and a name of a platform are equivalent for our purposes.
*760c253cSXin Li    bench_results = BenchmarkResults(
*760c253cSXin Li        label_names=platform_names,
*760c253cSXin Li        benchmark_names_and_iterations=benches,
*760c253cSXin Li        run_keyvals=results,
*760c253cSXin Li        read_perf_report=_NoPerfReport,
*760c253cSXin Li    )
*760c253cSXin Li    actions = _AccumulateActions(args)
*760c253cSXin Li    ok = RunActions(
*760c253cSXin Li        actions, bench_results, args.output, args.force, args.verbose
*760c253cSXin Li    )
*760c253cSXin Li    return 0 if ok else 1
*760c253cSXin Li
*760c253cSXin Li
*760c253cSXin Liif __name__ == "__main__":
*760c253cSXin Li    sys.exit(Main(sys.argv[1:]))