toolchain-utils/crosperf/benchmark.py

*760c253cSXin Li# Copyright 2013 The ChromiumOS Authors
*760c253cSXin Li# Use of this source code is governed by a BSD-style license that can be
*760c253cSXin Li# found in the LICENSE file.
*760c253cSXin Li
*760c253cSXin Li"""Define a type that wraps a Benchmark instance."""
*760c253cSXin Li
*760c253cSXin Li
*760c253cSXin Liimport math
*760c253cSXin Liimport statistics
*760c253cSXin Lifrom typing import Any
*760c253cSXin Li
*760c253cSXin Liimport numpy as np
*760c253cSXin Li
*760c253cSXin Li
*760c253cSXin Li# See crbug.com/673558 for how these are estimated.
*760c253cSXin Li_estimated_stddev = {
*760c253cSXin Li    "octane": 0.015,
*760c253cSXin Li    "kraken": 0.019,
*760c253cSXin Li    "speedometer": 0.007,
*760c253cSXin Li    "speedometer2": 0.006,
*760c253cSXin Li    "dromaeo.domcoreattr": 0.023,
*760c253cSXin Li    "dromaeo.domcoremodify": 0.011,
*760c253cSXin Li    "graphics_WebGLAquarium": 0.008,
*760c253cSXin Li    "page_cycler_v2.typical_25": 0.021,
*760c253cSXin Li    "loading.desktop": 0.021,  # Copied from page_cycler initially
*760c253cSXin Li}
*760c253cSXin Li
*760c253cSXin Li# Numpy makes it hard to know the real type of some inputs
*760c253cSXin Li# and outputs, so this type alias is just for docs.
*760c253cSXin LiFloatLike = Any
*760c253cSXin Li
*760c253cSXin Li
def isf(x: FloatLike, mu=0.0, sigma=1.0, pitch=0.01) -> FloatLike:
    """Compute the inverse survival function for value x.

    In the absence of scipy.stats.norm's isf(), this function
    re-implements the inverse survival function of a normal distribution
    by tabulating the survival function and numerically inverting it,
    interpolating linearly between table values. See bug b/284489250 for
    details.

    Survival function as defined by:
    https://en.wikipedia.org/wiki/Survival_function

    The table covers y-values from `mu - 4 * sigma` (inclusive) up to
    `mu + 4 * sigma` (exclusive). Probabilities that fall outside the
    tabulated survival range are clamped to the nearest table end, because
    that is what np.interp does for out-of-range inputs.

    Examples:
        >>> -2.0e-16 < isf(0.5) <  2.0e-16
        True

    Args:
        x: float or numpy array-like of survival probabilities to compute
            the ISF for.
        mu: Center of the underlying normal distribution.
        sigma: Spread of the underlying normal distribution.
        pitch: Spacing between y-value interpolation points, measured in
            units of `sigma` (so it is the absolute spacing for the default
            `sigma` of 1.0).

    Returns:
        float or numpy array-like representing the ISF of `x`.

    Raises:
        statistics.StatisticsError: If `sigma` is negative or zero (raised
            by statistics.NormalDist).
    """
    norm = statistics.NormalDist(mu, sigma)
    # Build the grid in standard-deviation units and then shift/scale it, so
    # the table always brackets the distribution regardless of mu and sigma.
    # With the defaults this is exactly np.arange(-4.0, 4.0, pitch).
    # np.interp requires a monotonically increasing x table.
    # Because the survival table is monotonically decreasing in y, the
    # y-values are reversed so the survival values come out increasing.
    z_vals = np.flip(np.arange(-4.0, 4.0, pitch))
    y_vals = mu + sigma * z_vals
    survival_table = np.fromiter(
        (1.0 - norm.cdf(y) for y in y_vals), y_vals.dtype
    )
    return np.interp(x, survival_table, y_vals)
*760c253cSXin Li
# Get #samples needed to guarantee a given confidence interval, assuming the
# samples follow normal distribution.
def _samples(b: str, *, confidence: float = 0.9, margin: float = 0.02) -> int:
    """Return how many iterations benchmark `b` should run by default.

    The defaults correspond to CI = (0.9, 0.02), i.e., 90% chance that
    |sample mean - true mean| < 2%.

    Args:
        b: Benchmark name, looked up in `_estimated_stddev`.
        confidence: Desired probability, strictly between 0 and 1, that the
            sample mean lands within `margin` of the true mean.
        margin: Tolerated deviation of the sample mean, in the same units
            as the `_estimated_stddev` values. Must be positive.

    Returns:
        1 when no standard-deviation estimate exists for `b`; otherwise the
        computed sample count, but never fewer than 2.

    Raises:
        ValueError: If `confidence` is not in (0, 1) or `margin` is not
            positive.
    """
    if not 0.0 < confidence < 1.0:
        raise ValueError(
            f"confidence must be strictly between 0 and 1, got {confidence!r}"
        )
    if margin <= 0:
        raise ValueError(f"margin must be positive, got {margin!r}")

    stddev = _estimated_stddev.get(b)
    if stddev is None:
        # No estimate for this benchmark: fall back to a single iteration.
        return 1

    # Two-sided interval: split the tail probability evenly between sides.
    z_score = isf((1 - confidence) / 2)
    n = int(math.ceil((z_score * stddev / margin) ** 2))
    # Get at least 2 samples so as to calculate standard deviation, which is
    # needed in T-test for p-value.
    return max(n, 2)
*760c253cSXin Li
*760c253cSXin Li
class Benchmark:
    """Class representing a benchmark to be run.

    Contains details of the benchmark suite, arguments to pass to the suite,
    iterations to run the benchmark suite and so on. Note that the benchmark name
    can be different to the test suite name. For example, you may want to have
    two different benchmarks which run the same test_name with different
    arguments.
    """

    def __init__(
        self,
        name,
        test_name,
        test_args,
        iterations,
        rm_chroot_tmp,
        perf_args,
        suite="",
        show_all_results=False,
        retries=0,
        run_local=False,
        cwp_dso="",
        weight=0,
    ):
        """Store the benchmark configuration on the instance.

        Args:
            name: Benchmark name. Also used to look up a default iteration
                count when `iterations` is not positive.
            test_name: Name of the test to run. For telemetry, this is the
                benchmark name.
            test_args: Arguments for the test. For telemetry, this is the
                data.
            iterations: Number of iterations. When not greater than 0, the
                count is taken from `_samples(name)` instead.
            rm_chroot_tmp: Stored unchanged; not interpreted here.
            perf_args: Stored unchanged; not interpreted here.
            suite: Suite name. "telemetry" forces `show_all_results` to
                True; "telemetry_Crosperf" is the only suite for which
                `run_local` is accepted.
            show_all_results: Stored unchanged unless `suite` is
                "telemetry".
            retries: Stored unchanged; not interpreted here.
            run_local: Only allowed when `suite` is "telemetry_Crosperf".
            cwp_dso: Stored unchanged; not interpreted here.
            weight: Stored unchanged; not interpreted here.

        Raises:
            RuntimeError: If `run_local` is truthy and `suite` is not
                "telemetry_Crosperf".
        """
        self.name = name
        # For telemetry, this is the benchmark name.
        self.test_name = test_name
        # For telemetry, this is the data.
        self.test_args = test_args
        # A non-positive request means "pick a statistically sensible default".
        self.iterations = iterations if iterations > 0 else _samples(name)
        self.perf_args = perf_args
        self.rm_chroot_tmp = rm_chroot_tmp
        # Always starts False; nothing in this class sets it afterwards.
        self.iteration_adjusted = False
        self.suite = suite
        self.show_all_results = show_all_results
        self.retries = retries
        if self.suite == "telemetry":
            self.show_all_results = True
        if run_local and self.suite != "telemetry_Crosperf":
            raise RuntimeError(
                "run_local is only supported by telemetry_Crosperf."
            )
        self.run_local = run_local
        self.cwp_dso = cwp_dso
        self.weight = weight