toolchain-utils/afdo_redaction/remove_cold_functions.py

*760c253cSXin Li#!/usr/bin/env python3
*760c253cSXin Li# -*- coding: utf-8 -*-
*760c253cSXin Li# Copyright 2020 The ChromiumOS Authors
*760c253cSXin Li# Use of this source code is governed by a BSD-style license that can be
*760c253cSXin Li# found in the LICENSE file.
*760c253cSXin Li
"""Script to remove cold functions in a textual AFDO profile.
*760c253cSXin Li
*760c253cSXin LiThe script will look through the AFDO profile to find all the function
*760c253cSXin Lirecords. Then it'll start with the functions with lowest sample count and
*760c253cSXin Liremove it from the profile, until the total remaining functions in the
*760c253cSXin Liprofile meets the given number. When there are many functions having the
*760c253cSXin Lisame sample count, we need to remove all of them in order to meet the
*760c253cSXin Litarget, so the result profile will always have less than or equal to the
*760c253cSXin Ligiven number of functions.
*760c253cSXin Li
The script is intended to be used on production ChromeOS profiles, after
other redaction/trimming scripts. It can be used with given textual CWP
and benchmark profiles, in order to analyze how many removed functions are
from which profile (or both), which can be used as an indicator of fairness
during the removal.
*760c253cSXin Li
This is part of the effort to stabilize the impact of AFDO profile on
Chrome binary size. See crbug.com/1062014 for more context.
*760c253cSXin Li"""
*760c253cSXin Li
*760c253cSXin Li
*760c253cSXin Liimport argparse
*760c253cSXin Liimport collections
*760c253cSXin Liimport re
*760c253cSXin Liimport sys
*760c253cSXin Li
*760c253cSXin Li
# Matches a function header line of the form "<name>:<digits>" with an optional
# trailing ":<digits>" field. Group 1 captures the name (word characters plus
# "$", "." and "@"); group 2 captures the first number.
_function_line_re = re.compile(r"^([\w\$\.@]+):(\d+)(?::\d+)?$")

# One parsed function record:
#   function_count: the integer parsed from the function header line.
#   function_body:  the header line followed by its sample lines, as strings.
#   function_name:  the name parsed from the function header line.
ProfileRecord = collections.namedtuple(
    "ProfileRecord", "function_count function_body function_name"
)
*760c253cSXin Li
*760c253cSXin Li
def _read_sample_count(line):
    """Extracts the function name and sample count from a function line.

    Args:
        line: A function header line such as "main:1234:5" or "main:1234".

    Returns:
        A (name, count) tuple: the text before the first colon and the first
        number after it, converted to int.

    Raises:
        AssertionError: If `line` does not match the function line pattern.
    """
    m = _function_line_re.match(line)
    if m is None:
        # Raised explicitly instead of through `assert` so that malformed
        # input is still rejected when Python runs with -O.
        raise AssertionError("Failed to interpret function line %s" % line)
    return m.group(1), int(m.group(2))
*760c253cSXin Li
*760c253cSXin Li
def _read_textual_afdo_profile(stream):
    """Parses an AFDO profile from a line stream into ProfileRecords.

    Every line is right-stripped and blank lines are skipped. A line whose
    first character is whitespace is a sample line belonging to the most
    recent function line; any other line starts a new function record.

    Args:
        stream: An iterable of text lines (e.g. an open file).

    Returns:
        A list of ProfileRecord, in the order their function lines appear.

    Raises:
        AssertionError: If a sample line appears before any function line.
        Errors raised by _read_sample_count for a malformed function line
        propagate unchanged.
    """
    # ProfileRecords are actually nested, due to inlining. For the purpose of
    # this script, that doesn't matter.
    ret = []

    def add_record(header, body_samples):
        """Appends the record described by `header` and its samples."""
        name, count = _read_sample_count(header)
        ret.append(
            ProfileRecord(
                function_count=count,
                function_body=[header] + body_samples,
                function_name=name,
            )
        )

    function_line = None
    samples = []
    for line in (raw.rstrip() for raw in stream):
        if not line:
            continue

        if line[0].isspace():
            if function_line is None:
                # Raised explicitly instead of through `assert`: with -O an
                # assert vanishes and the stray sample would be silently lost.
                raise AssertionError("sample exists outside of a function?")
            samples.append(line)
            continue

        # A new function line closes the record collected so far.
        if function_line is not None:
            add_record(function_line, samples)
        function_line = line
        samples = []

    # The final record has no following function line to close it.
    if function_line is not None:
        add_record(function_line, samples)
    return ret
*760c253cSXin Li
*760c253cSXin Li
def write_textual_afdo_profile(stream, records):
    """Writes each record's body lines to `stream`, one line per entry.

    Args:
        stream: A writable text stream.
        records: An iterable of objects with a `function_body` list of strings.
    """
    rendered = ("\n".join(record.function_body) for record in records)
    for text in rendered:
        print(text, file=stream)
*760c253cSXin Li
*760c253cSXin Li
def analyze_functions(records, cwp, benchmark):
    """Classifies the functions in `records` by which profile they come from.

    Args:
        records: Iterable of records (with `function_name`) to classify.
        cwp: Iterable of records from the CWP profile.
        benchmark: Iterable of records from the benchmark profile.

    Returns:
        A (cwp_only, benchmark_only, common) tuple of counts of the distinct
        function names in `records` that appear only in `cwp`, only in
        `benchmark`, and in both, respectively.

    Raises:
        AssertionError: If some function in `records` appears in neither
            `cwp` nor `benchmark`.
    """
    cwp_names = {rec.function_name for rec in cwp}
    benchmark_names = {rec.function_name for rec in benchmark}
    names = {rec.function_name for rec in records}

    # Restrict both reference sets to the names we were asked about.
    in_cwp = names & cwp_names
    in_benchmark = names & benchmark_names

    unaccounted = names - in_benchmark - in_cwp
    assert not len(unaccounted)

    return (
        len(in_cwp - in_benchmark),
        len(in_benchmark - in_cwp),
        len(in_cwp & in_benchmark),
    )
*760c253cSXin Li
*760c253cSXin Li
def _percent(part, whole):
    """Returns `part` as a percentage of `whole`, or 0.0 if `whole` is 0."""
    return 100.0 * part / whole if whole else 0.0


def run(input_stream, output_stream, goal, cwp=None, benchmark=None):
    """Trims the profile down to its `goal` hottest functions.

    Records are ranked by descending sample count, with ties broken by
    ascending function name, and only the first `goal` are written out.
    A summary is printed to stderr. When both `cwp` and `benchmark` are
    given, a per-origin breakdown of the retained functions is printed too.

    Args:
        input_stream: Iterable of lines of the textual profile to trim.
        output_stream: Writable text stream receiving the trimmed profile.
        goal: Number of functions to retain; must be positive.
        cwp: Optional line stream of the textual CWP profile.
        benchmark: Optional line stream of the textual benchmark profile.

    Raises:
        AssertionError: If the profile is non-empty and `goal` is zero or
            negative, or if the profiles fail to parse or to be analyzed.
    """
    records = _read_textual_afdo_profile(input_stream)
    num_functions = len(records)
    if not num_functions:
        # Nothing to trim; an empty profile produces no output at all.
        return
    # Raised explicitly (not via `assert`) so the checks survive `python -O`.
    if not goal:
        raise AssertionError(
            "It's invalid to remove all functions in the profile"
        )
    if goal < 0:
        # A negative slice bound would silently keep the wrong functions.
        raise AssertionError(
            "The number of functions to retain must be positive, got %d" % goal
        )

    analyze = bool(cwp and benchmark)
    if analyze:
        cwp_records = _read_textual_afdo_profile(cwp)
        benchmark_records = _read_textual_afdo_profile(benchmark)
        before = analyze_functions(records, cwp_records, benchmark_records)

    records.sort(key=lambda x: (-x.function_count, x.function_name))
    records = records[:goal]

    print(
        "Retained %d/%d (%.1f%%) functions in the profile"
        % (len(records), num_functions, _percent(len(records), num_functions)),
        file=sys.stderr,
    )
    write_textual_afdo_profile(output_stream, records)

    if analyze:
        after = analyze_functions(records, cwp_records, benchmark_records)
        categories = (
            "only appear in the CWP profile",
            "only appear in the benchmark profile",
            "appear in both CWP and benchmark profiles",
        )
        # A category may have had no functions to begin with; _percent keeps
        # that case from raising ZeroDivisionError.
        for category, kept, total in zip(categories, after, before):
            print(
                "Retained %d/%d (%.1f%%) functions %s"
                % (kept, total, _percent(kept, total), category),
                file=sys.stderr,
            )
*760c253cSXin Li
*760c253cSXin Li
def main():
    """Parses the command line and trims the requested profile.

    Reads the profile from --input, writes the trimmed profile to --output,
    and retains --number functions. When both --cwp and --benchmark are
    given, their contents are passed along for the per-origin analysis.
    Invalid flag combinations are reported through the argument parser's
    error handling.
    """
    parser = argparse.ArgumentParser(
        description=__doc__,
        formatter_class=argparse.RawDescriptionHelpFormatter,
    )
    parser.add_argument(
        "--input",
        default="/dev/stdin",
        help="File to read from. Defaults to stdin.",
    )
    parser.add_argument(
        "--output",
        default="/dev/stdout",
        help="File to write to. Defaults to stdout.",
    )
    parser.add_argument(
        "--number",
        type=int,
        required=True,
        help="Number of functions to retain in the profile.",
    )
    parser.add_argument(
        "--cwp", help="Textualized CWP profiles, used for further analysis"
    )
    parser.add_argument(
        "--benchmark",
        help="Textualized benchmark profile, used for further analysis",
    )
    args = parser.parse_args()

    # A non-positive count is never a meaningful number of functions to keep.
    if args.number <= 0:
        parser.error(
            "--number must be positive; it's invalid to reduce the number of "
            "functions to 0 or below."
        )

    # The analysis needs both reference profiles or neither.
    if bool(args.cwp) != bool(args.benchmark):
        parser.error("Please specify both --cwp and --benchmark")

    with open(args.input) as input_stream, open(
        args.output, "w"
    ) as output_stream:
        # When user specify textualized cwp and benchmark profiles, perform
        # the analysis. Otherwise, just trim the cold functions from profile.
        if args.cwp and args.benchmark:
            with open(args.cwp) as cwp, open(args.benchmark) as benchmark:
                run(input_stream, output_stream, args.number, cwp, benchmark)
        else:
            run(input_stream, output_stream, args.number)


if __name__ == "__main__":
    main()