_autoserv (revision 9c5db1993ded3edbeafc8092d69fe5de2ee02df7) - OpenGrok cross reference for /aosp_15_r20/external/autotest/server/_autoserv

*9c5db199SXin Li#!/usr/bin/python3 -u
*9c5db199SXin Li# Copyright 2007-2008 Martin J. Bligh <[email protected]>, Google Inc.
*9c5db199SXin Li# Released under the GPL v2
*9c5db199SXin Li
*9c5db199SXin Li"""
*9c5db199SXin LiRun a control file through the server side engine
*9c5db199SXin Li"""
*9c5db199SXin Li
*9c5db199SXin Liimport datetime
*9c5db199SXin Liimport contextlib
*9c5db199SXin Liimport getpass
*9c5db199SXin Liimport logging
*9c5db199SXin Liimport os
*9c5db199SXin Liimport re
*9c5db199SXin Liimport shutil
*9c5db199SXin Liimport signal
*9c5db199SXin Liimport socket
*9c5db199SXin Liimport sys
*9c5db199SXin Liimport traceback
*9c5db199SXin Liimport time
*9c5db199SXin Liimport six
*9c5db199SXin Lifrom six.moves import urllib
*9c5db199SXin Li
*9c5db199SXin Liimport common
*9c5db199SXin Lifrom autotest_lib.client.bin.result_tools import utils as result_utils
*9c5db199SXin Lifrom autotest_lib.client.bin.result_tools import view as result_view
*9c5db199SXin Lifrom autotest_lib.client.common_lib import control_data
*9c5db199SXin Lifrom autotest_lib.client.common_lib import autotest_enum
*9c5db199SXin Lifrom autotest_lib.client.common_lib import error
*9c5db199SXin Lifrom autotest_lib.client.common_lib import global_config
*9c5db199SXin Lifrom autotest_lib.client.common_lib import host_queue_entry_states
*9c5db199SXin Lifrom autotest_lib.client.common_lib import host_states
*9c5db199SXin Lifrom autotest_lib.client.common_lib import seven
*9c5db199SXin Lifrom autotest_lib.server.cros.dynamic_suite import suite
*9c5db199SXin Li
*9c5db199SXin Litry:
*9c5db199SXin Li    from autotest_lib.utils.frozen_chromite.lib import metrics
*9c5db199SXin Li    from autotest_lib.utils.frozen_chromite.lib import cloud_trace
*9c5db199SXin Liexcept ImportError as e:
*9c5db199SXin Li    from autotest_lib.client.common_lib import utils as common_utils
*9c5db199SXin Li    metrics = common_utils.metrics_mock
*9c5db199SXin Li    import mock
*9c5db199SXin Li    cloud_trace = mock.MagicMock()
*9c5db199SXin Li
*9c5db199SXin Li# Number of seconds to wait before returning if testing mode is enabled
*9c5db199SXin LiTESTING_MODE_SLEEP_SECS = 1
*9c5db199SXin Li
*9c5db199SXin Li
*9c5db199SXin Lifrom autotest_lib.server import frontend
*9c5db199SXin Lifrom autotest_lib.server import server_logging_config
*9c5db199SXin Lifrom autotest_lib.server import server_job, utils, autoserv_parser, autotest
*9c5db199SXin Lifrom autotest_lib.server import utils as server_utils
*9c5db199SXin Lifrom autotest_lib.server import site_utils
*9c5db199SXin Lifrom autotest_lib.server.cros.dynamic_suite import frontend_wrappers
*9c5db199SXin Lifrom autotest_lib.site_utils import job_directories
*9c5db199SXin Lifrom autotest_lib.site_utils import lxc
*9c5db199SXin Lifrom autotest_lib.site_utils.lxc import utils as lxc_utils
*9c5db199SXin Lifrom autotest_lib.client.common_lib import pidfile, logging_manager
*9c5db199SXin Li
*9c5db199SXin Li
# Control segment to stage server-side package. The path is resolved by
# server_job._control_segment_path and the file is executed by _stage_ssp.
STAGE_SERVER_SIDE_PACKAGE_CONTROL_FILE = server_job._control_segment_path(
        'stage_server_side_package')

# Command line to start servod in a moblab. The two %s placeholders are filled
# with the board name and the servo port, in that order.
START_SERVOD_CMD = 'sudo start servod BOARD=%s PORT=%s'
# Command line to stop servod in a moblab.
STOP_SERVOD_CMD = 'sudo stop servod'

# Parent of the directory that holds this file, with symlinks resolved.
_AUTOTEST_ROOT = os.path.realpath(os.path.join(os.path.dirname(__file__), '..'))
# File name given to the control file that _stage_control_file copies into the
# results directory.
_CONTROL_FILE_FROM_CONTROL_NAME = 'control.from_control_name'

# Job folder name handed to the container setup and used to build the results
# path inside the container.
_LXC_JOB_FOLDER = 'lxc_job_folder'
*9c5db199SXin Li
def log_alarm(signum, frame):
    """Signal handler that logs the alarm and terminates the process.

    @param signum: Number of the delivered signal (unused).
    @param frame: Stack frame that was interrupted (unused).

    @raises SystemExit: always, with exit status 1.
    """
    # The handler terminates the process, so the log line must not claim the
    # signal is being ignored.
    logging.error("Received SIGALARM. Exiting with status 1.")
    sys.exit(1)
*9c5db199SXin Li
*9c5db199SXin Li
*9c5db199SXin Lidef _get_companions(parser):
*9c5db199SXin Li    """Get a list of companion devices from command line arg -ch.
*9c5db199SXin Li
*9c5db199SXin Li    @param parser: Parser for the command line arguments.
*9c5db199SXin Li
*9c5db199SXin Li    @return: A list of companion devices from command line arg -ch.
*9c5db199SXin Li    """
*9c5db199SXin Li    if parser.options.companion_hosts:
*9c5db199SXin Li        companions = parser.options.companion_hosts.replace(',', ' ').strip().split()
*9c5db199SXin Li    else:
*9c5db199SXin Li        companions = []
*9c5db199SXin Li
*9c5db199SXin Li    if companions:
*9c5db199SXin Li        for companion in companions:
*9c5db199SXin Li            if not companion or re.search('\s', companion):
*9c5db199SXin Li                parser.parser.error("Invalid companion: %s" % str(companion))
*9c5db199SXin Li        companions = list(set(companions))
*9c5db199SXin Li        companions.sort()
*9c5db199SXin Li    return companions
*9c5db199SXin Li
*9c5db199SXin Li
*9c5db199SXin Lidef _get_dutservers(parser):
*9c5db199SXin Li    """Get a list of DUT server addresses from command line arg --dut_servers.
*9c5db199SXin Li
*9c5db199SXin Li    @param parser: Parser for the command line arguments.
*9c5db199SXin Li
*9c5db199SXin Li    @return: A list of DUT server addresses from command line arg
*9c5db199SXin Li             --dut_servers.
*9c5db199SXin Li    """
*9c5db199SXin Li    if parser.options.dut_servers:
*9c5db199SXin Li        dut_servers = parser.options.dut_servers.replace(
*9c5db199SXin Li            ',', ' ').strip().split()
*9c5db199SXin Li    else:
*9c5db199SXin Li        dut_servers = []
*9c5db199SXin Li
*9c5db199SXin Li    if dut_servers:
*9c5db199SXin Li        for dut_server in dut_servers:
*9c5db199SXin Li            if not dut_server or re.search('\s', dut_server):
*9c5db199SXin Li                parser.parser.error(
*9c5db199SXin Li                    "Invalid DUT Server address: %s" % str(dut_server))
*9c5db199SXin Li        dut_servers = list(set(dut_servers))
*9c5db199SXin Li        dut_servers.sort()
*9c5db199SXin Li    return dut_servers
*9c5db199SXin Li
*9c5db199SXin Li
*9c5db199SXin Lidef _get_machines(parser):
*9c5db199SXin Li    """Get a list of machine names from command line arg -m or a file.
*9c5db199SXin Li
*9c5db199SXin Li    @param parser: Parser for the command line arguments.
*9c5db199SXin Li
*9c5db199SXin Li    @return: A list of machine names from command line arg -m or the
*9c5db199SXin Li             machines file specified in the command line arg -M.
*9c5db199SXin Li    """
*9c5db199SXin Li    if parser.options.machines:
*9c5db199SXin Li        machines = parser.options.machines.replace(',', ' ').strip().split()
*9c5db199SXin Li    else:
*9c5db199SXin Li        machines = []
*9c5db199SXin Li    machines_file = parser.options.machines_file
*9c5db199SXin Li    if machines_file:
*9c5db199SXin Li        machines = []
*9c5db199SXin Li        for m in open(machines_file, 'r').readlines():
*9c5db199SXin Li            # remove comments, spaces
*9c5db199SXin Li            m = re.sub('#.*', '', m).strip()
*9c5db199SXin Li            if m:
*9c5db199SXin Li                machines.append(m)
*9c5db199SXin Li        logging.debug('Read list of machines from file: %s', machines_file)
*9c5db199SXin Li        logging.debug('Machines: %s', ','.join(machines))
*9c5db199SXin Li
*9c5db199SXin Li    if machines:
*9c5db199SXin Li        for machine in machines:
*9c5db199SXin Li            if not machine or re.search('\s', machine):
*9c5db199SXin Li                parser.parser.error("Invalid machine: %s" % str(machine))
*9c5db199SXin Li        machines = list(set(machines))
*9c5db199SXin Li        machines.sort()
*9c5db199SXin Li    return machines
*9c5db199SXin Li
*9c5db199SXin Li
def _stage_ssp(parser, resultsdir):
    """Stage the server-side package (SSP) for this autoserv run.

    Executes the stage_server_side_package control segment with the machine
    dictionaries and the requested test source build, then reads the staged
    package url back from the variables the segment leaves behind.

    A missing package is reported through the logs and a falsy url is
    returned; any exception raised while building the machine dictionaries or
    executing the control segment propagates to the caller.

    @param parser: Command line arguments parser passed in the autoserv process.
    @param resultsdir: Folder to store results. It is joined with
            parser.options.host_info_subdir to locate the host info store.

    @return: url to the autotest server-side package, or the falsy value set
            by the control segment when no package could be staged.
    """
    options = parser.options
    machine_names = _get_machines(parser)
    machine_dicts = server_job.get_machine_dicts(
            machine_names=machine_names,
            store_dir=os.path.join(resultsdir, options.host_info_subdir),
            in_lab=options.lab,
            use_shadow_store=not options.local_only_host_info,
            host_attributes=options.host_attributes,
    )

    # The control segment reads its inputs from these globals and publishes
    # 'ssp_url' (and 'error_msg' on failure) into the locals dictionary.
    segment_globals = {
            'machines': machine_dicts,
            'image': options.test_source_build,
    }
    segment_locals = {}
    seven.exec_file(
        STAGE_SERVER_SIDE_PACKAGE_CONTROL_FILE,
        globals_=segment_globals,
        locals_=segment_locals,
    )

    ssp_url = segment_locals['ssp_url']
    if ssp_url:
        return ssp_url

    logging.error('Failed to stage SSP package: %s',
                  segment_locals['error_msg'])
    logging.error('This job will fail later, when attempting to run with'
                  ' SSP')
    return ssp_url
*9c5db199SXin Li
*9c5db199SXin Li
def _run_with_ssp(job, container_id, job_id, results, parser, ssp_url,
                  machines):
    """Run the server job with server-side packaging.

    Sets up a test container, rewrites the current autoserv command line so
    that it is valid inside the container, runs it there, and destroys the
    container afterwards.

    @param job: The server job object.
    @param container_id: ID of the container to run the test.
    @param job_id: ID of the test job.
    @param results: Folder to store results. This could be different from
                    parser.options.results:
                    parser.options.results  can be set to None for results to be
                    stored in a temp folder.
                    results can be None if the autoserv run requires no logging.
    @param parser: Command line parser that contains the options.
    @param ssp_url: url of the staged server-side package.
    @param machines: A list of machines to run the test.

    @raises error.AutoservError: if ssp_url is empty.
    @raises error.AutoservSSPError: if the container could not be set up.
    @raises Exception: whatever the run inside the container raised.
    """
    if not ssp_url:
        job.record('FAIL', None, None,
                   'Failed to stage server-side package')
        raise error.AutoservError('Failed to stage server-side package')

    bucket = lxc.ContainerBucket(
            base_name=_ssp_base_image_name_or_default(parser.options))
    control = (parser.args[0] if len(parser.args) > 0 and parser.args[0] != ''
               else None)
    try:
        dut_name = machines[0] if len(machines) >= 1 else None
        test_container = bucket.setup_test(container_id, job_id, ssp_url,
                                           results, control=control,
                                           job_folder=_LXC_JOB_FOLDER,
                                           dut_name=dut_name)
    except Exception as e:
        job.record('START', None, None, 'Starting SSP')
        job.record('END ABORT', None, None,
                   'Failed to setup container for test: %s. Check logs in '
                   'ssp_logs folder for more details.' % e)
        raise error.AutoservSSPError

    args = sys.argv[:]
    args.remove('--require-ssp')
    # --parent_job_id is only useful in autoserv running in host, not in
    # container. Include this argument will cause test to fail for builds before
    # CL 286265 was merged.
    if '--parent_job_id' in args:
        index = args.index('--parent_job_id')
        args.remove('--parent_job_id')
        # After the flag is removed its value sits at the same index.
        del args[index]

    # A dictionary of paths to replace in the command line. Key is the path to
    # be replaced with the one in value.
    paths_to_replace = {}
    # Replace the control file path with the one in container.
    if control:
        container_control_filename = os.path.join(
                lxc.CONTROL_TEMP_PATH, os.path.basename(control))
        paths_to_replace[control] = container_control_filename
    # Update result directory with the one in container.
    container_result_dir = lxc.RESULT_DIR_FMT % _LXC_JOB_FOLDER
    if parser.options.results:
        paths_to_replace[parser.options.results] = container_result_dir
    args = [paths_to_replace.get(arg, arg) for arg in args]

    # Apply --use-existing-results, results directory is already created and
    # mounted in container. Apply this arg to avoid exception being raised.
    if '--use-existing-results' not in args:
        args.append('--use-existing-results')

    # Make sure autoserv running in container using a different pid file.
    if '--pidfile-label' not in args:
        args.extend(['--pidfile-label', 'container_autoserv'])

    # Only arguments containing a space are wrapped in single quotes.
    cmd_line = ' '.join(["'%s'" % arg if ' ' in arg else arg for arg in args])
    logging.info('Run command in container: %s', cmd_line)
    success = False
    try:
        test_container.attach_run(cmd_line)
        success = True
    except Exception as e:
        # If the test run inside container fails without generating any log,
        # write a message to status.log to help troubleshooting.
        # A missing results folder or debug directory counts as "no logs";
        # listing it blindly would raise and mask the real failure.
        debug_dir = os.path.join(results, 'debug') if results else None
        if debug_dir and os.path.isdir(debug_dir):
            debug_files = os.listdir(debug_dir)
        else:
            debug_files = []
        if not debug_files:
            job.record('FAIL', None, None,
                       'Failed to run test inside the container: %s. Check '
                       'logs in ssp_logs folder for more details.' % e)
        raise
    finally:
        metrics.Counter(
            'chromeos/autotest/experimental/execute_job_in_ssp').increment(
                fields={'success': success})
        test_container.destroy()
*9c5db199SXin Li
*9c5db199SXin Li
def correct_results_folder_permission(results):
    """Hand ownership of the results folder to the current user and group.

    For tests running with server-side packaging, the results folder has the
    owner of root. Ownership is changed recursively to the uid and gid of the
    autoserv process, so parsing job can access the results folder.
    TODO(dshi): crbug.com/459344 Remove this function when test container can be
    unprivileged container.

    @param results: Path to the results folder. Nothing is done when it is
                    empty or None.

    """
    if results:
        ownership_changes = (('chown', os.getuid()), ('chgrp', os.getgid()))
        for tool, owner_id in ownership_changes:
            utils.run('sudo -n %s -R %s "%s"' % (tool, owner_id, results))
*9c5db199SXin Li
*9c5db199SXin Li
def _start_servod(machine):
    """Try to start servod in moblab if it's not already running or running with
    different board or port.

    This is best effort: failures to query the AFE or to start servod are
    logged and the function returns normally.

    @param machine: Name of the dut used for test.
    """
    if not utils.is_moblab():
        return

    logging.debug('Trying to start servod.')
    try:
        afe = frontend.AFE()
        board = server_utils.get_board_from_afe(machine, afe)
        hosts = afe.get_hosts(hostname=machine)
        if not hosts:
            # Without a host record there are no servo attributes to read.
            logging.error('Host %s is not found in AFE. Start servod is '
                          'aborted', machine)
            return
        host_attributes = hosts[0].attributes
        servo_host = host_attributes.get('servo_host', None)
        servo_port = host_attributes.get('servo_port', 9999)
        if servo_host not in ('localhost', '127.0.0.1'):
            logging.warning('Starting servod is aborted. The dut\'s servo_host '
                         'attribute is not set to localhost.')
            return
    except (urllib.error.HTTPError, urllib.error.URLError):
        # Ignore error if RPC failed to get board
        logging.error('Failed to get board name from AFE. Start servod is '
                      'aborted')
        return

    try:
        pid = utils.run('pgrep servod').stdout
        cmd_line = utils.run('ps -fp %s' % pid).stdout
        if ('--board %s' % board in cmd_line and
            '--port %s' % servo_port in cmd_line):
            logging.debug('Servod is already running with given board and port.'
                          ' There is no need to restart servod.')
            return
        logging.debug('Servod is running with different board or port. '
                      'Stopping existing servod.')
        # Use the shared constant rather than repeating the command literal.
        utils.run(STOP_SERVOD_CMD)
    except error.CmdError:
        # servod is not running.
        pass

    try:
        utils.run(START_SERVOD_CMD % (board, servo_port))
        logging.debug('Servod is started')
    except error.CmdError as e:
        logging.error('Servod failed to be started, error: %s', e)
*9c5db199SXin Li
*9c5db199SXin Li
def _control_path_on_disk(control_name):
    """Find the control file corresponding to the given control name, on disk.

    @param control_name: NAME attribute of the control file to fetch. It is
                         matched literally and in full.
    @return: Path to the control file.

    @raises error.AutoservError: if no control file, or more than one control
                                 file, has the given NAME.
    """
    cf_getter = suite.create_fs_getter(_AUTOTEST_ROOT)
    # Escape the name so characters such as '.' are matched literally instead
    # of being interpreted as regular expression syntax.
    control_name_predicate = suite.test_name_matches_pattern_predicate(
            '^%s$' % re.escape(control_name))
    tests = suite.find_and_parse_tests(cf_getter, control_name_predicate)
    if not tests:
        raise error.AutoservError(
                'Failed to find any control files with NAME %s' % control_name)
    if len(tests) > 1:
        logging.error('Found more than one control file with NAME %s: %s',
                      control_name, [t.path for t in tests])
        raise error.AutoservError(
                'Found more than one control file with NAME %s' % control_name)
    return tests[0].path
*9c5db199SXin Li
*9c5db199SXin Li
def _stage_control_file(control_name, results_dir):
    """Copy the named control file from the local checkout into the results.

    The control file is looked up by name first; the copy (made with
    shutil.copy2) is always named after _CONTROL_FILE_FROM_CONTROL_NAME.

    @param control_name: Name of the control file to stage.
    @param results_dir: Results directory to stage the control file into.
    @return: Path to the staged control file inside results_dir.
    """
    source_path = _control_path_on_disk(control_name)
    staged_path = os.path.join(results_dir, _CONTROL_FILE_FROM_CONTROL_NAME)
    shutil.copy2(source_path, staged_path)
    return staged_path
*9c5db199SXin Li
*9c5db199SXin Li
*9c5db199SXin Lidef run_autoserv(pid_file_manager, results, parser, ssp_url, use_ssp):
*9c5db199SXin Li    """Run server job with given options.
*9c5db199SXin Li
*9c5db199SXin Li    @param pid_file_manager: PidFileManager used to monitor the autoserv process
*9c5db199SXin Li    @param results: Folder to store results.
*9c5db199SXin Li    @param parser: Parser for the command line arguments.
*9c5db199SXin Li    @param ssp_url: Url to server-side package.
*9c5db199SXin Li    @param use_ssp: Set to True to run with server-side packaging.
*9c5db199SXin Li    """
*9c5db199SXin Li    # send stdin to /dev/null
*9c5db199SXin Li    dev_null = os.open(os.devnull, os.O_RDONLY)
*9c5db199SXin Li    os.dup2(dev_null, sys.stdin.fileno())
*9c5db199SXin Li    os.close(dev_null)
*9c5db199SXin Li
*9c5db199SXin Li    # Create separate process group if the process is not a process group
*9c5db199SXin Li    # leader. This allows autoserv process to keep running after the caller
*9c5db199SXin Li    # process (drone manager call) exits.
*9c5db199SXin Li    if os.getpid() != os.getpgid(0):
*9c5db199SXin Li        os.setsid()
*9c5db199SXin Li
*9c5db199SXin Li    # Container name is predefined so the container can be destroyed in
*9c5db199SXin Li    # handle_sigterm.
*9c5db199SXin Li    job_or_task_id = job_directories.get_job_id_or_task_id(
*9c5db199SXin Li            parser.options.results)
*9c5db199SXin Li    container_id = lxc.ContainerId(job_or_task_id, time.time(), os.getpid())
*9c5db199SXin Li
*9c5db199SXin Li    # Implement SIGTERM handler
*9c5db199SXin Li    def handle_sigterm(signum, frame):
*9c5db199SXin Li        logging.debug('Received SIGTERM')
*9c5db199SXin Li        if pid_file_manager:
*9c5db199SXin Li            pid_file_manager.close_file(1, signal.SIGTERM)
*9c5db199SXin Li        logging.debug('Finished writing to pid_file. Killing process.')
*9c5db199SXin Li
*9c5db199SXin Li        # Update results folder's file permission. This needs to be done ASAP
*9c5db199SXin Li        # before the parsing process tries to access the log.
*9c5db199SXin Li        if use_ssp and results:
*9c5db199SXin Li            correct_results_folder_permission(results)
*9c5db199SXin Li
*9c5db199SXin Li        # This sleep allows the pending output to be logged before the kill
*9c5db199SXin Li        # signal is sent.
*9c5db199SXin Li        time.sleep(.1)
*9c5db199SXin Li        if use_ssp:
*9c5db199SXin Li            logging.debug('Destroy container %s before aborting the autoserv '
*9c5db199SXin Li                          'process.', container_id)
*9c5db199SXin Li            try:
*9c5db199SXin Li                bucket = lxc.ContainerBucket(
*9c5db199SXin Li                        base_name=_ssp_base_image_name_or_default(
*9c5db199SXin Li                                parser.options))
*9c5db199SXin Li                container = bucket.get_container(container_id)
*9c5db199SXin Li                if container:
*9c5db199SXin Li                    container.destroy()
*9c5db199SXin Li                    logging.debug("Container %s destroyed.", container_id)
*9c5db199SXin Li                else:
*9c5db199SXin Li                    logging.debug('Container %s is not found.', container_id)
*9c5db199SXin Li                    bucket.scrub_container_location(container_id)
*9c5db199SXin Li            except:
*9c5db199SXin Li                # Handle any exception so the autoserv process can be aborted.
*9c5db199SXin Li                logging.exception('Failed to destroy container %s.',
*9c5db199SXin Li                                  container_id)
*9c5db199SXin Li            # Try to correct the result file permission again after the
*9c5db199SXin Li            # container is destroyed, as the container might have created some
*9c5db199SXin Li            # new files in the result folder.
*9c5db199SXin Li            if results:
*9c5db199SXin Li                correct_results_folder_permission(results)
*9c5db199SXin Li
*9c5db199SXin Li        os.killpg(os.getpgrp(), signal.SIGKILL)
*9c5db199SXin Li
*9c5db199SXin Li    # Set signal handler
*9c5db199SXin Li    signal.signal(signal.SIGTERM, handle_sigterm)
*9c5db199SXin Li
*9c5db199SXin Li    # faulthandler is only needed to debug in the Lab and is not avaliable to
*9c5db199SXin Li    # be imported in the chroot as part of VMTest, so Try-Except it.
*9c5db199SXin Li    try:
*9c5db199SXin Li        import faulthandler
*9c5db199SXin Li        faulthandler.register(signal.SIGTERM, all_threads=True, chain=True)
*9c5db199SXin Li        logging.debug('faulthandler registered on SIGTERM.')
*9c5db199SXin Li    except ImportError:
*9c5db199SXin Li        # exc_clear() doesn't exist (nor is needed) in python3
*9c5db199SXin Li        if six.PY2:
*9c5db199SXin Li            sys.exc_clear()
*9c5db199SXin Li
*9c5db199SXin Li    # Ignore SIGTTOU's generated by output from forked children.
*9c5db199SXin Li    signal.signal(signal.SIGTTOU, signal.SIG_IGN)
*9c5db199SXin Li
*9c5db199SXin Li    # If we received a SIGALARM, let's be loud about it.
*9c5db199SXin Li    signal.signal(signal.SIGALRM, log_alarm)
*9c5db199SXin Li
*9c5db199SXin Li    # Server side tests that call shell scripts often depend on $USER being set
*9c5db199SXin Li    # but depending on how you launch your autotest scheduler it may not be set.
*9c5db199SXin Li    os.environ['USER'] = getpass.getuser()
*9c5db199SXin Li
*9c5db199SXin Li    label = parser.options.label
*9c5db199SXin Li    group_name = parser.options.group_name
*9c5db199SXin Li    user = parser.options.user
*9c5db199SXin Li    client = parser.options.client
*9c5db199SXin Li    server = parser.options.server
*9c5db199SXin Li    verify = parser.options.verify
*9c5db199SXin Li    repair = parser.options.repair
*9c5db199SXin Li    cleanup = parser.options.cleanup
*9c5db199SXin Li    provision = parser.options.provision
*9c5db199SXin Li    reset = parser.options.reset
*9c5db199SXin Li    job_labels = parser.options.job_labels
*9c5db199SXin Li    no_tee = parser.options.no_tee
*9c5db199SXin Li    execution_tag = parser.options.execution_tag
*9c5db199SXin Li    ssh_user = parser.options.ssh_user
*9c5db199SXin Li    ssh_port = parser.options.ssh_port
*9c5db199SXin Li    ssh_pass = parser.options.ssh_pass
*9c5db199SXin Li    collect_crashinfo = parser.options.collect_crashinfo
*9c5db199SXin Li    control_filename = parser.options.control_filename
*9c5db199SXin Li    verify_job_repo_url = parser.options.verify_job_repo_url
*9c5db199SXin Li    skip_crash_collection = parser.options.skip_crash_collection
*9c5db199SXin Li    ssh_verbosity = int(parser.options.ssh_verbosity)
*9c5db199SXin Li    ssh_options = parser.options.ssh_options
*9c5db199SXin Li    no_use_packaging = parser.options.no_use_packaging
*9c5db199SXin Li    in_lab = bool(parser.options.lab)
*9c5db199SXin Li    companion_hosts = _get_companions(parser)
*9c5db199SXin Li    dut_servers = _get_dutservers(parser)
*9c5db199SXin Li    is_cft = parser.options.cft
*9c5db199SXin Li    force_full_log_collection = parser.options.force_full_log_collection
*9c5db199SXin Li
*9c5db199SXin Li    # can't be both a client and a server side test
*9c5db199SXin Li    if client and server:
*9c5db199SXin Li        parser.parser.error("Can not specify a test as both server and client!")
*9c5db199SXin Li
*9c5db199SXin Li    if provision and client:
*9c5db199SXin Li        parser.parser.error("Cannot specify provisioning and client!")
*9c5db199SXin Li
*9c5db199SXin Li    is_special_task = (verify or repair or cleanup or collect_crashinfo or
*9c5db199SXin Li                       provision or reset)
*9c5db199SXin Li    use_client_trampoline = False
*9c5db199SXin Li    if parser.options.control_name:
*9c5db199SXin Li        if use_ssp:
*9c5db199SXin Li            # When use_ssp is True, autoserv will be re-executed inside a
*9c5db199SXin Li            # container preserving the --control-name argument. Control file
*9c5db199SXin Li            # will be staged inside the rexecuted autoserv.
*9c5db199SXin Li            control = None
*9c5db199SXin Li        else:
*9c5db199SXin Li            try:
*9c5db199SXin Li                control = _stage_control_file(parser.options.control_name,
*9c5db199SXin Li                                              results)
*9c5db199SXin Li            except error.AutoservError as e:
*9c5db199SXin Li                logging.info("Using client trampoline because of: %s", e)
*9c5db199SXin Li                control = parser.options.control_name
*9c5db199SXin Li                use_client_trampoline = True
*9c5db199SXin Li
*9c5db199SXin Li    elif parser.args:
*9c5db199SXin Li        control = parser.args[0]
*9c5db199SXin Li    else:
*9c5db199SXin Li        if not is_special_task:
*9c5db199SXin Li            parser.parser.error("Missing argument: control file")
*9c5db199SXin Li        control = None
*9c5db199SXin Li
*9c5db199SXin Li    if ssh_verbosity > 0:
*9c5db199SXin Li        # ssh_verbosity is an integer between 0 and 3, inclusive
*9c5db199SXin Li        ssh_verbosity_flag = '-' + 'v' * ssh_verbosity
*9c5db199SXin Li    else:
*9c5db199SXin Li        ssh_verbosity_flag = ''
*9c5db199SXin Li
*9c5db199SXin Li    machines = _get_machines(parser)
*9c5db199SXin Li    if group_name and len(machines) < 2:
*9c5db199SXin Li        parser.parser.error('-G %r may only be supplied with more than one '
*9c5db199SXin Li                            'machine.' % group_name)
*9c5db199SXin Li
*9c5db199SXin Li    logging.debug("Parser.args is %r", parser.args)
*9c5db199SXin Li    try:
*9c5db199SXin Li      logging.debug("Parser.options.args is %r", parser.options.args)
*9c5db199SXin Li    except AttributeError:
*9c5db199SXin Li      logging.debug("No Parser.options.args.")
*9c5db199SXin Li
*9c5db199SXin Li    try:
*9c5db199SXin Li      logging.debug("Parser.options is %r", parser.options)
*9c5db199SXin Li    except AttributeError:
*9c5db199SXin Li      logging.debug("No Parser.options.")
*9c5db199SXin Li    job_kwargs = {
*9c5db199SXin Li            'control': control,
*9c5db199SXin Li            'args': parser.args[1:],
*9c5db199SXin Li            'resultdir': results,
*9c5db199SXin Li            'label': label,
*9c5db199SXin Li            'user': user,
*9c5db199SXin Li            'machines': machines,
*9c5db199SXin Li            'machine_dict_list': server_job.get_machine_dicts(
*9c5db199SXin Li                    machine_names=machines,
*9c5db199SXin Li                    store_dir=os.path.join(results,
*9c5db199SXin Li                                           parser.options.host_info_subdir),
*9c5db199SXin Li                    in_lab=in_lab,
*9c5db199SXin Li                    use_shadow_store=not parser.options.local_only_host_info,
*9c5db199SXin Li                    host_attributes=parser.options.host_attributes,
*9c5db199SXin Li            ),
*9c5db199SXin Li            'client': client,
*9c5db199SXin Li            'ssh_user': ssh_user,
*9c5db199SXin Li            'ssh_port': ssh_port,
*9c5db199SXin Li            'ssh_pass': ssh_pass,
*9c5db199SXin Li            'ssh_verbosity_flag': ssh_verbosity_flag,
*9c5db199SXin Li            'ssh_options': ssh_options,
*9c5db199SXin Li            'group_name': group_name,
*9c5db199SXin Li            'tag': execution_tag,
*9c5db199SXin Li            'disable_sysinfo': parser.options.disable_sysinfo,
*9c5db199SXin Li            'in_lab': in_lab,
*9c5db199SXin Li            'use_client_trampoline': use_client_trampoline,
*9c5db199SXin Li            'sync_offload_dir': parser.options.sync_offload_dir,
*9c5db199SXin Li            'companion_hosts': server_job.get_machine_dicts(
*9c5db199SXin Li                    machine_names=companion_hosts,
*9c5db199SXin Li                    store_dir=os.path.join(results,
*9c5db199SXin Li                                           parser.options.host_info_subdir),
*9c5db199SXin Li                    in_lab=in_lab,
*9c5db199SXin Li                    use_shadow_store=not parser.options.local_only_host_info,
*9c5db199SXin Li                    host_attributes=parser.options.host_attributes),
*9c5db199SXin Li            'dut_servers': dut_servers,
*9c5db199SXin Li            'is_cft': is_cft,
*9c5db199SXin Li            'force_full_log_collection': force_full_log_collection
*9c5db199SXin Li    }
*9c5db199SXin Li    if parser.options.parent_job_id:
*9c5db199SXin Li        job_kwargs['parent_job_id'] = int(parser.options.parent_job_id)
*9c5db199SXin Li    if control_filename:
*9c5db199SXin Li        job_kwargs['control_filename'] = control_filename
*9c5db199SXin Li    if parser.options.image_storage_server:
*9c5db199SXin Li        global_config.global_config.override_config_value(
*9c5db199SXin Li            'CROS', 'image_storage_server',
*9c5db199SXin Li            os.path.join(parser.options.image_storage_server, ''))
*9c5db199SXin Li
*9c5db199SXin Li    job = server_job.server_job(**job_kwargs)
*9c5db199SXin Li
*9c5db199SXin Li    job.logging.start_logging()
*9c5db199SXin Li
*9c5db199SXin Li    # perform checks
*9c5db199SXin Li    job.precheck()
*9c5db199SXin Li
*9c5db199SXin Li    # run the job
*9c5db199SXin Li    exit_code = 0
*9c5db199SXin Li    auto_start_servod = global_config.global_config.get_config_value(
*9c5db199SXin Li            'AUTOSERV', 'auto_start_servod', type=bool, default=False)
*9c5db199SXin Li
*9c5db199SXin Li    if not utils.is_in_container():
*9c5db199SXin Li        # crbug.com/1054522 -- ts_mon setup is broken inside the SSP container
*9c5db199SXin Li        # due to a problem in the installed python packages.
*9c5db199SXin Li        # Trying to clean up an incorrectly initialized ts_mon state adds a 5
*9c5db199SXin Li        # second overhead in process teardown, so avoid setting up ts_mon
*9c5db199SXin Li        # entirely inside the SSP container.
*9c5db199SXin Li        site_utils.SetupTsMonGlobalState('autoserv', indirect=False,
*9c5db199SXin Li                                         short_lived=True)
*9c5db199SXin Li    try:
*9c5db199SXin Li        try:
*9c5db199SXin Li            if repair:
*9c5db199SXin Li                if auto_start_servod and len(machines) == 1:
*9c5db199SXin Li                    _start_servod(machines[0])
*9c5db199SXin Li                job.repair(job_labels)
*9c5db199SXin Li            elif verify:
*9c5db199SXin Li                job.verify(job_labels)
*9c5db199SXin Li            elif provision:
*9c5db199SXin Li                job.provision(job_labels)
*9c5db199SXin Li            elif reset:
*9c5db199SXin Li                job.reset(job_labels)
*9c5db199SXin Li            elif cleanup:
*9c5db199SXin Li                job.cleanup(job_labels)
*9c5db199SXin Li            else:
*9c5db199SXin Li                if auto_start_servod and len(machines) == 1:
*9c5db199SXin Li                    _start_servod(machines[0])
*9c5db199SXin Li                if use_ssp:
*9c5db199SXin Li                    try:
*9c5db199SXin Li                        _run_with_ssp(job, container_id, job_or_task_id,
*9c5db199SXin Li                                        results, parser, ssp_url, machines)
*9c5db199SXin Li                    finally:
*9c5db199SXin Li                        # Update the ownership of files in result folder.
*9c5db199SXin Li                        correct_results_folder_permission(results)
*9c5db199SXin Li                else:
*9c5db199SXin Li                    if collect_crashinfo:
*9c5db199SXin Li                        # Update the ownership of files in result folder. If the
*9c5db199SXin Li                        # job to collect crashinfo was running inside container
*9c5db199SXin Li                        # (SSP) and crashed before correcting folder permission,
*9c5db199SXin Li                        # the result folder might have wrong permission setting.
*9c5db199SXin Li                        try:
*9c5db199SXin Li                            correct_results_folder_permission(results)
*9c5db199SXin Li                        except:
*9c5db199SXin Li                            # Ignore any error as the user may not have root
*9c5db199SXin Li                            # permission to run sudo command.
*9c5db199SXin Li                            pass
*9c5db199SXin Li                    metric_name = ('chromeos/autotest/experimental/'
*9c5db199SXin Li                                   'autoserv_job_run_duration')
*9c5db199SXin Li                    f = {'in_container': utils.is_in_container(),
*9c5db199SXin Li                         'success': False}
*9c5db199SXin Li                    with metrics.SecondsTimer(metric_name, fields=f) as c:
*9c5db199SXin Li                        job.run(verify_job_repo_url=verify_job_repo_url,
*9c5db199SXin Li                                only_collect_crashinfo=collect_crashinfo,
*9c5db199SXin Li                                skip_crash_collection=skip_crash_collection,
*9c5db199SXin Li                                job_labels=job_labels,
*9c5db199SXin Li                                use_packaging=(not no_use_packaging))
*9c5db199SXin Li                        c['success'] = True
*9c5db199SXin Li
*9c5db199SXin Li        finally:
*9c5db199SXin Li            job.close()
*9c5db199SXin Li    except error.AutoservSSPError:
*9c5db199SXin Li        # Due to the complexity of the TKO parsing/stainless connection, this
*9c5db199SXin Li        # must be 0 so that the "abort" is actually reflected on stainless.
*9c5db199SXin Li        exit_code = 0
*9c5db199SXin Li        traceback.print_exc()
*9c5db199SXin Li    except:
*9c5db199SXin Li        exit_code = 1
*9c5db199SXin Li        traceback.print_exc()
*9c5db199SXin Li    finally:
*9c5db199SXin Li        metrics.Flush()
*9c5db199SXin Li
*9c5db199SXin Li    sys.exit(exit_code)
*9c5db199SXin Li
*9c5db199SXin Li
# Job breakdown statuses.
#
# The members are taken from the host-queue-entry status enum, except
# REPAIRING which comes from the host status enum.  The resulting enum is
# what get_job_status() hands back to its callers.
_hs = host_states.Status
_qs = host_queue_entry_states.Status
_status_list = [
        _qs.QUEUED,
        _qs.RESETTING,
        _qs.VERIFYING,
        _qs.PROVISIONING,
        _hs.REPAIRING,
        _qs.CLEANING,
        _qs.RUNNING,
        _qs.GATHERING,
        _qs.PARSING,
]
_JOB_OVERHEAD_STATUS = autotest_enum.AutotestEnum(
        *_status_list, string_values=True)
*9c5db199SXin Li
*9c5db199SXin Li
def get_job_status(options):
    """Returns the HQE Status for this run.

    The special-task flags are probed on `options` in a fixed order (reset,
    verify, provision, repair, cleanup, collect_crashinfo) and the status
    paired with the first flag that is set is returned.  A flag that is
    missing from `options` counts as unset.  When no flag is set the status
    is RUNNING.

    @param options: parser options.

    @returns: A member of _JOB_OVERHEAD_STATUS.
    """
    statuses = _JOB_OVERHEAD_STATUS
    flag_to_status = (
            ('reset', statuses.RESETTING),
            ('verify', statuses.VERIFYING),
            ('provision', statuses.PROVISIONING),
            ('repair', statuses.REPAIRING),
            ('cleanup', statuses.CLEANING),
            ('collect_crashinfo', statuses.GATHERING),
    )
    for flag, status in flag_to_status:
        if getattr(options, flag, False):
            return status
    return statuses.RUNNING
*9c5db199SXin Li
*9c5db199SXin Li
*9c5db199SXin Lidef _require_ssp_from_control(control_name):
*9c5db199SXin Li    """Read the value of REQUIRE_SSP from test control file.
*9c5db199SXin Li
*9c5db199SXin Li    This reads the control file from the prod checkout of autotest and uses that
*9c5db199SXin Li    to determine whether to even stage the SSP package on a devserver.
*9c5db199SXin Li
*9c5db199SXin Li    This means:
*9c5db199SXin Li    [1] Any change in REQUIRE_SSP directive in a test requires a prod-push to go
*9c5db199SXin Li    live.
*9c5db199SXin Li    [2] This function may find that the control file does not exist but the SSP
*9c5db199SXin Li    package may contain the test file. This function conservatively returns True
*9c5db199SXin Li    in that case.
*9c5db199SXin Li
*9c5db199SXin Li    This function is called very early in autoserv, before logging is setup.
*9c5db199SXin Li    """
*9c5db199SXin Li    if not control_name:
*9c5db199SXin Li        return True
*9c5db199SXin Li    try:
*9c5db199SXin Li        path = _control_path_on_disk(control_name)
*9c5db199SXin Li    except error.AutoservError as e:
*9c5db199SXin Li        sys.stderr.write("autoserv: Could not determine control file path,"
*9c5db199SXin Li                         " assuming we need SSP: %s\n" % e)
*9c5db199SXin Li        sys.stderr.flush()
*9c5db199SXin Li        return True
*9c5db199SXin Li    if not os.path.isfile(path):
*9c5db199SXin Li        return True
*9c5db199SXin Li    control = control_data.parse_control(path)
*9c5db199SXin Li    # There must be explicit directive in the control file to disable SSP.
*9c5db199SXin Li    if not control or control.require_ssp is None:
*9c5db199SXin Li        return True
*9c5db199SXin Li    return control.require_ssp
*9c5db199SXin Li
*9c5db199SXin Li
*9c5db199SXin Lidef _ssp_base_image_name_or_default(options):
*9c5db199SXin Li    """Extract base image name from autoserv options or the global config."""
*9c5db199SXin Li    if options.ssp_base_image_name:
*9c5db199SXin Li        return options.ssp_base_image_name
*9c5db199SXin Li    return global_config.global_config.get_config_value('AUTOSERV',
*9c5db199SXin Li                                                        'container_base_name')
*9c5db199SXin Li
*9c5db199SXin Li
def main():
    """Command-line entry point of autoserv.

    Steps, in order:
      1. Parse the command line; with no arguments at all, print the help
         text and exit with status 1.
      2. Unless parser.options.no_logging is set, resolve the results
         directory (defaulting to a timestamped 'results.*' name), refuse to
         reuse one that already holds a previous run unless
         use_existing_results is set, and create it if needed.
      3. Decide whether SSP is used and configure logging accordingly (SSP
         runs log into the 'ssp_logs' subdirectory of the results dir).
      4. Stage the SSP package when SSP is used, open the pid file when
         requested, and forward the install_in_tmpdir option to Autotest.
      5. Call run_autoserv() inside a cloud trace span and turn its outcome
         into an exit code.

    The pid file, when one was opened, is always closed with the final exit
    code.  This function does not return; it always ends in sys.exit().
    """
    parser = autoserv_parser.autoserv_parser
    parser.parse_args()

    if len(sys.argv) == 1:
        parser.parser.print_help()
        sys.exit(1)

    # Bound up front so the use_existing_results check further down never
    # depends on which branch below was taken.
    resultdir_exists = False
    if parser.options.no_logging:
        results = None
    else:
        results = parser.options.results
        if not results:
            results = 'results.' + time.strftime('%Y-%m-%d-%H.%M.%S')
        results = os.path.abspath(results)
        # Any one of these files marks the directory as holding a previous
        # run.
        resultdir_exists = any(
                os.path.exists(os.path.join(results, filename))
                for filename in ('control.srv', 'status.log',
                                 '.autoserv_execute'))
        if not parser.options.use_existing_results and resultdir_exists:
            # Logging is not configured yet, so report directly on stderr.
            # The message is deliberately not stored in a local named
            # `error`, which would shadow the imported `error` module.
            sys.stderr.write(
                    "Error: results directory already exists: %s\n" % results)
            sys.exit(1)

        # Now that we certified that there's no leftover results dir from
        # previous jobs, lets create the result dir since the logging system
        # needs to create the log file in there.
        if not os.path.isdir(results):
            os.makedirs(results)

    if parser.options.require_ssp:
        # This is currently only used for skylab (i.e., when --control-name is
        # used).
        use_ssp = _require_ssp_from_control(parser.options.control_name)
    else:
        use_ssp = False

    if use_ssp:
        log_dir = os.path.join(results, 'ssp_logs') if results else None
        if log_dir and not os.path.exists(log_dir):
            os.makedirs(log_dir)
    else:
        log_dir = results

    logging_manager.configure_logging(
            server_logging_config.ServerLoggingConfig(),
            results_dir=log_dir,
            use_console=not parser.options.no_tee,
            verbose=parser.options.verbose,
            no_console_prefix=parser.options.no_console_prefix)

    logging.debug('autoserv is running in drone %s.', socket.gethostname())
    logging.debug('autoserv environment: %r', os.environ)
    logging.debug('autoserv command was: %s', ' '.join(sys.argv))
    logging.debug('autoserv parsed options: %s', parser.options)
    logging.debug('autoserv python version: %s', sys.version)

    if use_ssp:
        ssp_url = _stage_ssp(parser, results)
    else:
        ssp_url = None

    if results:
        logging.info("Results placed in %s", results)

        # wait until now to perform this check, so it get properly logged
        if (parser.options.use_existing_results and not resultdir_exists and
            not utils.is_in_container()):
            logging.error("No existing results directory found: %s", results)
            sys.exit(1)

    if parser.options.write_pidfile and results:
        pid_file_manager = pidfile.PidFileManager(parser.options.pidfile_label,
                                                  results)
        pid_file_manager.open_file()
    else:
        pid_file_manager = None

    autotest.Autotest.set_install_in_tmpdir(
        parser.options.install_in_tmpdir)

    exit_code = 0

    trace_labels = {
            'job_id': job_directories.get_job_id_or_task_id(
                    parser.options.results)
    }
    trace = cloud_trace.SpanStack(
            labels=trace_labels,
            global_context=parser.options.cloud_trace_context)
    # The option arrives as text; only the exact string 'True' enables
    # tracing.
    trace.enabled = parser.options.cloud_trace_context_enabled == 'True'
    try:
        try:
            with trace.Span(get_job_status(parser.options)):
                run_autoserv(pid_file_manager, results, parser, ssp_url,
                             use_ssp)
        except SystemExit as e:
            # Keep the code carried by the SystemExit so it can be recorded
            # in the pid file before exiting with it again below.
            exit_code = e.code
            if exit_code:
                logging.exception('Uncaught SystemExit with code %s', exit_code)
        except Exception:
            # If we don't know what happened, we'll classify it as
            # an 'abort' and return 1.
            logging.exception('Uncaught Exception, exit_code = 1.')
            exit_code = 1
    finally:
        if pid_file_manager:
            pid_file_manager.close_file(exit_code)
    sys.exit(exit_code)
*9c5db199SXin Li
*9c5db199SXin Li
# Run autoserv only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()