utils/analyzer/SATestBuild.py

e5dd7070Spatrick#!/usr/bin/env python
e5dd7070Spatrick
e5dd7070Spatrick"""
e5dd7070SpatrickStatic Analyzer qualification infrastructure.
e5dd7070Spatrick
e5dd7070SpatrickThe goal is to test the analyzer against different projects,
e5dd7070Spatrickcheck for failures, compare results, and measure performance.
e5dd7070Spatrick
e5dd7070SpatrickRepository Directory will contain sources of the projects as well as the
e5dd7070Spatrickinformation on how to build them and the expected output.
e5dd7070SpatrickRepository Directory structure:
e5dd7070Spatrick   - ProjectMap file
e5dd7070Spatrick   - Historical Performance Data
e5dd7070Spatrick   - Project Dir1
e5dd7070Spatrick     - ReferenceOutput
e5dd7070Spatrick   - Project Dir2
e5dd7070Spatrick     - ReferenceOutput
e5dd7070Spatrick   ..
e5dd7070SpatrickNote that the build tree must be inside the project dir.
e5dd7070Spatrick
e5dd7070SpatrickTo test the build of the analyzer one would:
   - Copy over a copy of the Repository Directory. (TODO: Prefer to ensure that
     the build directory does not pollute the repository to minimize network
     traffic).
e5dd7070Spatrick   - Build all projects, until error. Produce logs to report errors.
e5dd7070Spatrick   - Compare results.
e5dd7070Spatrick
e5dd7070SpatrickThe files which should be kept around for failure investigations:
e5dd7070Spatrick   RepositoryCopy/Project DirI/ScanBuildResults
e5dd7070Spatrick   RepositoryCopy/Project DirI/run_static_analyzer.log
e5dd7070Spatrick
e5dd7070SpatrickAssumptions (TODO: shouldn't need to assume these.):
e5dd7070Spatrick   The script is being run from the Repository Directory.
e5dd7070Spatrick   The compiler for scan-build and scan-build are in the PATH.
e5dd7070Spatrick   export PATH=/Users/zaks/workspace/c2llvm/build/Release+Asserts/bin:$PATH
e5dd7070Spatrick
e5dd7070SpatrickFor more logging, set the  env variables:
e5dd7070Spatrick   zaks:TI zaks$ export CCC_ANALYZER_LOG=1
e5dd7070Spatrick   zaks:TI zaks$ export CCC_ANALYZER_VERBOSE=1
e5dd7070Spatrick
The list of tested checkers is hardcoded in the CHECKERS variable.
To test additional checkers, use the SA_ADDITIONAL_CHECKERS environment
variable. It should contain a comma-separated list.
e5dd7070Spatrick"""
e5dd7070Spatrickimport CmpRuns
ec727ea7Spatrickimport SATestUtils as utils
ec727ea7Spatrickfrom ProjectMap import DownloadType, ProjectInfo
e5dd7070Spatrick
e5dd7070Spatrickimport glob
e5dd7070Spatrickimport logging
e5dd7070Spatrickimport math
e5dd7070Spatrickimport multiprocessing
e5dd7070Spatrickimport os
e5dd7070Spatrickimport plistlib
e5dd7070Spatrickimport shutil
e5dd7070Spatrickimport sys
e5dd7070Spatrickimport threading
e5dd7070Spatrickimport time
ec727ea7Spatrickimport zipfile
ec727ea7Spatrick
ec727ea7Spatrickfrom queue import Queue
# mypy has problems finding InvalidFileException in the module,
# so the "type:ignore" marker below shushes that false positive.
ec727ea7Spatrickfrom plistlib import InvalidFileException  # type:ignore
ec727ea7Spatrickfrom subprocess import CalledProcessError, check_call
ec727ea7Spatrickfrom typing import Dict, IO, List, NamedTuple, Optional, TYPE_CHECKING, Tuple
ec727ea7Spatrick
e5dd7070Spatrick
e5dd7070Spatrick###############################################################################
e5dd7070Spatrick# Helper functions.
e5dd7070Spatrick###############################################################################
e5dd7070Spatrick
class StreamToLogger:
    """
    Minimal file-like adapter that forwards written text to a logger.

    Every `write` becomes one log record emitted at `log_level`.
    """

    def __init__(self, logger: logging.Logger,
                 log_level: int = logging.INFO):
        self.logger, self.log_level = logger, log_level

    def write(self, message: str):
        # Trailing whitespace is dropped so that the logger does not end up
        # printing an extra newline after the message.
        text = message.rstrip()
        self.logger.log(self.log_level, text)

    def flush(self):
        # Nothing is buffered by this adapter, so there is nothing to flush.
        return None

    def fileno(self) -> int:
        # Always reports descriptor 0.
        return 0
e5dd7070Spatrick
e5dd7070Spatrick
ec727ea7SpatrickLOCAL = threading.local()
e5dd7070Spatrick
e5dd7070Spatrick
def init_logger(name: str):
    """
    Set up the logger called `name` and expose it through LOCAL.

    The logger accepts everything from DEBUG upwards. LOCAL.stdout is bound
    to a wrapper logging at INFO level and LOCAL.stderr to one logging at
    ERROR level.
    """
    # TODO: use debug levels for VERBOSE messages
    named_logger = logging.getLogger(name)
    named_logger.setLevel(logging.DEBUG)

    for attribute, level in (("stdout", logging.INFO),
                             ("stderr", logging.ERROR)):
        setattr(LOCAL, attribute, StreamToLogger(named_logger, level))
e5dd7070Spatrick
e5dd7070Spatrick
ec727ea7Spatrickinit_logger("main")
ec727ea7Spatrick
ec727ea7Spatrick
def stderr(message: str):
    """
    Write `message` to the current thread's error stream (LOCAL.stderr).
    """
    error_stream = LOCAL.stderr
    error_stream.write(message)
ec727ea7Spatrick
ec727ea7Spatrick
def stdout(message: str):
    """
    Write `message` to the current thread's output stream (LOCAL.stdout).
    """
    output_stream = LOCAL.stdout
    output_stream.write(message)
ec727ea7Spatrick
ec727ea7Spatrick
# Configure the root logger's record format: timestamp, level name, logger
# name, then the message itself.
logging.basicConfig(
    format='%(asctime)s:%(levelname)s:%(name)s: %(message)s')
ec727ea7Spatrick
e5dd7070Spatrick
e5dd7070Spatrick###############################################################################
e5dd7070Spatrick# Configuration setup.
e5dd7070Spatrick###############################################################################
e5dd7070Spatrick
e5dd7070Spatrick
# Find Clang for static analysis: an explicit CC environment variable wins,
# otherwise "clang" is looked up in PATH.
cc_candidate: Optional[str] = os.environ.get('CC')
if cc_candidate is None:
    cc_candidate = utils.which("clang", os.environ['PATH'])

# Neither source produced a usable compiler: report and abort.
if not cc_candidate:
    stderr("Error: cannot find 'clang' in PATH")
    sys.exit(1)

CLANG = cc_candidate
e5dd7070Spatrick
# Number of jobs: three quarters of the available CPUs, rounded up.
MAX_JOBS = math.ceil(multiprocessing.cpu_count() * 0.75)

# Names of the project specific scripts.
# The script that downloads the project.
DOWNLOAD_SCRIPT = "download_project.sh"
# The script that needs to be executed before the build can start.
CLEANUP_SCRIPT = "cleanup_run_static_analyzer.sh"
# This is a file containing commands for scan-build.
BUILD_SCRIPT = "run_static_analyzer.cmd"

# A comment in a build script which disables wrapping.
NO_PREFIX_CMD = "#NOPREFIX"

# The log directory and log file names.
LOG_DIR_NAME = "Logs"
BUILD_LOG_NAME = "run_static_analyzer.log"
# Number of failures kept in the failure summary. Ex: this info can be
# displayed when buildbot detects a build failure.
NUM_OF_FAILURES_IN_SUMMARY = 10

# The scan-build result directory. Reference results live in a directory
# of the same name with REF_PREFIX prepended.
OUTPUT_DIR_NAME = "ScanBuildResults"
REF_PREFIX = "Ref"

# The name of the directory storing the cached project source. If this
# directory does not exist, the download script will be executed.
# That script should create the "CachedSource" directory and download the
# project source into it.
CACHED_SOURCE_DIR_NAME = "CachedSource"

# The name of the directory containing the source code that will be analyzed.
# Each time a project is analyzed, a fresh copy of its CachedSource directory
# will be copied to the PatchedSource directory and then the local patches
# in PATCHFILE_NAME will be applied (if PATCHFILE_NAME exists).
PATCHED_SOURCE_DIR_NAME = "PatchedSource"

# The name of the patchfile specifying any changes that should be applied
# to the CachedSource before analyzing.
PATCHFILE_NAME = "changes_for_analyzer.patch"

# The comma-separated list of checkers used during analyses.
# Currently, consists of all the non-experimental checkers, plus a few alpha
# checkers we don't want to regress on.
CHECKERS = ",".join((
    "alpha.unix.SimpleStream",
    "alpha.security.taint",
    "cplusplus.NewDeleteLeaks",
    "core",
    "cplusplus",
    "deadcode",
    "security",
    "unix",
    "osx",
    "nullability",
))

# Verbosity level handed to the helper scripts and consulted for verbose
# output.
VERBOSE = 0
ec727ea7Spatrick
e5dd7070Spatrick
e5dd7070Spatrick###############################################################################
e5dd7070Spatrick# Test harness logic.
e5dd7070Spatrick###############################################################################
e5dd7070Spatrick
e5dd7070Spatrick
def run_cleanup_script(directory: str, build_log_file: IO):
    """
    Run the project's pre-processing (cleanup) script, if any.

    The script is CLEANUP_SCRIPT inside `directory`; it is handed to
    utils.run_script together with the build log and the project's patched
    source directory.
    """
    utils.run_script(os.path.join(directory, CLEANUP_SCRIPT),
                     build_log_file,
                     os.path.join(directory, PATCHED_SOURCE_DIR_NAME),
                     out=LOCAL.stdout, err=LOCAL.stderr,
                     verbose=VERBOSE)
e5dd7070Spatrick
e5dd7070Spatrick
class TestInfo(NamedTuple):
    """
    A project paired with the settings to use when analyzing it.
    """
    # The project to build and analyze.
    project: ProjectInfo
    # When set, "--override-compiler" is added to the scan-build options.
    override_compiler: bool = False
    # Extra "-analyzer-config" entries appended to the default ones.
    extra_analyzer_config: str = ""
    # Extra checkers appended to the scan-build checker list.
    extra_checkers: str = ""
    # When set, results go to the reference output directory and are not
    # compared against anything.
    is_reference_build: bool = False
    # Strictness level forwarded to the results comparison.
    strictness: int = 0
e5dd7070Spatrick
e5dd7070Spatrick
# The typing package doesn't have a separate type for Queue, but Queue has a
# generic stub. We still want a type-checked project queue, so the generic
# form is spelled out for mypy only, while the plain class is used at runtime.
#
# It is a common workaround for this situation:
# https://mypy.readthedocs.io/en/stable/common_issues.html#using-classes-that-are-generic-in-stubs-but-not-at-runtime
if TYPE_CHECKING:
    TestQueue = Queue[TestInfo]  # this is only processed by mypy
else:
    TestQueue = Queue  # this will be executed at runtime
e5dd7070Spatrick
e5dd7070Spatrick
class RegressionTester:
    """
    A component aggregating all of the project testing.

    One TestInfo is built per project from the shared settings; the projects
    are then tested either one after another or on worker threads,
    depending on `jobs`.
    """

    def __init__(self, jobs: int, projects: List[ProjectInfo],
                 override_compiler: bool, extra_analyzer_config: str,
                 extra_checkers: str,
                 regenerate: bool, strictness: int):
        """
        :param jobs: number of worker threads; values <= 1 select the
            single-threaded runner.
        :param projects: the projects to test.
        :param override_compiler: forwarded to TestInfo.override_compiler.
        :param extra_analyzer_config: forwarded to
            TestInfo.extra_analyzer_config.
        :param extra_checkers: forwarded to TestInfo.extra_checkers.
        :param regenerate: forwarded to TestInfo.is_reference_build.
        :param strictness: forwarded to TestInfo.strictness (an int).
        """
        self.jobs = jobs
        self.projects = projects
        self.override_compiler = override_compiler
        self.extra_analyzer_config = extra_analyzer_config
        self.extra_checkers = extra_checkers
        self.regenerate = regenerate
        self.strictness = strictness

    def test_all(self) -> bool:
        """
        Test every project with the configured settings.
        :return: whether tests have passed.
        """
        # Keyword arguments make the regenerate -> is_reference_build
        # mapping explicit instead of relying on field order.
        projects_to_test: List[TestInfo] = [
            TestInfo(project=project,
                     override_compiler=self.override_compiler,
                     extra_analyzer_config=self.extra_analyzer_config,
                     extra_checkers=self.extra_checkers,
                     is_reference_build=self.regenerate,
                     strictness=self.strictness)
            for project in self.projects]

        if self.jobs <= 1:
            return self._single_threaded_test_all(projects_to_test)
        return self._multi_threaded_test_all(projects_to_test)

    def _single_threaded_test_all(self,
                                  projects_to_test: List[TestInfo]) -> bool:
        """
        Run all projects.
        :return: whether tests have passed.
        """
        success = True
        for project_info in projects_to_test:
            tester = ProjectTester(project_info)
            # `&=` (not `and`) so that every project is tested even after
            # an earlier one has failed.
            success &= tester.test()
        return success

    def _multi_threaded_test_all(self,
                                 projects_to_test: List[TestInfo]) -> bool:
        """
        Run each project in a separate thread.

        This is OK despite GIL, as testing is blocked
        on launching external processes.

        Exits the process with status 1 if a worker sets the failure flag.

        :return: whether tests have passed.
        """
        tasks_queue = TestQueue()

        for project_info in projects_to_test:
            tasks_queue.put(project_info)

        results_differ = threading.Event()
        failure_flag = threading.Event()

        for _ in range(self.jobs):
            worker = TestProjectThread(tasks_queue, results_differ,
                                       failure_flag)
            worker.start()

        # Required to handle Ctrl-C gracefully: poll the queue in short
        # sleeps instead of blocking on it.
        while tasks_queue.unfinished_tasks:
            time.sleep(0.1)  # Seconds.
            if failure_flag.is_set():
                stderr("Test runner crashed\n")
                sys.exit(1)
        return not results_differ.is_set()
e5dd7070Spatrick
e5dd7070Spatrick
ec727ea7Spatrickclass ProjectTester:
ec727ea7Spatrick    """
ec727ea7Spatrick    A component aggregating testing for one project.
ec727ea7Spatrick    """
*12c85518Srobert
ec727ea7Spatrick    def __init__(self, test_info: TestInfo, silent: bool = False):
ec727ea7Spatrick        self.project = test_info.project
ec727ea7Spatrick        self.override_compiler = test_info.override_compiler
ec727ea7Spatrick        self.extra_analyzer_config = test_info.extra_analyzer_config
*12c85518Srobert        self.extra_checkers = test_info.extra_checkers
ec727ea7Spatrick        self.is_reference_build = test_info.is_reference_build
ec727ea7Spatrick        self.strictness = test_info.strictness
ec727ea7Spatrick        self.silent = silent
e5dd7070Spatrick
ec727ea7Spatrick    def test(self) -> bool:
ec727ea7Spatrick        """
ec727ea7Spatrick        Test a given project.
ec727ea7Spatrick        :return tests_passed: Whether tests have passed according
ec727ea7Spatrick        to the :param strictness: criteria.
ec727ea7Spatrick        """
ec727ea7Spatrick        if not self.project.enabled:
ec727ea7Spatrick            self.out(
ec727ea7Spatrick                f" \n\n--- Skipping disabled project {self.project.name}\n")
ec727ea7Spatrick            return True
e5dd7070Spatrick
ec727ea7Spatrick        self.out(f" \n\n--- Building project {self.project.name}\n")
ec727ea7Spatrick
ec727ea7Spatrick        start_time = time.time()
ec727ea7Spatrick
ec727ea7Spatrick        project_dir = self.get_project_dir()
ec727ea7Spatrick        self.vout(f"  Build directory: {project_dir}.\n")
ec727ea7Spatrick
ec727ea7Spatrick        # Set the build results directory.
ec727ea7Spatrick        output_dir = self.get_output_dir()
ec727ea7Spatrick
ec727ea7Spatrick        self.build(project_dir, output_dir)
ec727ea7Spatrick        check_build(output_dir)
ec727ea7Spatrick
ec727ea7Spatrick        if self.is_reference_build:
ec727ea7Spatrick            cleanup_reference_results(output_dir)
ec727ea7Spatrick            passed = True
e5dd7070Spatrick        else:
ec727ea7Spatrick            passed = run_cmp_results(project_dir, self.strictness)
ec727ea7Spatrick
ec727ea7Spatrick        self.out(f"Completed tests for project {self.project.name} "
ec727ea7Spatrick                 f"(time: {time.time() - start_time:.2f}).\n")
ec727ea7Spatrick
ec727ea7Spatrick        return passed
ec727ea7Spatrick
ec727ea7Spatrick    def get_project_dir(self) -> str:
ec727ea7Spatrick        return os.path.join(os.path.abspath(os.curdir), self.project.name)
ec727ea7Spatrick
ec727ea7Spatrick    def get_output_dir(self) -> str:
ec727ea7Spatrick        if self.is_reference_build:
ec727ea7Spatrick            dirname = REF_PREFIX + OUTPUT_DIR_NAME
ec727ea7Spatrick        else:
ec727ea7Spatrick            dirname = OUTPUT_DIR_NAME
ec727ea7Spatrick
ec727ea7Spatrick        return os.path.join(self.get_project_dir(), dirname)
ec727ea7Spatrick
ec727ea7Spatrick    def build(self, directory: str, output_dir: str) -> Tuple[float, int]:
ec727ea7Spatrick        build_log_path = get_build_log_path(output_dir)
ec727ea7Spatrick
ec727ea7Spatrick        self.out(f"Log file: {build_log_path}\n")
ec727ea7Spatrick        self.out(f"Output directory: {output_dir}\n")
ec727ea7Spatrick
ec727ea7Spatrick        remove_log_file(output_dir)
ec727ea7Spatrick
ec727ea7Spatrick        # Clean up scan build results.
ec727ea7Spatrick        if os.path.exists(output_dir):
ec727ea7Spatrick            self.vout(f"  Removing old results: {output_dir}\n")
ec727ea7Spatrick
ec727ea7Spatrick            shutil.rmtree(output_dir)
ec727ea7Spatrick
ec727ea7Spatrick        assert(not os.path.exists(output_dir))
ec727ea7Spatrick        os.makedirs(os.path.join(output_dir, LOG_DIR_NAME))
ec727ea7Spatrick
ec727ea7Spatrick        # Build and analyze the project.
ec727ea7Spatrick        with open(build_log_path, "w+") as build_log_file:
ec727ea7Spatrick            if self.project.mode == 1:
ec727ea7Spatrick                self._download_and_patch(directory, build_log_file)
ec727ea7Spatrick                run_cleanup_script(directory, build_log_file)
ec727ea7Spatrick                build_time, memory = self.scan_build(directory, output_dir,
ec727ea7Spatrick                                                     build_log_file)
ec727ea7Spatrick            else:
ec727ea7Spatrick                build_time, memory = self.analyze_preprocessed(directory,
ec727ea7Spatrick                                                               output_dir)
ec727ea7Spatrick
ec727ea7Spatrick            if self.is_reference_build:
ec727ea7Spatrick                run_cleanup_script(directory, build_log_file)
ec727ea7Spatrick                normalize_reference_results(directory, output_dir,
ec727ea7Spatrick                                            self.project.mode)
ec727ea7Spatrick
ec727ea7Spatrick        self.out(f"Build complete (time: {utils.time_to_str(build_time)}, "
ec727ea7Spatrick                 f"peak memory: {utils.memory_to_str(memory)}). "
ec727ea7Spatrick                 f"See the log for more details: {build_log_path}\n")
ec727ea7Spatrick
ec727ea7Spatrick        return build_time, memory
ec727ea7Spatrick
ec727ea7Spatrick    def scan_build(self, directory: str, output_dir: str,
ec727ea7Spatrick                   build_log_file: IO) -> Tuple[float, int]:
ec727ea7Spatrick        """
ec727ea7Spatrick        Build the project with scan-build by reading in the commands and
ec727ea7Spatrick        prefixing them with the scan-build options.
ec727ea7Spatrick        """
ec727ea7Spatrick        build_script_path = os.path.join(directory, BUILD_SCRIPT)
ec727ea7Spatrick        if not os.path.exists(build_script_path):
ec727ea7Spatrick            stderr(f"Error: build script is not defined: "
ec727ea7Spatrick                   f"{build_script_path}\n")
ec727ea7Spatrick            sys.exit(1)
ec727ea7Spatrick
ec727ea7Spatrick        all_checkers = CHECKERS
ec727ea7Spatrick        if 'SA_ADDITIONAL_CHECKERS' in os.environ:
ec727ea7Spatrick            all_checkers = (all_checkers + ',' +
ec727ea7Spatrick                            os.environ['SA_ADDITIONAL_CHECKERS'])
*12c85518Srobert        if self.extra_checkers != "":
*12c85518Srobert            all_checkers += "," + self.extra_checkers
ec727ea7Spatrick
ec727ea7Spatrick        # Run scan-build from within the patched source directory.
ec727ea7Spatrick        cwd = os.path.join(directory, PATCHED_SOURCE_DIR_NAME)
ec727ea7Spatrick
ec727ea7Spatrick        options = f"--use-analyzer '{CLANG}' "
ec727ea7Spatrick        options += f"-plist-html -o '{output_dir}' "
ec727ea7Spatrick        options += f"-enable-checker {all_checkers} "
ec727ea7Spatrick        options += "--keep-empty "
ec727ea7Spatrick        options += f"-analyzer-config '{self.generate_config()}' "
ec727ea7Spatrick
ec727ea7Spatrick        if self.override_compiler:
ec727ea7Spatrick            options += "--override-compiler "
ec727ea7Spatrick
ec727ea7Spatrick        extra_env: Dict[str, str] = {}
ec727ea7Spatrick
ec727ea7Spatrick        execution_time = 0.0
ec727ea7Spatrick        peak_memory = 0
ec727ea7Spatrick
ec727ea7Spatrick        try:
ec727ea7Spatrick            command_file = open(build_script_path, "r")
ec727ea7Spatrick            command_prefix = "scan-build " + options + " "
ec727ea7Spatrick
ec727ea7Spatrick            for command in command_file:
ec727ea7Spatrick                command = command.strip()
ec727ea7Spatrick
ec727ea7Spatrick                if len(command) == 0:
ec727ea7Spatrick                    continue
ec727ea7Spatrick
ec727ea7Spatrick                # Custom analyzer invocation specified by project.
ec727ea7Spatrick                # Communicate required information using environment variables
ec727ea7Spatrick                # instead.
ec727ea7Spatrick                if command == NO_PREFIX_CMD:
ec727ea7Spatrick                    command_prefix = ""
ec727ea7Spatrick                    extra_env['OUTPUT'] = output_dir
ec727ea7Spatrick                    extra_env['CC'] = CLANG
ec727ea7Spatrick                    extra_env['ANALYZER_CONFIG'] = self.generate_config()
ec727ea7Spatrick                    continue
ec727ea7Spatrick
ec727ea7Spatrick                if command.startswith("#"):
ec727ea7Spatrick                    continue
ec727ea7Spatrick
ec727ea7Spatrick                # If using 'make', auto imply a -jX argument
ec727ea7Spatrick                # to speed up analysis.  xcodebuild will
ec727ea7Spatrick                # automatically use the maximum number of cores.
ec727ea7Spatrick                if (command.startswith("make ") or command == "make") and \
ec727ea7Spatrick                        "-j" not in command:
ec727ea7Spatrick                    command += f" -j{MAX_JOBS}"
ec727ea7Spatrick
ec727ea7Spatrick                command_to_run = command_prefix + command
ec727ea7Spatrick
ec727ea7Spatrick                self.vout(f"  Executing: {command_to_run}\n")
ec727ea7Spatrick
ec727ea7Spatrick                time, mem = utils.check_and_measure_call(
ec727ea7Spatrick                    command_to_run, cwd=cwd,
ec727ea7Spatrick                    stderr=build_log_file,
ec727ea7Spatrick                    stdout=build_log_file,
ec727ea7Spatrick                    env=dict(os.environ, **extra_env),
ec727ea7Spatrick                    shell=True)
ec727ea7Spatrick
ec727ea7Spatrick                execution_time += time
ec727ea7Spatrick                peak_memory = max(peak_memory, mem)
ec727ea7Spatrick
ec727ea7Spatrick        except CalledProcessError:
ec727ea7Spatrick            stderr("Error: scan-build failed. Its output was: \n")
ec727ea7Spatrick            build_log_file.seek(0)
ec727ea7Spatrick            shutil.copyfileobj(build_log_file, LOCAL.stderr)
ec727ea7Spatrick            sys.exit(1)
ec727ea7Spatrick
ec727ea7Spatrick        return execution_time, peak_memory
ec727ea7Spatrick
ec727ea7Spatrick    def analyze_preprocessed(self, directory: str,
ec727ea7Spatrick                             output_dir: str) -> Tuple[float, int]:
ec727ea7Spatrick        """
ec727ea7Spatrick        Run analysis on a set of preprocessed files.
ec727ea7Spatrick        """
ec727ea7Spatrick        if os.path.exists(os.path.join(directory, BUILD_SCRIPT)):
ec727ea7Spatrick            stderr(f"Error: The preprocessed files project "
ec727ea7Spatrick                   f"should not contain {BUILD_SCRIPT}\n")
ec727ea7Spatrick            raise Exception()
ec727ea7Spatrick
ec727ea7Spatrick        prefix = CLANG + " --analyze "
ec727ea7Spatrick
ec727ea7Spatrick        prefix += "--analyzer-output plist "
ec727ea7Spatrick        prefix += " -Xclang -analyzer-checker=" + CHECKERS
ec727ea7Spatrick        prefix += " -fcxx-exceptions -fblocks "
ec727ea7Spatrick        prefix += " -Xclang -analyzer-config "
ec727ea7Spatrick        prefix += f"-Xclang {self.generate_config()} "
ec727ea7Spatrick
ec727ea7Spatrick        if self.project.mode == 2:
ec727ea7Spatrick            prefix += "-std=c++11 "
ec727ea7Spatrick
ec727ea7Spatrick        plist_path = os.path.join(directory, output_dir, "date")
ec727ea7Spatrick        fail_path = os.path.join(plist_path, "failures")
ec727ea7Spatrick        os.makedirs(fail_path)
ec727ea7Spatrick
ec727ea7Spatrick        execution_time = 0.0
ec727ea7Spatrick        peak_memory = 0
ec727ea7Spatrick
ec727ea7Spatrick        for full_file_name in glob.glob(directory + "/*"):
ec727ea7Spatrick            file_name = os.path.basename(full_file_name)
ec727ea7Spatrick            failed = False
ec727ea7Spatrick
ec727ea7Spatrick            # Only run the analyzes on supported files.
ec727ea7Spatrick            if utils.has_no_extension(file_name):
ec727ea7Spatrick                continue
ec727ea7Spatrick            if not utils.is_valid_single_input_file(file_name):
ec727ea7Spatrick                stderr(f"Error: Invalid single input file {full_file_name}.\n")
ec727ea7Spatrick                raise Exception()
ec727ea7Spatrick
ec727ea7Spatrick            # Build and call the analyzer command.
ec727ea7Spatrick            plist_basename = os.path.join(plist_path, file_name)
ec727ea7Spatrick            output_option = f"-o '{plist_basename}.plist' "
ec727ea7Spatrick            command = f"{prefix}{output_option}'{file_name}'"
ec727ea7Spatrick
ec727ea7Spatrick            log_path = os.path.join(fail_path, file_name + ".stderr.txt")
ec727ea7Spatrick            with open(log_path, "w+") as log_file:
ec727ea7Spatrick                try:
ec727ea7Spatrick                    self.vout(f"  Executing: {command}\n")
ec727ea7Spatrick
ec727ea7Spatrick                    time, mem = utils.check_and_measure_call(
ec727ea7Spatrick                        command, cwd=directory, stderr=log_file,
ec727ea7Spatrick                        stdout=log_file, shell=True)
ec727ea7Spatrick
ec727ea7Spatrick                    execution_time += time
ec727ea7Spatrick                    peak_memory = max(peak_memory, mem)
ec727ea7Spatrick
ec727ea7Spatrick                except CalledProcessError as e:
ec727ea7Spatrick                    stderr(f"Error: Analyzes of {full_file_name} failed. "
ec727ea7Spatrick                           f"See {log_file.name} for details. "
ec727ea7Spatrick                           f"Error code {e.returncode}.\n")
ec727ea7Spatrick                    failed = True
ec727ea7Spatrick
ec727ea7Spatrick                # If command did not fail, erase the log file.
ec727ea7Spatrick                if not failed:
ec727ea7Spatrick                    os.remove(log_file.name)
ec727ea7Spatrick
ec727ea7Spatrick        return execution_time, peak_memory
ec727ea7Spatrick
ec727ea7Spatrick    def generate_config(self) -> str:
ec727ea7Spatrick        out = "serialize-stats=true,stable-report-filename=true"
ec727ea7Spatrick
ec727ea7Spatrick        if self.extra_analyzer_config:
ec727ea7Spatrick            out += "," + self.extra_analyzer_config
ec727ea7Spatrick
ec727ea7Spatrick        return out
ec727ea7Spatrick
ec727ea7Spatrick    def _download_and_patch(self, directory: str, build_log_file: IO):
ec727ea7Spatrick        """
ec727ea7Spatrick        Download the project and apply the local patchfile if it exists.
ec727ea7Spatrick        """
ec727ea7Spatrick        cached_source = os.path.join(directory, CACHED_SOURCE_DIR_NAME)
ec727ea7Spatrick
ec727ea7Spatrick        # If the we don't already have the cached source, run the project's
ec727ea7Spatrick        # download script to download it.
ec727ea7Spatrick        if not os.path.exists(cached_source):
ec727ea7Spatrick            self._download(directory, build_log_file)
ec727ea7Spatrick            if not os.path.exists(cached_source):
ec727ea7Spatrick                stderr(f"Error: '{cached_source}' not found after download.\n")
ec727ea7Spatrick                exit(1)
ec727ea7Spatrick
ec727ea7Spatrick        patched_source = os.path.join(directory, PATCHED_SOURCE_DIR_NAME)
ec727ea7Spatrick
ec727ea7Spatrick        # Remove potentially stale patched source.
ec727ea7Spatrick        if os.path.exists(patched_source):
ec727ea7Spatrick            shutil.rmtree(patched_source)
ec727ea7Spatrick
ec727ea7Spatrick        # Copy the cached source and apply any patches to the copy.
ec727ea7Spatrick        shutil.copytree(cached_source, patched_source, symlinks=True)
ec727ea7Spatrick        self._apply_patch(directory, build_log_file)
ec727ea7Spatrick
ec727ea7Spatrick    def _download(self, directory: str, build_log_file: IO):
ec727ea7Spatrick        """
ec727ea7Spatrick        Run the script to download the project, if it exists.
ec727ea7Spatrick        """
ec727ea7Spatrick        if self.project.source == DownloadType.GIT:
ec727ea7Spatrick            self._download_from_git(directory, build_log_file)
ec727ea7Spatrick        elif self.project.source == DownloadType.ZIP:
ec727ea7Spatrick            self._unpack_zip(directory, build_log_file)
ec727ea7Spatrick        elif self.project.source == DownloadType.SCRIPT:
ec727ea7Spatrick            self._run_download_script(directory, build_log_file)
ec727ea7Spatrick        else:
ec727ea7Spatrick            raise ValueError(
ec727ea7Spatrick                f"Unknown source type '{self.project.source}' is found "
ec727ea7Spatrick                f"for the '{self.project.name}' project")
ec727ea7Spatrick
ec727ea7Spatrick    def _download_from_git(self, directory: str, build_log_file: IO):
ec727ea7Spatrick        repo = self.project.origin
ec727ea7Spatrick        cached_source = os.path.join(directory, CACHED_SOURCE_DIR_NAME)
ec727ea7Spatrick
ec727ea7Spatrick        check_call(f"git clone --recursive {repo} {cached_source}",
ec727ea7Spatrick                   cwd=directory, stderr=build_log_file,
ec727ea7Spatrick                   stdout=build_log_file, shell=True)
ec727ea7Spatrick        check_call(f"git checkout --quiet {self.project.commit}",
ec727ea7Spatrick                   cwd=cached_source, stderr=build_log_file,
ec727ea7Spatrick                   stdout=build_log_file, shell=True)
ec727ea7Spatrick
ec727ea7Spatrick    def _unpack_zip(self, directory: str, build_log_file: IO):
ec727ea7Spatrick        zip_files = list(glob.glob(directory + "/*.zip"))
ec727ea7Spatrick
ec727ea7Spatrick        if len(zip_files) == 0:
ec727ea7Spatrick            raise ValueError(
ec727ea7Spatrick                f"Couldn't find any zip files to unpack for the "
ec727ea7Spatrick                f"'{self.project.name}' project")
ec727ea7Spatrick
ec727ea7Spatrick        if len(zip_files) > 1:
ec727ea7Spatrick            raise ValueError(
ec727ea7Spatrick                f"Couldn't decide which of the zip files ({zip_files}) "
ec727ea7Spatrick                f"for the '{self.project.name}' project to unpack")
ec727ea7Spatrick
ec727ea7Spatrick        with zipfile.ZipFile(zip_files[0], "r") as zip_file:
ec727ea7Spatrick            zip_file.extractall(os.path.join(directory,
ec727ea7Spatrick                                             CACHED_SOURCE_DIR_NAME))
ec727ea7Spatrick
ec727ea7Spatrick    @staticmethod
ec727ea7Spatrick    def _run_download_script(directory: str, build_log_file: IO):
ec727ea7Spatrick        script_path = os.path.join(directory, DOWNLOAD_SCRIPT)
ec727ea7Spatrick        utils.run_script(script_path, build_log_file, directory,
ec727ea7Spatrick                         out=LOCAL.stdout, err=LOCAL.stderr,
ec727ea7Spatrick                         verbose=VERBOSE)
ec727ea7Spatrick
ec727ea7Spatrick    def _apply_patch(self, directory: str, build_log_file: IO):
ec727ea7Spatrick        patchfile_path = os.path.join(directory, PATCHFILE_NAME)
ec727ea7Spatrick        patched_source = os.path.join(directory, PATCHED_SOURCE_DIR_NAME)
ec727ea7Spatrick
ec727ea7Spatrick        if not os.path.exists(patchfile_path):
ec727ea7Spatrick            self.out("  No local patches.\n")
ec727ea7Spatrick            return
ec727ea7Spatrick
ec727ea7Spatrick        self.out("  Applying patch.\n")
ec727ea7Spatrick        try:
ec727ea7Spatrick            check_call(f"patch -p1 < '{patchfile_path}'",
ec727ea7Spatrick                       cwd=patched_source,
ec727ea7Spatrick                       stderr=build_log_file,
ec727ea7Spatrick                       stdout=build_log_file,
ec727ea7Spatrick                       shell=True)
ec727ea7Spatrick
ec727ea7Spatrick        except CalledProcessError:
ec727ea7Spatrick            stderr(f"Error: Patch failed. "
ec727ea7Spatrick                   f"See {build_log_file.name} for details.\n")
ec727ea7Spatrick            sys.exit(1)
ec727ea7Spatrick
ec727ea7Spatrick    def out(self, what: str):
ec727ea7Spatrick        if not self.silent:
ec727ea7Spatrick            stdout(what)
ec727ea7Spatrick
ec727ea7Spatrick    def vout(self, what: str):
ec727ea7Spatrick        if VERBOSE >= 1:
ec727ea7Spatrick            self.out(what)
e5dd7070Spatrick
e5dd7070Spatrick
class TestProjectThread(threading.Thread):
    """
    Worker thread that drains a shared queue of test tasks, running a
    ProjectTester for each one.
    """

    def __init__(self, tasks_queue: TestQueue,
                 results_differ: threading.Event,
                 failure_flag: threading.Event):
        """
        :param tasks_queue: Queue of test descriptions to process.
        :param results_differ: Used to signify that results differ from
               the canonical ones.
        :param failure_flag: Used to signify a failure during the run.
        """
        self.tasks_queue = tasks_queue
        self.results_differ = results_differ
        self.failure_flag = failure_flag
        super().__init__()

        # Needed to gracefully handle interrupts with Ctrl-C
        self.daemon = True

    def run(self):
        """
        Process tasks until the queue is empty.

        Sets ``results_differ`` when a tester reports a failed test, and
        sets ``failure_flag`` before re-raising any exception.
        """
        # Local import: only the Empty exception is needed here.
        # NOTE(review): assumes tasks_queue follows the queue.Queue API
        # (get_nowait raising queue.Empty) - confirm against TestQueue.
        from queue import Empty

        while True:
            try:
                try:
                    # A separate empty() check followed by a blocking get()
                    # is racy: another worker may take the last task in
                    # between, leaving this thread blocked forever.
                    test_info = self.tasks_queue.get_nowait()
                except Empty:
                    return

                init_logger(test_info.project.name)

                tester = ProjectTester(test_info)
                if not tester.test():
                    self.results_differ.set()

                self.tasks_queue.task_done()

            except BaseException:
                self.failure_flag.set()
                raise
ec727ea7Spatrick
ec727ea7Spatrick
ec727ea7Spatrick###############################################################################
ec727ea7Spatrick# Utility functions.
ec727ea7Spatrick###############################################################################
ec727ea7Spatrick
ec727ea7Spatrick
def check_build(output_dir: str):
    """
    Given the scan-build output directory, check whether the build failed
    by searching for ``*.stderr.txt`` files in the failures directories.

    Without failures, empty plists and empty folders are cleaned up and the
    number of remaining plist files is reported. With failures, up to
    NUM_OF_FAILURES_IN_SUMMARY failure logs are printed and the process
    exits with status 1.

    :param output_dir: The scan-build output directory to inspect.
    """
    # Check if there are failures.
    failures = glob.glob(output_dir + "/*/failures/*.stderr.txt")
    total_failed = len(failures)

    if total_failed == 0:
        clean_up_empty_plists(output_dir)
        clean_up_empty_folders(output_dir)

        plists = glob.glob(output_dir + "/*/*.plist")
        stdout(f"Number of bug reports "
               f"(non-empty plist files) produced: {len(plists)}\n")
        return

    stderr("Error: analysis failed.\n")
    stderr(f"Total of {total_failed} failures discovered.\n")

    truncated = total_failed > NUM_OF_FAILURES_IN_SUMMARY
    if truncated:
        stderr(f"See the first {NUM_OF_FAILURES_IN_SUMMARY} below.\n")

    # Show exactly the first NUM_OF_FAILURES_IN_SUMMARY logs. Breaking on
    # "index >= limit" with a 1-based index printed one log too few.
    shown_failures = failures[:NUM_OF_FAILURES_IN_SUMMARY]
    for index, failed_log_path in enumerate(shown_failures, start=1):
        stderr(f"\n-- Error #{index} -----------\n")

        with open(failed_log_path, "r") as failed_log:
            shutil.copyfileobj(failed_log, LOCAL.stdout)

    if truncated:
        stderr("See the results folder for more.")

    sys.exit(1)
ec727ea7Spatrick
ec727ea7Spatrick
def cleanup_reference_results(output_dir: str):
    """
    Delete html, css, and js files from reference results. These can
    include multiple copies of the benchmark source and so get very large.
    The build log file is removed as well.

    :param output_dir: Reference results directory; files are matched one
           directory level below it.
    """
    for extension in ("html", "css", "js"):
        for file_to_rm in glob.glob(f"{output_dir}/*/*.{extension}"):
            # glob results already start with output_dir. Joining them with
            # output_dir again doubled the prefix whenever output_dir was a
            # relative path, so the removal failed.
            os.remove(file_to_rm)

    # Remove the log file. It leaks absolute path names.
    remove_log_file(output_dir)
ec727ea7Spatrick
ec727ea7Spatrick
def run_cmp_results(directory: str, strictness: int = 0) -> bool:
    """
    Compare the new scan-build results against the reference results.

    strictness selects the success criteria:
      0 - success if there are no crashes or analyzer failure.
      1 - success if there are no difference in the number of reported bugs.
      2 - success if all the bug reports are identical.

    Exits the process with status 1 when the number of results folders in
    the reference and new directories differs.

    :param directory: Project directory holding both results directories.
    :param strictness: Success criteria, as listed above.
    :return success: Whether tests pass according to the strictness
    criteria.
    """
    tests_passed = True
    start_time = time.time()

    ref_root = os.path.join(directory, REF_PREFIX + OUTPUT_DIR_NAME)
    new_root = os.path.join(directory, OUTPUT_DIR_NAME)

    # The per-run folders live one level below the results directories.
    ref_subdirs = glob.glob(ref_root + "/*")
    new_subdirs = glob.glob(new_root + "/*")

    # Log folders share the results directory; leave them out. The
    # reference one is optional, the new one is removed unconditionally.
    ref_logs = os.path.join(ref_root, LOG_DIR_NAME)
    if ref_logs in ref_subdirs:
        ref_subdirs.remove(ref_logs)
    new_subdirs.remove(os.path.join(new_root, LOG_DIR_NAME))

    if len(ref_subdirs) != len(new_subdirs):
        stderr(f"Mismatch in number of results folders: "
               f"{ref_subdirs} vs {new_subdirs}")
        sys.exit(1)

    # There may be one folder per scan-build command (Ex: one for configure
    # and one for make). Corresponding folders are assumed to share names,
    # so sorting pairs them up; it is a no-op for zero or one entry.
    ref_subdirs.sort()
    new_subdirs.sort()

    for ref_subdir, new_subdir in zip(ref_subdirs, new_subdirs):
        assert ref_subdir != new_subdir

        if VERBOSE >= 1:
            stdout(f"  Comparing Results: {ref_subdir} {new_subdir}\n")

        patched_source = os.path.join(directory, PATCHED_SOURCE_DIR_NAME)

        ref_results = CmpRuns.ResultsDirectory(ref_subdir)
        new_results = CmpRuns.ResultsDirectory(new_subdir, patched_source)

        # Diff the two result sets; delete_empty is passed as False.
        diff_summary = CmpRuns.dump_scan_build_results_diff(
            ref_results, new_results,
            delete_empty=False,
            out=LOCAL.stdout)
        num_diffs, reports_in_ref, reports_in_new = diff_summary

        has_diffs = num_diffs > 0
        if has_diffs:
            stdout(f"Warning: {num_diffs} differences in diagnostics.\n")

        if strictness >= 2 and has_diffs:
            stdout("Error: Diffs found in strict mode (2).\n")
            tests_passed = False

        elif strictness >= 1 and reports_in_ref != reports_in_new:
            stdout("Error: The number of results are different "
                   " strict mode (1).\n")
            tests_passed = False

    elapsed = time.time() - start_time
    stdout(f"Diagnostic comparison complete "
           f"(time: {elapsed:.2f}).\n")

    return tests_passed
ec727ea7Spatrick
ec727ea7Spatrick
def normalize_reference_results(directory: str, output_dir: str,
                                build_mode: int):
    """
    Rewrite every plist under *output_dir* so that source paths are
    relative and run-specific fields are dropped.

    :param directory: Project directory; used as the path prefix to strip.
    :param output_dir: Directory tree walked for files ending in 'plist'.
    :param build_mode: When 1, the prefix to strip is the
           PATCHED_SOURCE_DIR_NAME sub-directory of *directory*.
    """
    for dir_path, _, filenames in os.walk(output_dir):
        plist_names = [name for name in filenames if name.endswith('plist')]

        for name in plist_names:
            plist = os.path.join(dir_path, name)
            with open(plist, "rb") as plist_file:
                data = plistlib.load(plist_file)

            if build_mode == 1:
                path_prefix = os.path.join(directory, PATCHED_SOURCE_DIR_NAME)
            else:
                path_prefix = directory

            # Strip the prefix plus the separator that follows it; paths
            # outside the prefix are kept untouched.
            strip_len = len(path_prefix) + 1
            relative_paths = []
            for source in data['files']:
                if source.startswith(path_prefix):
                    source = source[strip_len:]
                relative_paths.append(source)
            data['files'] = relative_paths

            # Remove transient fields which change from run to run.
            for diagnostic in data['diagnostics']:
                diagnostic.pop('HTMLDiagnostics_files', None)
            data.pop('clang_version', None)

            with open(plist, "wb") as plist_file:
                plistlib.dump(data, plist_file)
ec727ea7Spatrick
ec727ea7Spatrick
def get_build_log_path(output_dir: str) -> str:
    """
    Return the path of the build log file inside the log directory of
    *output_dir*.
    """
    log_dir = os.path.join(output_dir, LOG_DIR_NAME)
    return os.path.join(log_dir, BUILD_LOG_NAME)
ec727ea7Spatrick
ec727ea7Spatrick
def remove_log_file(output_dir: str):
    """
    Delete the build log file belonging to *output_dir*, if it exists.
    """
    log_path = get_build_log_path(output_dir)

    # Nothing to clean up when the log was never written.
    if not os.path.exists(log_path):
        return

    if VERBOSE >= 1:
        stdout(f"  Removing log file: {log_path}\n")

    os.remove(log_path)
ec727ea7Spatrick
ec727ea7Spatrick
def clean_up_empty_plists(output_dir: str):
    """
    A plist file is created for each call to the analyzer (each source file).
    We are only interested in the ones that have bug reports, so delete
    every plist whose 'files' entry is empty.

    Plists that raise InvalidFileException while loading are reported via
    ``stderr`` and left in place.

    :param output_dir: Results directory; plists are matched one directory
           level below it.
    """
    for plist in glob.glob(output_dir + "/*/*.plist"):
        # glob results already start with output_dir. Joining them with
        # output_dir again doubled the prefix whenever output_dir was a
        # relative path, so the file could not be opened.
        try:
            with open(plist, "rb") as plist_file:
                data = plistlib.load(plist_file)

        except InvalidFileException as e:
            stderr(f"Error parsing plist file {plist}: {str(e)}")
            continue

        # Delete empty reports.
        if not data['files']:
            os.remove(plist)
ec727ea7Spatrick
ec727ea7Spatrick
def clean_up_empty_folders(output_dir: str):
    """
    Remove the empty entries found directly under *output_dir*, as git
    would not store them.

    Removal goes through ``os.removedirs``, which also prunes parent
    directories that become empty as a result.
    """
    for entry in glob.glob(output_dir + "/*"):
        if os.listdir(entry):
            # Still has content; keep it.
            continue

        os.removedirs(entry)
ec727ea7Spatrick
ec727ea7Spatrick
if __name__ == "__main__":
    # Running this file directly is rejected: print the pointer to the
    # SATest.py entry point and exit with a failure status.
    for message in ("SATestBuild.py should not be used on its own.",
                    "Please use 'SATest.py build' instead"):
        print(message)
    sys.exit(1)