FuzzTest (revision e5dd70708596ae51455a0ffa086a00c5b29f8583) - OpenGrok cross reference for /openbsd-src/gnu/llvm/clang/utils/FuzzTest

#!/usr/bin/env python

"""
This is a generic fuzz testing tool; see --help for more information.
"""
*e5dd7070Spatrick
import itertools
import os
import random
import subprocess
import sys
*e5dd7070Spatrick
class TestGenerator:
    """Enumerate every single-edit mutation of a set of input files.

    Each test is identified by an integer index in ``[0, num_tests)`` and is
    described by a tuple ``(kind, position, insert_str, picked_position)``:

      * ``kind`` is one of 'nothing', 'delete', 'insert' or 'replace'.
      * ``position`` is ``(input_index, offset)`` for the byte being edited,
        or None for 'nothing'.
      * ``insert_str`` is the string used by 'insert'/'replace', else None.
      * ``picked_position`` is an ``(input_index, offset)`` pair when
        ``pick_input`` is enabled, else None.
    """

    def __init__(self, inputs, delete, insert, replace,
                 insert_strings, pick_input):
        """Load the input files and compute the size of the test space.

        inputs -- paths of the files to fuzz.
        delete, insert, replace -- truthy to enable that kind of edit.
        insert_strings -- strings used by the insert and replace edits.
        pick_input -- truthy to additionally select an input position for
            every test.
        """
        # Read raw bytes: the mutated and reverted contents are written back
        # in binary mode, so a text-mode read could alter line endings.
        self.inputs = []
        for path in inputs:
            with open(path, 'rb') as f:
                self.inputs.append((path, f.read()))

        self.delete = bool(delete)
        self.insert = bool(insert)
        self.replace = bool(replace)
        self.pick_input = bool(pick_input)
        # Keep the insert strings in the same type as the file contents so
        # they can be concatenated.  On Python 2 'str' already is 'bytes' and
        # is left untouched; text strings are encoded as UTF-8.
        self.insert_strings = [s if isinstance(s, bytes) else s.encode('utf-8')
                               for s in insert_strings]

        self.num_positions = sum(len(d) for _, d in self.inputs)
        self.num_insert_strings = len(self.insert_strings)
        # Use the normalized flags so this count always agrees with the
        # decoding performed by get_test().
        tests_per_position = (self.delete + (self.insert + self.replace)
                              * self.num_insert_strings)
        # The extra test is index 0, which leaves the inputs untouched.
        self.num_tests = tests_per_position * self.num_positions + 1

        if self.pick_input:
            self.num_tests *= self.num_positions

    def position_to_source_index(self, position):
        """Map a global byte position to ``(input_index, offset)``.

        Positions count through the inputs in order.  Raises ValueError if
        the position is outside the concatenated inputs.
        """
        if position < 0:
            raise ValueError('Invalid position.')
        for i, (_, d) in enumerate(self.inputs):
            n = len(d)
            if position < n:
                return (i, position)
            position -= n
        raise ValueError('Invalid position.')

    def get_test(self, index):
        """Decode a test index into its description tuple.

        Raises ValueError if ``index`` is not in ``[0, num_tests)``.
        """
        if not 0 <= index < self.num_tests:
            raise ValueError('Invalid test index %r (expected 0 <= index < %d)'
                             % (index, self.num_tests))

        # With pick_input, the low "digit" of the index is the picked
        # position and the remainder selects the edit.
        picked_position = None
        if self.pick_input:
            index, picked_position = divmod(index, self.num_positions)
            picked_position = self.position_to_source_index(picked_position)

        if index == 0:
            return ('nothing', None, None, picked_position)

        index -= 1
        index, position = divmod(index, self.num_positions)
        position = self.position_to_source_index(position)
        if self.delete:
            if index == 0:
                return ('delete', position, None, picked_position)
            index -= 1

        index, insert_index = divmod(index, self.num_insert_strings)
        insert_str = self.insert_strings[insert_index]
        if self.insert:
            if index == 0:
                return ('insert', position, insert_str, picked_position)
            index -= 1

        # Internal invariants: only 'replace' can remain at this point.
        assert self.replace
        assert index == 0
        return ('replace', position, insert_str, picked_position)
*e5dd7070Spatrick
class TestApplication:
    """Apply one generated test to the input files on disk, and undo it.

    ``tg`` must expose ``inputs``, a list of ``(path, original_contents)``
    pairs.  ``test`` is a tuple ``(kind, position, insert_str, ...)`` where
    ``position`` is ``(input_index, offset)``.
    """

    def __init__(self, tg, test):
        self.tg = tg
        self.test = test

    def _write(self, name, data):
        """Overwrite ``name`` with ``data``."""
        # Close the file explicitly so the contents are on disk before the
        # test command is run, regardless of the interpreter's GC strategy.
        with open(name, 'wb') as f:
            f.write(data)

    def apply(self):
        """Write the mutated contents of the affected input file.

        Does nothing for a 'nothing' test.  Raises ValueError (before
        touching the file) if the test kind is not recognized.
        """
        kind = self.test[0]
        if kind == 'nothing':
            return

        i, j = self.test[1]
        name, data = self.tg.inputs[i]
        if kind == 'delete':
            data = data[:j] + data[j+1:]
        elif kind == 'insert':
            data = data[:j] + self.test[2] + data[j:]
        elif kind == 'replace':
            data = data[:j] + self.test[2] + data[j+1:]
        else:
            # Wrap the tuple so it is formatted as one value instead of being
            # unpacked as multiple format arguments.
            raise ValueError('Invalid test %r' % (self.test,))
        self._write(name, data)

    def revert(self):
        """Restore the affected input file to its original contents."""
        if self.test[0] != 'nothing':
            i, _ = self.test[1]
            name, data = self.tg.inputs[i]
            self._write(name, data)
*e5dd7070Spatrick
def quote(str):
    """Return the given string wrapped in double quotes."""
    return ''.join(('"', str, '"'))
*e5dd7070Spatrick
def run_one_test(test_application, index, input_files, args):
    """Run the test command once and report whether it passed.

    test_application -- object exposing ``test`` (the test tuple) and
        ``tg.inputs`` (list of ``(path, contents)`` pairs).
    index -- the test index, used for interpolation, log names and output.
    input_files -- the list of input file paths.
    args -- the command line to run; each element is %-interpolated with
        the variables described in the --help text.

    Reads the module-level ``opts`` for verbosity, logging and the accepted
    exit codes.  Returns True if the command's exit code was one of the
    expected ones, False otherwise.
    """
    test = test_application.test

    # Interpolate arguments.
    options = {'index': index,
               'inputs': ' '.join(quote(f) for f in input_files)}

    # Add picked input interpolation arguments, if used.
    picked = test[3]
    if picked is not None:
        picked_index, pos = picked
        options['picked_input'] = input_files[picked_index]
        options['picked_input_pos'] = pos
        # Compute the 1-based line and column of the picked position from
        # the data preceding it.  The separator is chosen to match the data
        # type so this works for both byte and text contents.
        prefix = test_application.tg.inputs[picked_index][1][:pos]
        newline = b'\n' if isinstance(prefix, bytes) else '\n'
        options['picked_input_line'] = 1 + prefix.count(newline)
        # rfind() yields -1 when there is no preceding newline, which makes
        # the column len(prefix) + 1 as required.
        options['picked_input_col'] = len(prefix) - prefix.rfind(newline)

    test_args = [a % options for a in args]
    if opts.verbose:
        print('%s: note: executing %r' % (sys.argv[0], test_args))

    stdout = None
    stderr = None
    stdout_log_path = None
    stderr_log_path = None
    try:
        if opts.log_dir:
            stdout_log_path = os.path.join(opts.log_dir, '%s.out' % index)
            stderr_log_path = os.path.join(opts.log_dir, '%s.err' % index)
            stdout = open(stdout_log_path, 'wb')
            stderr = open(stderr_log_path, 'wb')
        else:
            # The child inherits our stdout; flush so output stays ordered.
            sys.stdout.flush()
        p = subprocess.Popen(test_args, stdout=stdout, stderr=stderr)
        # No pipes are attached to the child, so waiting is sufficient.
        exit_code = p.wait()
    finally:
        # Always release the log handles, even if the command failed to
        # start or the second log could not be opened.
        if stdout is not None:
            stdout.close()
        if stderr is not None:
            stderr.close()

    test_result = (exit_code == opts.expected_exit_code or
                   exit_code in opts.extra_exit_codes)

    # Remove the logs for passes, unless logging all results.
    if stdout_log_path is not None and not opts.log_all and test_result:
        os.remove(stdout_log_path)
        os.remove(stderr_log_path)

    if not test_result:
        print('FAIL: %d' % index)
    elif not opts.succinct:
        print('PASS: %d' % index)
    return test_result
*e5dd7070Spatrick
def main():
    """Parse the command line and run the selected fuzz tests.

    Stores the parsed options in the module-level ``opts`` (read by
    run_one_test).  For every selected test index the mutation is applied to
    the input files, the test command is run, and the files are restored
    unless reverting is disabled.  Exits with status 1 on the first failure
    when --stop-on-fail is given, leaving the fuzzed inputs in place.
    """
    global opts
    from optparse import OptionParser, OptionGroup
    parser = OptionParser("""%prog [options] ... test command args ...

%prog is a tool for fuzzing inputs and testing them.

The most basic usage is something like:

  $ %prog --file foo.txt ./test.sh

which will run a default list of fuzzing strategies on the input. For each
fuzzed input, it will overwrite the input files (in place), run the test script,
then restore the files back to their original contents.

NOTE: You should make sure you have a backup copy of your inputs, in case
something goes wrong!!!

You can cause the fuzzing to not restore the original files with
'--no-revert'. Generally this is used with '--test <index>' to run one failing
test and then leave the fuzzed inputs in place to examine the failure.

For each fuzzed input, %prog will run the test command given on the command
line. Each argument in the command is subject to string interpolation before
being executed. The syntax is "%(VARIABLE)FORMAT" where FORMAT is a standard
printf format, and VARIABLE is one of:

  'index' - the test index being run
  'inputs' - the full list of test inputs
  'picked_input'      - (with --pick-input) the selected input file
  'picked_input_pos'  - (with --pick-input) the selected input position
  'picked_input_line' - (with --pick-input) the selected input line
  'picked_input_col'  - (with --pick-input) the selected input column

By default, the script will run forever continually picking new tests to
run. You can limit the number of tests that are run with '--max-tests <number>',
and you can run a particular test with '--test <index>'.

You can specify '--stop-on-fail' to stop the script on the first failure
without reverting the changes.

""")
    parser.add_option("-v", "--verbose", help="Show more output",
                      action='store_true', dest="verbose", default=False)
    parser.add_option("-s", "--succinct",  help="Reduce amount of output",
                      action="store_true", dest="succinct", default=False)

    group = OptionGroup(parser, "Test Execution")
    group.add_option("", "--expected-exit-code", help="Set expected exit code",
                     type=int, dest="expected_exit_code",
                     default=0)
    group.add_option("", "--extra-exit-code",
                     help="Set additional expected exit code",
                     type=int, action="append", dest="extra_exit_codes",
                     default=[])
    group.add_option("", "--log-dir",
                     help="Capture test logs to an output directory",
                     type=str, dest="log_dir",
                     default=None)
    group.add_option("", "--log-all",
                     help="Log all outputs (not just failures)",
                     action="store_true", dest="log_all", default=False)
    parser.add_option_group(group)

    group = OptionGroup(parser, "Input Files")
    group.add_option("", "--file", metavar="PATH",
                     help="Add an input file to fuzz",
                     type=str, action="append", dest="input_files", default=[])
    group.add_option("", "--filelist", metavar="LIST",
                     help="Add a list of inputs files to fuzz (one per line)",
                     type=str, action="append", dest="filelists", default=[])
    parser.add_option_group(group)

    group = OptionGroup(parser, "Fuzz Options")
    # The backslash is escaped explicitly; the value is unchanged.
    group.add_option("", "--replacement-chars", dest="replacement_chars",
                     help="Characters to insert/replace",
                     default="0{}[]<>\\;@#$^%& ")
    group.add_option("", "--replacement-string", dest="replacement_strings",
                     action="append", help="Add a replacement string to use",
                     default=[])
    group.add_option("", "--replacement-list", dest="replacement_lists",
                     help="Add a list of replacement strings (one per line)",
                     action="append", default=[])
    group.add_option("", "--no-delete", help="Don't delete characters",
                     action='store_false', dest="enable_delete", default=True)
    group.add_option("", "--no-insert", help="Don't insert strings",
                     action='store_false', dest="enable_insert", default=True)
    group.add_option("", "--no-replace", help="Don't replace strings",
                     action='store_false', dest="enable_replace", default=True)
    group.add_option("", "--no-revert", help="Don't revert changes",
                     action='store_false', dest="revert", default=True)
    group.add_option("", "--stop-on-fail", help="Stop on first failure",
                     action='store_true', dest="stop_on_fail", default=False)
    parser.add_option_group(group)

    group = OptionGroup(parser, "Test Selection")
    group.add_option("", "--test", help="Run a particular test",
                     type=int, dest="test", default=None, metavar="INDEX")
    group.add_option("", "--max-tests", help="Maximum number of tests",
                     type=int, dest="max_tests", default=None, metavar="COUNT")
    group.add_option("", "--pick-input",
                     help="Randomly select an input byte as well as fuzzing",
                     action='store_true', dest="pick_input", default=False)
    parser.add_option_group(group)

    # Everything after the first positional argument belongs to the test
    # command, including anything that looks like an option.
    parser.disable_interspersed_args()

    (opts, args) = parser.parse_args()

    if not args:
        parser.error("Invalid number of arguments")

    # Collect the list of inputs.
    input_files = list(opts.input_files)
    for filelist in opts.filelists:
        with open(filelist) as f:
            for ln in f:
                ln = ln.strip()
                if ln:
                    input_files.append(ln)
    input_files.sort()

    if not input_files:
        parser.error("No input files!")

    print('%s: note: fuzzing %d files.' % (sys.argv[0], len(input_files)))

    # Make sure the log directory exists if used.
    if opts.log_dir:
        if not os.path.exists(opts.log_dir):
            try:
                os.mkdir(opts.log_dir)
            except OSError:
                print("%s: error: log directory couldn't be created!" % (
                    sys.argv[0],))
                raise SystemExit(1)

    # Get the list of insert/replacement strings.
    replacements = list(opts.replacement_chars)
    replacements.extend(opts.replacement_strings)
    for replacement_list in opts.replacement_lists:
        with open(replacement_list) as f:
            for ln in f:
                # Drop only the line terminator: other whitespace may be a
                # deliberate part of the replacement string, and a final
                # line without a newline must keep its last character.
                ln = ln.rstrip('\n')
                if ln:
                    replacements.append(ln)

    # Unique and order the replacement list.
    replacements = sorted(set(replacements))

    # Create the test generator.
    tg = TestGenerator(input_files, opts.enable_delete, opts.enable_insert,
                       opts.enable_replace, replacements, opts.pick_input)

    print('%s: note: %d input bytes.' % (sys.argv[0], tg.num_positions))
    print('%s: note: %d total tests.' % (sys.argv[0], tg.num_tests))
    if opts.test is not None:
        if not 0 <= opts.test < tg.num_tests:
            parser.error("Invalid test index %d (there are %d tests)"
                         % (opts.test, tg.num_tests))
        it = [opts.test]
    elif opts.max_tests is not None:
        # Lazily draw a bounded number of random test indices.
        it = (random.randrange(n)
              for n in itertools.repeat(tg.num_tests, opts.max_tests))
    else:
        # Lazily draw random test indices forever.
        it = (random.randrange(n) for n in itertools.repeat(tg.num_tests))
    for test in it:
        t = tg.get_test(test)

        if opts.verbose:
            print('%s: note: running test %d: %r' % (sys.argv[0], test, t))
        ta = TestApplication(tg, t)
        try:
            ta.apply()
            test_result = run_one_test(ta, test, input_files, args)
            if not test_result and opts.stop_on_fail:
                # Leave the failing inputs in place for inspection; the
                # 'finally' clause below honours this flag.
                opts.revert = False
                sys.exit(1)
        finally:
            if opts.revert:
                ta.revert()

        sys.stdout.flush()
*e5dd7070Spatrick
# Only run the tool when executed as a script, not when imported.
if __name__ == "__main__":
    main()