1e5dd7070Spatrick //==-- handle_llvm.cpp - Helper function for Clang fuzzers -----------------==//
2e5dd7070Spatrick //
3e5dd7070Spatrick // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4e5dd7070Spatrick // See https://llvm.org/LICENSE.txt for license information.
5e5dd7070Spatrick // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6e5dd7070Spatrick //
7e5dd7070Spatrick //===----------------------------------------------------------------------===//
8e5dd7070Spatrick //
// Implements HandleLLVM for use by the Clang fuzzers. First runs the
// optimization pipeline for the requested -O level over the given IR code. Then
// mimics lli on both the optimized and the original IR to JIT the generated
// code and execute it. Currently, functions are executed on dummy inputs.
13e5dd7070Spatrick //
14e5dd7070Spatrick //===----------------------------------------------------------------------===//
15e5dd7070Spatrick
16e5dd7070Spatrick #include "handle_llvm.h"
17e5dd7070Spatrick #include "input_arrays.h"
18e5dd7070Spatrick
19e5dd7070Spatrick #include "llvm/ADT/Triple.h"
20e5dd7070Spatrick #include "llvm/Analysis/TargetLibraryInfo.h"
21e5dd7070Spatrick #include "llvm/Analysis/TargetTransformInfo.h"
22ec727ea7Spatrick #include "llvm/CodeGen/CommandFlags.h"
23e5dd7070Spatrick #include "llvm/CodeGen/MachineModuleInfo.h"
24e5dd7070Spatrick #include "llvm/CodeGen/TargetPassConfig.h"
25e5dd7070Spatrick #include "llvm/ExecutionEngine/JITEventListener.h"
26e5dd7070Spatrick #include "llvm/ExecutionEngine/JITSymbol.h"
27e5dd7070Spatrick #include "llvm/ExecutionEngine/MCJIT.h"
28e5dd7070Spatrick #include "llvm/ExecutionEngine/ObjectCache.h"
29e5dd7070Spatrick #include "llvm/ExecutionEngine/RTDyldMemoryManager.h"
30e5dd7070Spatrick #include "llvm/ExecutionEngine/SectionMemoryManager.h"
31e5dd7070Spatrick #include "llvm/IR/IRPrintingPasses.h"
32ec727ea7Spatrick #include "llvm/IR/LLVMContext.h"
33e5dd7070Spatrick #include "llvm/IR/Module.h"
34e5dd7070Spatrick #include "llvm/IR/Verifier.h"
35*12c85518Srobert #include "llvm/IRPrinter/IRPrintingPasses.h"
36e5dd7070Spatrick #include "llvm/IRReader/IRReader.h"
37*12c85518Srobert #include "llvm/MC/TargetRegistry.h"
38*12c85518Srobert #include "llvm/Passes/OptimizationLevel.h"
39*12c85518Srobert #include "llvm/Passes/PassBuilder.h"
40e5dd7070Spatrick #include "llvm/Support/MemoryBuffer.h"
41e5dd7070Spatrick #include "llvm/Support/SourceMgr.h"
42e5dd7070Spatrick #include "llvm/Support/TargetSelect.h"
43e5dd7070Spatrick #include "llvm/Target/TargetMachine.h"
44e5dd7070Spatrick
45e5dd7070Spatrick using namespace llvm;
46e5dd7070Spatrick
// Signature of the functions that are JIT-compiled and executed: three int
// pointers followed by an int.
using LLVMFunc = void (*)(int *, int *, int *, int);
49e5dd7070Spatrick
50e5dd7070Spatrick // Helper function to parse command line args and find the optimization level
51*12c85518Srobert static CodeGenOpt::Level
getOptLevel(const std::vector<const char * > & ExtraArgs)52*12c85518Srobert getOptLevel(const std::vector<const char *> &ExtraArgs) {
53e5dd7070Spatrick // Find the optimization level from the command line args
54*12c85518Srobert CodeGenOpt::Level OLvl = CodeGenOpt::Default;
55e5dd7070Spatrick for (auto &A : ExtraArgs) {
56e5dd7070Spatrick if (A[0] == '-' && A[1] == 'O') {
57*12c85518Srobert if (auto Level = CodeGenOpt::parseLevel(A[2])) {
58*12c85518Srobert OLvl = *Level;
59*12c85518Srobert } else {
60e5dd7070Spatrick errs() << "error: opt level must be between 0 and 3.\n";
61e5dd7070Spatrick std::exit(1);
62e5dd7070Spatrick }
63e5dd7070Spatrick }
64e5dd7070Spatrick }
65*12c85518Srobert return OLvl;
66e5dd7070Spatrick }
67e5dd7070Spatrick
ErrorAndExit(std::string message)68e5dd7070Spatrick static void ErrorAndExit(std::string message) {
69e5dd7070Spatrick errs()<< "ERROR: " << message << "\n";
70e5dd7070Spatrick std::exit(1);
71e5dd7070Spatrick }
72e5dd7070Spatrick
73e5dd7070Spatrick // Helper function to add optimization passes to the TargetMachine at the
74e5dd7070Spatrick // specified optimization level, OptLevel
RunOptimizationPasses(raw_ostream & OS,Module & M,CodeGenOpt::Level OptLevel)75*12c85518Srobert static void RunOptimizationPasses(raw_ostream &OS, Module &M,
76*12c85518Srobert CodeGenOpt::Level OptLevel) {
77*12c85518Srobert llvm::OptimizationLevel OL;
78*12c85518Srobert switch (OptLevel) {
79*12c85518Srobert case CodeGenOpt::None:
80*12c85518Srobert OL = OptimizationLevel::O0;
81*12c85518Srobert break;
82*12c85518Srobert case CodeGenOpt::Less:
83*12c85518Srobert OL = OptimizationLevel::O1;
84*12c85518Srobert break;
85*12c85518Srobert case CodeGenOpt::Default:
86*12c85518Srobert OL = OptimizationLevel::O2;
87*12c85518Srobert break;
88*12c85518Srobert case CodeGenOpt::Aggressive:
89*12c85518Srobert OL = OptimizationLevel::O3;
90*12c85518Srobert break;
91*12c85518Srobert }
92*12c85518Srobert
93*12c85518Srobert LoopAnalysisManager LAM;
94*12c85518Srobert FunctionAnalysisManager FAM;
95*12c85518Srobert CGSCCAnalysisManager CGAM;
96*12c85518Srobert ModuleAnalysisManager MAM;
97*12c85518Srobert
98*12c85518Srobert PassBuilder PB;
99*12c85518Srobert
100*12c85518Srobert PB.registerModuleAnalyses(MAM);
101*12c85518Srobert PB.registerCGSCCAnalyses(CGAM);
102*12c85518Srobert PB.registerFunctionAnalyses(FAM);
103*12c85518Srobert PB.registerLoopAnalyses(LAM);
104*12c85518Srobert PB.crossRegisterProxies(LAM, FAM, CGAM, MAM);
105*12c85518Srobert
106*12c85518Srobert ModulePassManager MPM;
107*12c85518Srobert if (OL == OptimizationLevel::O0)
108*12c85518Srobert MPM = PB.buildO0DefaultPipeline(OL);
109*12c85518Srobert else
110*12c85518Srobert MPM = PB.buildPerModuleDefaultPipeline(OL);
111*12c85518Srobert MPM.addPass(PrintModulePass(OS));
112*12c85518Srobert
113*12c85518Srobert MPM.run(M, MAM);
114e5dd7070Spatrick }
115e5dd7070Spatrick
116e5dd7070Spatrick // Mimics the opt tool to run an optimization pass over the provided IR
OptLLVM(const std::string & IR,CodeGenOpt::Level OLvl)117e5dd7070Spatrick static std::string OptLLVM(const std::string &IR, CodeGenOpt::Level OLvl) {
118e5dd7070Spatrick // Create a module that will run the optimization passes
119e5dd7070Spatrick SMDiagnostic Err;
120e5dd7070Spatrick LLVMContext Context;
121e5dd7070Spatrick std::unique_ptr<Module> M = parseIR(MemoryBufferRef(IR, "IR"), Err, Context);
122e5dd7070Spatrick if (!M || verifyModule(*M, &errs()))
123e5dd7070Spatrick ErrorAndExit("Could not parse IR");
124e5dd7070Spatrick
125e5dd7070Spatrick Triple ModuleTriple(M->getTargetTriple());
126a9ac8606Spatrick const TargetOptions Options =
127a9ac8606Spatrick codegen::InitTargetOptionsFromCodeGenFlags(ModuleTriple);
128e5dd7070Spatrick std::string E;
129ec727ea7Spatrick const Target *TheTarget =
130ec727ea7Spatrick TargetRegistry::lookupTarget(codegen::getMArch(), ModuleTriple, E);
131a9ac8606Spatrick if (!TheTarget)
132a9ac8606Spatrick ErrorAndExit(E);
133a9ac8606Spatrick
134a9ac8606Spatrick std::unique_ptr<TargetMachine> TM(TheTarget->createTargetMachine(
135ec727ea7Spatrick M->getTargetTriple(), codegen::getCPUStr(), codegen::getFeaturesStr(),
136ec727ea7Spatrick Options, codegen::getExplicitRelocModel(),
137a9ac8606Spatrick codegen::getExplicitCodeModel(), OLvl));
138a9ac8606Spatrick if (!TM)
139a9ac8606Spatrick ErrorAndExit("Could not create target machine");
140a9ac8606Spatrick
141ec727ea7Spatrick codegen::setFunctionAttributes(codegen::getCPUStr(),
142ec727ea7Spatrick codegen::getFeaturesStr(), *M);
143e5dd7070Spatrick
144e5dd7070Spatrick // Add a pass that writes the optimized IR to an output stream
145e5dd7070Spatrick std::string outString;
146e5dd7070Spatrick raw_string_ostream OS(outString);
147*12c85518Srobert RunOptimizationPasses(OS, *M, OLvl);
148e5dd7070Spatrick
149*12c85518Srobert return outString;
150e5dd7070Spatrick }
151e5dd7070Spatrick
152e5dd7070Spatrick // Takes a function and runs it on a set of inputs
153e5dd7070Spatrick // First determines whether f is the optimized or unoptimized function
RunFuncOnInputs(LLVMFunc f,int Arr[kNumArrays][kArraySize])154e5dd7070Spatrick static void RunFuncOnInputs(LLVMFunc f, int Arr[kNumArrays][kArraySize]) {
155e5dd7070Spatrick for (int i = 0; i < kNumArrays / 3; i++)
156e5dd7070Spatrick f(Arr[i], Arr[i + (kNumArrays / 3)], Arr[i + (2 * kNumArrays / 3)],
157e5dd7070Spatrick kArraySize);
158e5dd7070Spatrick }
159e5dd7070Spatrick
160e5dd7070Spatrick // Takes a string of IR and compiles it using LLVM's JIT Engine
CreateAndRunJITFunc(const std::string & IR,CodeGenOpt::Level OLvl)161e5dd7070Spatrick static void CreateAndRunJITFunc(const std::string &IR, CodeGenOpt::Level OLvl) {
162e5dd7070Spatrick SMDiagnostic Err;
163e5dd7070Spatrick LLVMContext Context;
164e5dd7070Spatrick std::unique_ptr<Module> M = parseIR(MemoryBufferRef(IR, "IR"), Err, Context);
165e5dd7070Spatrick if (!M)
166e5dd7070Spatrick ErrorAndExit("Could not parse IR");
167e5dd7070Spatrick
168e5dd7070Spatrick Function *EntryFunc = M->getFunction("foo");
169e5dd7070Spatrick if (!EntryFunc)
170e5dd7070Spatrick ErrorAndExit("Function not found in module");
171e5dd7070Spatrick
172e5dd7070Spatrick std::string ErrorMsg;
173a9ac8606Spatrick Triple ModuleTriple(M->getTargetTriple());
174a9ac8606Spatrick
175e5dd7070Spatrick EngineBuilder builder(std::move(M));
176ec727ea7Spatrick builder.setMArch(codegen::getMArch());
177ec727ea7Spatrick builder.setMCPU(codegen::getCPUStr());
178ec727ea7Spatrick builder.setMAttrs(codegen::getFeatureList());
179e5dd7070Spatrick builder.setErrorStr(&ErrorMsg);
180e5dd7070Spatrick builder.setEngineKind(EngineKind::JIT);
181e5dd7070Spatrick builder.setMCJITMemoryManager(std::make_unique<SectionMemoryManager>());
182e5dd7070Spatrick builder.setOptLevel(OLvl);
183a9ac8606Spatrick builder.setTargetOptions(
184a9ac8606Spatrick codegen::InitTargetOptionsFromCodeGenFlags(ModuleTriple));
185e5dd7070Spatrick
186e5dd7070Spatrick std::unique_ptr<ExecutionEngine> EE(builder.create());
187e5dd7070Spatrick if (!EE)
188e5dd7070Spatrick ErrorAndExit("Could not create execution engine");
189e5dd7070Spatrick
190e5dd7070Spatrick EE->finalizeObject();
191e5dd7070Spatrick EE->runStaticConstructorsDestructors(false);
192e5dd7070Spatrick
193e5dd7070Spatrick #if defined(__GNUC__) && !defined(__clang) && \
194e5dd7070Spatrick ((__GNUC__ == 4) && (__GNUC_MINOR__ < 9))
195e5dd7070Spatrick // Silence
196e5dd7070Spatrick //
197e5dd7070Spatrick // warning: ISO C++ forbids casting between pointer-to-function and
198e5dd7070Spatrick // pointer-to-object [-Wpedantic]
199e5dd7070Spatrick //
200e5dd7070Spatrick // Since C++11 this casting is conditionally supported and GCC versions
201e5dd7070Spatrick // starting from 4.9.0 don't warn about the cast.
202e5dd7070Spatrick #pragma GCC diagnostic push
203e5dd7070Spatrick #pragma GCC diagnostic ignored "-Wpedantic"
204e5dd7070Spatrick #endif
205e5dd7070Spatrick LLVMFunc f = reinterpret_cast<LLVMFunc>(EE->getPointerToFunction(EntryFunc));
206e5dd7070Spatrick #if defined(__GNUC__) && !defined(__clang) && \
207e5dd7070Spatrick ((__GNUC__ == 4) && (__GNUC_MINOR__ < 9))
208e5dd7070Spatrick #pragma GCC diagnostic pop
209e5dd7070Spatrick #endif
210e5dd7070Spatrick
211e5dd7070Spatrick // Figure out if we are running the optimized func or the unoptimized func
212e5dd7070Spatrick RunFuncOnInputs(f, (OLvl == CodeGenOpt::None) ? UnoptArrays : OptArrays);
213e5dd7070Spatrick
214e5dd7070Spatrick EE->runStaticConstructorsDestructors(true);
215e5dd7070Spatrick }
216e5dd7070Spatrick
217e5dd7070Spatrick // Main fuzz target called by ExampleClangLLVMProtoFuzzer.cpp
218e5dd7070Spatrick // Mimics the lli tool to JIT the LLVM IR code and execute it
HandleLLVM(const std::string & IR,const std::vector<const char * > & ExtraArgs)219e5dd7070Spatrick void clang_fuzzer::HandleLLVM(const std::string &IR,
220e5dd7070Spatrick const std::vector<const char *> &ExtraArgs) {
221e5dd7070Spatrick // Populate OptArrays and UnoptArrays with the arrays from InputArrays
222e5dd7070Spatrick memcpy(OptArrays, InputArrays, kTotalSize);
223e5dd7070Spatrick memcpy(UnoptArrays, InputArrays, kTotalSize);
224e5dd7070Spatrick
225e5dd7070Spatrick // Parse ExtraArgs to set the optimization level
226*12c85518Srobert CodeGenOpt::Level OLvl = getOptLevel(ExtraArgs);
227e5dd7070Spatrick
228e5dd7070Spatrick // First we optimize the IR by running a loop vectorizer pass
229e5dd7070Spatrick std::string OptIR = OptLLVM(IR, OLvl);
230e5dd7070Spatrick
231e5dd7070Spatrick CreateAndRunJITFunc(OptIR, OLvl);
232e5dd7070Spatrick CreateAndRunJITFunc(IR, CodeGenOpt::None);
233e5dd7070Spatrick
234e5dd7070Spatrick if (memcmp(OptArrays, UnoptArrays, kTotalSize))
235e5dd7070Spatrick ErrorAndExit("!!!BUG!!!");
236e5dd7070Spatrick }
237