109467b48Spatrick //===-- ModuleUtils.cpp - Functions to manipulate Modules -----------------===// 209467b48Spatrick // 309467b48Spatrick // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 409467b48Spatrick // See https://llvm.org/LICENSE.txt for license information. 509467b48Spatrick // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 609467b48Spatrick // 709467b48Spatrick //===----------------------------------------------------------------------===// 809467b48Spatrick // 909467b48Spatrick // This family of functions perform manipulations on Modules. 1009467b48Spatrick // 1109467b48Spatrick //===----------------------------------------------------------------------===// 1209467b48Spatrick 1309467b48Spatrick #include "llvm/Transforms/Utils/ModuleUtils.h" 14097a140dSpatrick #include "llvm/Analysis/TargetLibraryInfo.h" 1509467b48Spatrick #include "llvm/Analysis/VectorUtils.h" 1609467b48Spatrick #include "llvm/IR/DerivedTypes.h" 1709467b48Spatrick #include "llvm/IR/Function.h" 1809467b48Spatrick #include "llvm/IR/IRBuilder.h" 1909467b48Spatrick #include "llvm/IR/Module.h" 2009467b48Spatrick #include "llvm/Support/raw_ostream.h" 2109467b48Spatrick using namespace llvm; 2209467b48Spatrick 23097a140dSpatrick #define DEBUG_TYPE "moduleutils" 24097a140dSpatrick 2509467b48Spatrick static void appendToGlobalArray(const char *Array, Module &M, Function *F, 2609467b48Spatrick int Priority, Constant *Data) { 2709467b48Spatrick IRBuilder<> IRB(M.getContext()); 2809467b48Spatrick FunctionType *FnTy = FunctionType::get(IRB.getVoidTy(), false); 2909467b48Spatrick 3009467b48Spatrick // Get the current set of static global constructors and add the new ctor 3109467b48Spatrick // to the list. 3209467b48Spatrick SmallVector<Constant *, 16> CurrentCtors; 3309467b48Spatrick StructType *EltTy = StructType::get( 3409467b48Spatrick IRB.getInt32Ty(), PointerType::getUnqual(FnTy), IRB.getInt8PtrTy()); 3509467b48Spatrick if (GlobalVariable *GVCtor = M.getNamedGlobal(Array)) { 3609467b48Spatrick if (Constant *Init = GVCtor->getInitializer()) { 3709467b48Spatrick unsigned n = Init->getNumOperands(); 3809467b48Spatrick CurrentCtors.reserve(n + 1); 3909467b48Spatrick for (unsigned i = 0; i != n; ++i) 4009467b48Spatrick CurrentCtors.push_back(cast<Constant>(Init->getOperand(i))); 4109467b48Spatrick } 4209467b48Spatrick GVCtor->eraseFromParent(); 4309467b48Spatrick } 4409467b48Spatrick 4509467b48Spatrick // Build a 3 field global_ctor entry. We don't take a comdat key. 4609467b48Spatrick Constant *CSVals[3]; 4709467b48Spatrick CSVals[0] = IRB.getInt32(Priority); 4809467b48Spatrick CSVals[1] = F; 4909467b48Spatrick CSVals[2] = Data ? ConstantExpr::getPointerCast(Data, IRB.getInt8PtrTy()) 5009467b48Spatrick : Constant::getNullValue(IRB.getInt8PtrTy()); 5109467b48Spatrick Constant *RuntimeCtorInit = 5209467b48Spatrick ConstantStruct::get(EltTy, makeArrayRef(CSVals, EltTy->getNumElements())); 5309467b48Spatrick 5409467b48Spatrick CurrentCtors.push_back(RuntimeCtorInit); 5509467b48Spatrick 5609467b48Spatrick // Create a new initializer. 5709467b48Spatrick ArrayType *AT = ArrayType::get(EltTy, CurrentCtors.size()); 5809467b48Spatrick Constant *NewInit = ConstantArray::get(AT, CurrentCtors); 5909467b48Spatrick 6009467b48Spatrick // Create the new global variable and replace all uses of 6109467b48Spatrick // the old global variable with the new one. 6209467b48Spatrick (void)new GlobalVariable(M, NewInit->getType(), false, 6309467b48Spatrick GlobalValue::AppendingLinkage, NewInit, Array); 6409467b48Spatrick } 6509467b48Spatrick 6609467b48Spatrick void llvm::appendToGlobalCtors(Module &M, Function *F, int Priority, Constant *Data) { 6709467b48Spatrick appendToGlobalArray("llvm.global_ctors", M, F, Priority, Data); 6809467b48Spatrick } 6909467b48Spatrick 7009467b48Spatrick void llvm::appendToGlobalDtors(Module &M, Function *F, int Priority, Constant *Data) { 7109467b48Spatrick appendToGlobalArray("llvm.global_dtors", M, F, Priority, Data); 7209467b48Spatrick } 7309467b48Spatrick 7409467b48Spatrick static void appendToUsedList(Module &M, StringRef Name, ArrayRef<GlobalValue *> Values) { 7509467b48Spatrick GlobalVariable *GV = M.getGlobalVariable(Name); 7609467b48Spatrick SmallPtrSet<Constant *, 16> InitAsSet; 7709467b48Spatrick SmallVector<Constant *, 16> Init; 7809467b48Spatrick if (GV) { 79*73471bf0Spatrick if (GV->hasInitializer()) { 8009467b48Spatrick auto *CA = cast<ConstantArray>(GV->getInitializer()); 8109467b48Spatrick for (auto &Op : CA->operands()) { 8209467b48Spatrick Constant *C = cast_or_null<Constant>(Op); 8309467b48Spatrick if (InitAsSet.insert(C).second) 8409467b48Spatrick Init.push_back(C); 8509467b48Spatrick } 86*73471bf0Spatrick } 8709467b48Spatrick GV->eraseFromParent(); 8809467b48Spatrick } 8909467b48Spatrick 9009467b48Spatrick Type *Int8PtrTy = llvm::Type::getInt8PtrTy(M.getContext()); 9109467b48Spatrick for (auto *V : Values) { 92*73471bf0Spatrick Constant *C = ConstantExpr::getPointerBitCastOrAddrSpaceCast(V, Int8PtrTy); 9309467b48Spatrick if (InitAsSet.insert(C).second) 9409467b48Spatrick Init.push_back(C); 9509467b48Spatrick } 9609467b48Spatrick 9709467b48Spatrick if (Init.empty()) 9809467b48Spatrick return; 9909467b48Spatrick 10009467b48Spatrick ArrayType *ATy = ArrayType::get(Int8PtrTy, Init.size()); 10109467b48Spatrick GV = new llvm::GlobalVariable(M, ATy, false, GlobalValue::AppendingLinkage, 10209467b48Spatrick ConstantArray::get(ATy, Init), Name); 10309467b48Spatrick GV->setSection("llvm.metadata"); 10409467b48Spatrick } 10509467b48Spatrick 10609467b48Spatrick void llvm::appendToUsed(Module &M, ArrayRef<GlobalValue *> Values) { 10709467b48Spatrick appendToUsedList(M, "llvm.used", Values); 10809467b48Spatrick } 10909467b48Spatrick 11009467b48Spatrick void llvm::appendToCompilerUsed(Module &M, ArrayRef<GlobalValue *> Values) { 11109467b48Spatrick appendToUsedList(M, "llvm.compiler.used", Values); 11209467b48Spatrick } 11309467b48Spatrick 11409467b48Spatrick FunctionCallee 11509467b48Spatrick llvm::declareSanitizerInitFunction(Module &M, StringRef InitName, 11609467b48Spatrick ArrayRef<Type *> InitArgTypes) { 11709467b48Spatrick assert(!InitName.empty() && "Expected init function name"); 11809467b48Spatrick return M.getOrInsertFunction( 11909467b48Spatrick InitName, 12009467b48Spatrick FunctionType::get(Type::getVoidTy(M.getContext()), InitArgTypes, false), 12109467b48Spatrick AttributeList()); 12209467b48Spatrick } 12309467b48Spatrick 124097a140dSpatrick Function *llvm::createSanitizerCtor(Module &M, StringRef CtorName) { 125*73471bf0Spatrick Function *Ctor = Function::createWithDefaultAttr( 126097a140dSpatrick FunctionType::get(Type::getVoidTy(M.getContext()), false), 127*73471bf0Spatrick GlobalValue::InternalLinkage, 0, CtorName, &M); 128*73471bf0Spatrick Ctor->addAttribute(AttributeList::FunctionIndex, Attribute::NoUnwind); 129097a140dSpatrick BasicBlock *CtorBB = BasicBlock::Create(M.getContext(), "", Ctor); 130097a140dSpatrick ReturnInst::Create(M.getContext(), CtorBB); 131*73471bf0Spatrick // Ensure Ctor cannot be discarded, even if in a comdat. 132*73471bf0Spatrick appendToUsed(M, {Ctor}); 133097a140dSpatrick return Ctor; 134097a140dSpatrick } 135097a140dSpatrick 13609467b48Spatrick std::pair<Function *, FunctionCallee> llvm::createSanitizerCtorAndInitFunctions( 13709467b48Spatrick Module &M, StringRef CtorName, StringRef InitName, 13809467b48Spatrick ArrayRef<Type *> InitArgTypes, ArrayRef<Value *> InitArgs, 13909467b48Spatrick StringRef VersionCheckName) { 14009467b48Spatrick assert(!InitName.empty() && "Expected init function name"); 14109467b48Spatrick assert(InitArgs.size() == InitArgTypes.size() && 14209467b48Spatrick "Sanitizer's init function expects different number of arguments"); 14309467b48Spatrick FunctionCallee InitFunction = 14409467b48Spatrick declareSanitizerInitFunction(M, InitName, InitArgTypes); 145097a140dSpatrick Function *Ctor = createSanitizerCtor(M, CtorName); 146097a140dSpatrick IRBuilder<> IRB(Ctor->getEntryBlock().getTerminator()); 14709467b48Spatrick IRB.CreateCall(InitFunction, InitArgs); 14809467b48Spatrick if (!VersionCheckName.empty()) { 14909467b48Spatrick FunctionCallee VersionCheckFunction = M.getOrInsertFunction( 15009467b48Spatrick VersionCheckName, FunctionType::get(IRB.getVoidTy(), {}, false), 15109467b48Spatrick AttributeList()); 15209467b48Spatrick IRB.CreateCall(VersionCheckFunction, {}); 15309467b48Spatrick } 15409467b48Spatrick return std::make_pair(Ctor, InitFunction); 15509467b48Spatrick } 15609467b48Spatrick 15709467b48Spatrick std::pair<Function *, FunctionCallee> 15809467b48Spatrick llvm::getOrCreateSanitizerCtorAndInitFunctions( 15909467b48Spatrick Module &M, StringRef CtorName, StringRef InitName, 16009467b48Spatrick ArrayRef<Type *> InitArgTypes, ArrayRef<Value *> InitArgs, 16109467b48Spatrick function_ref<void(Function *, FunctionCallee)> FunctionsCreatedCallback, 16209467b48Spatrick StringRef VersionCheckName) { 16309467b48Spatrick assert(!CtorName.empty() && "Expected ctor function name"); 16409467b48Spatrick 16509467b48Spatrick if (Function *Ctor = M.getFunction(CtorName)) 16609467b48Spatrick // FIXME: Sink this logic into the module, similar to the handling of 16709467b48Spatrick // globals. This will make moving to a concurrent model much easier. 16809467b48Spatrick if (Ctor->arg_size() == 0 || 16909467b48Spatrick Ctor->getReturnType() == Type::getVoidTy(M.getContext())) 17009467b48Spatrick return {Ctor, declareSanitizerInitFunction(M, InitName, InitArgTypes)}; 17109467b48Spatrick 17209467b48Spatrick Function *Ctor; 17309467b48Spatrick FunctionCallee InitFunction; 17409467b48Spatrick std::tie(Ctor, InitFunction) = llvm::createSanitizerCtorAndInitFunctions( 17509467b48Spatrick M, CtorName, InitName, InitArgTypes, InitArgs, VersionCheckName); 17609467b48Spatrick FunctionsCreatedCallback(Ctor, InitFunction); 17709467b48Spatrick return std::make_pair(Ctor, InitFunction); 17809467b48Spatrick } 17909467b48Spatrick 18009467b48Spatrick void llvm::filterDeadComdatFunctions( 18109467b48Spatrick Module &M, SmallVectorImpl<Function *> &DeadComdatFunctions) { 18209467b48Spatrick // Build a map from the comdat to the number of entries in that comdat we 18309467b48Spatrick // think are dead. If this fully covers the comdat group, then the entire 18409467b48Spatrick // group is dead. If we find another entry in the comdat group though, we'll 18509467b48Spatrick // have to preserve the whole group. 18609467b48Spatrick SmallDenseMap<Comdat *, int, 16> ComdatEntriesCovered; 18709467b48Spatrick for (Function *F : DeadComdatFunctions) { 18809467b48Spatrick Comdat *C = F->getComdat(); 18909467b48Spatrick assert(C && "Expected all input GVs to be in a comdat!"); 19009467b48Spatrick ComdatEntriesCovered[C] += 1; 19109467b48Spatrick } 19209467b48Spatrick 19309467b48Spatrick auto CheckComdat = [&](Comdat &C) { 19409467b48Spatrick auto CI = ComdatEntriesCovered.find(&C); 19509467b48Spatrick if (CI == ComdatEntriesCovered.end()) 19609467b48Spatrick return; 19709467b48Spatrick 19809467b48Spatrick // If this could have been covered by a dead entry, just subtract one to 19909467b48Spatrick // account for it. 20009467b48Spatrick if (CI->second > 0) { 20109467b48Spatrick CI->second -= 1; 20209467b48Spatrick return; 20309467b48Spatrick } 20409467b48Spatrick 20509467b48Spatrick // If we've already accounted for all the entries that were dead, the 20609467b48Spatrick // entire comdat is alive so remove it from the map. 20709467b48Spatrick ComdatEntriesCovered.erase(CI); 20809467b48Spatrick }; 20909467b48Spatrick 21009467b48Spatrick auto CheckAllComdats = [&] { 21109467b48Spatrick for (Function &F : M.functions()) 21209467b48Spatrick if (Comdat *C = F.getComdat()) { 21309467b48Spatrick CheckComdat(*C); 21409467b48Spatrick if (ComdatEntriesCovered.empty()) 21509467b48Spatrick return; 21609467b48Spatrick } 21709467b48Spatrick for (GlobalVariable &GV : M.globals()) 21809467b48Spatrick if (Comdat *C = GV.getComdat()) { 21909467b48Spatrick CheckComdat(*C); 22009467b48Spatrick if (ComdatEntriesCovered.empty()) 22109467b48Spatrick return; 22209467b48Spatrick } 22309467b48Spatrick for (GlobalAlias &GA : M.aliases()) 22409467b48Spatrick if (Comdat *C = GA.getComdat()) { 22509467b48Spatrick CheckComdat(*C); 22609467b48Spatrick if (ComdatEntriesCovered.empty()) 22709467b48Spatrick return; 22809467b48Spatrick } 22909467b48Spatrick }; 23009467b48Spatrick CheckAllComdats(); 23109467b48Spatrick 23209467b48Spatrick if (ComdatEntriesCovered.empty()) { 23309467b48Spatrick DeadComdatFunctions.clear(); 23409467b48Spatrick return; 23509467b48Spatrick } 23609467b48Spatrick 23709467b48Spatrick // Remove the entries that were not covering. 23809467b48Spatrick erase_if(DeadComdatFunctions, [&](GlobalValue *GV) { 23909467b48Spatrick return ComdatEntriesCovered.find(GV->getComdat()) == 24009467b48Spatrick ComdatEntriesCovered.end(); 24109467b48Spatrick }); 24209467b48Spatrick } 24309467b48Spatrick 24409467b48Spatrick std::string llvm::getUniqueModuleId(Module *M) { 24509467b48Spatrick MD5 Md5; 24609467b48Spatrick bool ExportsSymbols = false; 24709467b48Spatrick auto AddGlobal = [&](GlobalValue &GV) { 24809467b48Spatrick if (GV.isDeclaration() || GV.getName().startswith("llvm.") || 24909467b48Spatrick !GV.hasExternalLinkage() || GV.hasComdat()) 25009467b48Spatrick return; 25109467b48Spatrick ExportsSymbols = true; 25209467b48Spatrick Md5.update(GV.getName()); 25309467b48Spatrick Md5.update(ArrayRef<uint8_t>{0}); 25409467b48Spatrick }; 25509467b48Spatrick 25609467b48Spatrick for (auto &F : *M) 25709467b48Spatrick AddGlobal(F); 25809467b48Spatrick for (auto &GV : M->globals()) 25909467b48Spatrick AddGlobal(GV); 26009467b48Spatrick for (auto &GA : M->aliases()) 26109467b48Spatrick AddGlobal(GA); 26209467b48Spatrick for (auto &IF : M->ifuncs()) 26309467b48Spatrick AddGlobal(IF); 26409467b48Spatrick 26509467b48Spatrick if (!ExportsSymbols) 26609467b48Spatrick return ""; 26709467b48Spatrick 26809467b48Spatrick MD5::MD5Result R; 26909467b48Spatrick Md5.final(R); 27009467b48Spatrick 27109467b48Spatrick SmallString<32> Str; 27209467b48Spatrick MD5::stringifyResult(R, Str); 273*73471bf0Spatrick return ("." + Str).str(); 27409467b48Spatrick } 27509467b48Spatrick 27609467b48Spatrick void VFABI::setVectorVariantNames( 27709467b48Spatrick CallInst *CI, const SmallVector<std::string, 8> &VariantMappings) { 27809467b48Spatrick if (VariantMappings.empty()) 27909467b48Spatrick return; 28009467b48Spatrick 28109467b48Spatrick SmallString<256> Buffer; 28209467b48Spatrick llvm::raw_svector_ostream Out(Buffer); 28309467b48Spatrick for (const std::string &VariantMapping : VariantMappings) 28409467b48Spatrick Out << VariantMapping << ","; 28509467b48Spatrick // Get rid of the trailing ','. 28609467b48Spatrick assert(!Buffer.str().empty() && "Must have at least one char."); 28709467b48Spatrick Buffer.pop_back(); 28809467b48Spatrick 28909467b48Spatrick Module *M = CI->getModule(); 29009467b48Spatrick #ifndef NDEBUG 29109467b48Spatrick for (const std::string &VariantMapping : VariantMappings) { 292097a140dSpatrick LLVM_DEBUG(dbgs() << "VFABI: adding mapping '" << VariantMapping << "'\n"); 293097a140dSpatrick Optional<VFInfo> VI = VFABI::tryDemangleForVFABI(VariantMapping, *M); 294097a140dSpatrick assert(VI.hasValue() && "Cannot add an invalid VFABI name."); 29509467b48Spatrick assert(M->getNamedValue(VI.getValue().VectorName) && 29609467b48Spatrick "Cannot add variant to attribute: " 29709467b48Spatrick "vector function declaration is missing."); 29809467b48Spatrick } 29909467b48Spatrick #endif 30009467b48Spatrick CI->addAttribute( 30109467b48Spatrick AttributeList::FunctionIndex, 30209467b48Spatrick Attribute::get(M->getContext(), MappingsAttrName, Buffer.str())); 30309467b48Spatrick } 304