1 //===- ModuleSummaryAnalysis.cpp - Module summary index builder -----------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This pass builds a ModuleSummaryIndex object for the module, to be written 10 // to bitcode or LLVM assembly. 11 // 12 //===----------------------------------------------------------------------===// 13 14 #include "llvm/Analysis/ModuleSummaryAnalysis.h" 15 #include "llvm/ADT/ArrayRef.h" 16 #include "llvm/ADT/DenseSet.h" 17 #include "llvm/ADT/MapVector.h" 18 #include "llvm/ADT/STLExtras.h" 19 #include "llvm/ADT/SetVector.h" 20 #include "llvm/ADT/SmallPtrSet.h" 21 #include "llvm/ADT/SmallVector.h" 22 #include "llvm/ADT/StringRef.h" 23 #include "llvm/Analysis/BlockFrequencyInfo.h" 24 #include "llvm/Analysis/BranchProbabilityInfo.h" 25 #include "llvm/Analysis/IndirectCallPromotionAnalysis.h" 26 #include "llvm/Analysis/LoopInfo.h" 27 #include "llvm/Analysis/ProfileSummaryInfo.h" 28 #include "llvm/Analysis/TypeMetadataUtils.h" 29 #include "llvm/IR/Attributes.h" 30 #include "llvm/IR/BasicBlock.h" 31 #include "llvm/IR/CallSite.h" 32 #include "llvm/IR/Constant.h" 33 #include "llvm/IR/Constants.h" 34 #include "llvm/IR/Dominators.h" 35 #include "llvm/IR/Function.h" 36 #include "llvm/IR/GlobalAlias.h" 37 #include "llvm/IR/GlobalValue.h" 38 #include "llvm/IR/GlobalVariable.h" 39 #include "llvm/IR/Instructions.h" 40 #include "llvm/IR/IntrinsicInst.h" 41 #include "llvm/IR/Intrinsics.h" 42 #include "llvm/IR/Metadata.h" 43 #include "llvm/IR/Module.h" 44 #include "llvm/IR/ModuleSummaryIndex.h" 45 #include "llvm/IR/Use.h" 46 #include "llvm/IR/User.h" 47 #include "llvm/Object/ModuleSymbolTable.h" 48 #include "llvm/Object/SymbolicFile.h" 49 #include "llvm/Pass.h" 50 #include "llvm/Support/Casting.h" 51 #include "llvm/Support/CommandLine.h" 52 #include <algorithm> 53 #include <cassert> 54 #include <cstdint> 55 #include <vector> 56 57 using namespace llvm; 58 59 #define DEBUG_TYPE "module-summary-analysis" 60 61 // Option to force edges cold which will block importing when the 62 // -import-cold-multiplier is set to 0. Useful for debugging. 63 FunctionSummary::ForceSummaryHotnessType ForceSummaryEdgesCold = 64 FunctionSummary::FSHT_None; 65 cl::opt<FunctionSummary::ForceSummaryHotnessType, true> FSEC( 66 "force-summary-edges-cold", cl::Hidden, cl::location(ForceSummaryEdgesCold), 67 cl::desc("Force all edges in the function summary to cold"), 68 cl::values(clEnumValN(FunctionSummary::FSHT_None, "none", "None."), 69 clEnumValN(FunctionSummary::FSHT_AllNonCritical, 70 "all-non-critical", "All non-critical edges."), 71 clEnumValN(FunctionSummary::FSHT_All, "all", "All edges."))); 72 73 // Walk through the operands of a given User via worklist iteration and populate 74 // the set of GlobalValue references encountered. Invoked either on an 75 // Instruction or a GlobalVariable (which walks its initializer). 76 // Return true if any of the operands contains blockaddress. This is important 77 // to know when computing summary for global var, because if global variable 78 // references basic block address we can't import it separately from function 79 // containing that basic block. For simplicity we currently don't import such 80 // global vars at all. When importing function we aren't interested if any 81 // instruction in it takes an address of any basic block, because instruction 82 // can only take an address of basic block located in the same function. 83 static bool findRefEdges(ModuleSummaryIndex &Index, const User *CurUser, 84 SetVector<ValueInfo> &RefEdges, 85 SmallPtrSet<const User *, 8> &Visited) { 86 bool HasBlockAddress = false; 87 SmallVector<const User *, 32> Worklist; 88 Worklist.push_back(CurUser); 89 90 while (!Worklist.empty()) { 91 const User *U = Worklist.pop_back_val(); 92 93 if (!Visited.insert(U).second) 94 continue; 95 96 ImmutableCallSite CS(U); 97 98 for (const auto &OI : U->operands()) { 99 const User *Operand = dyn_cast<User>(OI); 100 if (!Operand) 101 continue; 102 if (isa<BlockAddress>(Operand)) { 103 HasBlockAddress = true; 104 continue; 105 } 106 if (auto *GV = dyn_cast<GlobalValue>(Operand)) { 107 // We have a reference to a global value. This should be added to 108 // the reference set unless it is a callee. Callees are handled 109 // specially by WriteFunction and are added to a separate list. 110 if (!(CS && CS.isCallee(&OI))) 111 RefEdges.insert(Index.getOrInsertValueInfo(GV)); 112 continue; 113 } 114 Worklist.push_back(Operand); 115 } 116 } 117 return HasBlockAddress; 118 } 119 120 static CalleeInfo::HotnessType getHotness(uint64_t ProfileCount, 121 ProfileSummaryInfo *PSI) { 122 if (!PSI) 123 return CalleeInfo::HotnessType::Unknown; 124 if (PSI->isHotCount(ProfileCount)) 125 return CalleeInfo::HotnessType::Hot; 126 if (PSI->isColdCount(ProfileCount)) 127 return CalleeInfo::HotnessType::Cold; 128 return CalleeInfo::HotnessType::None; 129 } 130 131 static bool isNonRenamableLocal(const GlobalValue &GV) { 132 return GV.hasSection() && GV.hasLocalLinkage(); 133 } 134 135 /// Determine whether this call has all constant integer arguments (excluding 136 /// "this") and summarize it to VCalls or ConstVCalls as appropriate. 137 static void addVCallToSet(DevirtCallSite Call, GlobalValue::GUID Guid, 138 SetVector<FunctionSummary::VFuncId> &VCalls, 139 SetVector<FunctionSummary::ConstVCall> &ConstVCalls) { 140 std::vector<uint64_t> Args; 141 // Start from the second argument to skip the "this" pointer. 142 for (auto &Arg : make_range(Call.CS.arg_begin() + 1, Call.CS.arg_end())) { 143 auto *CI = dyn_cast<ConstantInt>(Arg); 144 if (!CI || CI->getBitWidth() > 64) { 145 VCalls.insert({Guid, Call.Offset}); 146 return; 147 } 148 Args.push_back(CI->getZExtValue()); 149 } 150 ConstVCalls.insert({{Guid, Call.Offset}, std::move(Args)}); 151 } 152 153 /// If this intrinsic call requires that we add information to the function 154 /// summary, do so via the non-constant reference arguments. 155 static void addIntrinsicToSummary( 156 const CallInst *CI, SetVector<GlobalValue::GUID> &TypeTests, 157 SetVector<FunctionSummary::VFuncId> &TypeTestAssumeVCalls, 158 SetVector<FunctionSummary::VFuncId> &TypeCheckedLoadVCalls, 159 SetVector<FunctionSummary::ConstVCall> &TypeTestAssumeConstVCalls, 160 SetVector<FunctionSummary::ConstVCall> &TypeCheckedLoadConstVCalls, 161 DominatorTree &DT) { 162 switch (CI->getCalledFunction()->getIntrinsicID()) { 163 case Intrinsic::type_test: { 164 auto *TypeMDVal = cast<MetadataAsValue>(CI->getArgOperand(1)); 165 auto *TypeId = dyn_cast<MDString>(TypeMDVal->getMetadata()); 166 if (!TypeId) 167 break; 168 GlobalValue::GUID Guid = GlobalValue::getGUID(TypeId->getString()); 169 170 // Produce a summary from type.test intrinsics. We only summarize type.test 171 // intrinsics that are used other than by an llvm.assume intrinsic. 172 // Intrinsics that are assumed are relevant only to the devirtualization 173 // pass, not the type test lowering pass. 174 bool HasNonAssumeUses = llvm::any_of(CI->uses(), [](const Use &CIU) { 175 auto *AssumeCI = dyn_cast<CallInst>(CIU.getUser()); 176 if (!AssumeCI) 177 return true; 178 Function *F = AssumeCI->getCalledFunction(); 179 return !F || F->getIntrinsicID() != Intrinsic::assume; 180 }); 181 if (HasNonAssumeUses) 182 TypeTests.insert(Guid); 183 184 SmallVector<DevirtCallSite, 4> DevirtCalls; 185 SmallVector<CallInst *, 4> Assumes; 186 findDevirtualizableCallsForTypeTest(DevirtCalls, Assumes, CI, DT); 187 for (auto &Call : DevirtCalls) 188 addVCallToSet(Call, Guid, TypeTestAssumeVCalls, 189 TypeTestAssumeConstVCalls); 190 191 break; 192 } 193 194 case Intrinsic::type_checked_load: { 195 auto *TypeMDVal = cast<MetadataAsValue>(CI->getArgOperand(2)); 196 auto *TypeId = dyn_cast<MDString>(TypeMDVal->getMetadata()); 197 if (!TypeId) 198 break; 199 GlobalValue::GUID Guid = GlobalValue::getGUID(TypeId->getString()); 200 201 SmallVector<DevirtCallSite, 4> DevirtCalls; 202 SmallVector<Instruction *, 4> LoadedPtrs; 203 SmallVector<Instruction *, 4> Preds; 204 bool HasNonCallUses = false; 205 findDevirtualizableCallsForTypeCheckedLoad(DevirtCalls, LoadedPtrs, Preds, 206 HasNonCallUses, CI, DT); 207 // Any non-call uses of the result of llvm.type.checked.load will 208 // prevent us from optimizing away the llvm.type.test. 209 if (HasNonCallUses) 210 TypeTests.insert(Guid); 211 for (auto &Call : DevirtCalls) 212 addVCallToSet(Call, Guid, TypeCheckedLoadVCalls, 213 TypeCheckedLoadConstVCalls); 214 215 break; 216 } 217 default: 218 break; 219 } 220 } 221 222 static bool isNonVolatileLoad(const Instruction *I) { 223 if (const auto *LI = dyn_cast<LoadInst>(I)) 224 return !LI->isVolatile(); 225 226 return false; 227 } 228 229 static void computeFunctionSummary(ModuleSummaryIndex &Index, const Module &M, 230 const Function &F, BlockFrequencyInfo *BFI, 231 ProfileSummaryInfo *PSI, DominatorTree &DT, 232 bool HasLocalsInUsedOrAsm, 233 DenseSet<GlobalValue::GUID> &CantBePromoted, 234 bool IsThinLTO) { 235 // Summary not currently supported for anonymous functions, they should 236 // have been named. 237 assert(F.hasName()); 238 239 unsigned NumInsts = 0; 240 // Map from callee ValueId to profile count. Used to accumulate profile 241 // counts for all static calls to a given callee. 242 MapVector<ValueInfo, CalleeInfo> CallGraphEdges; 243 SetVector<ValueInfo> RefEdges; 244 SetVector<GlobalValue::GUID> TypeTests; 245 SetVector<FunctionSummary::VFuncId> TypeTestAssumeVCalls, 246 TypeCheckedLoadVCalls; 247 SetVector<FunctionSummary::ConstVCall> TypeTestAssumeConstVCalls, 248 TypeCheckedLoadConstVCalls; 249 ICallPromotionAnalysis ICallAnalysis; 250 SmallPtrSet<const User *, 8> Visited; 251 252 // Add personality function, prefix data and prologue data to function's ref 253 // list. 254 findRefEdges(Index, &F, RefEdges, Visited); 255 std::vector<const Instruction *> NonVolatileLoads; 256 257 bool HasInlineAsmMaybeReferencingInternal = false; 258 for (const BasicBlock &BB : F) 259 for (const Instruction &I : BB) { 260 if (isa<DbgInfoIntrinsic>(I)) 261 continue; 262 ++NumInsts; 263 if (isNonVolatileLoad(&I)) { 264 // Postpone processing of non-volatile load instructions 265 // See comments below 266 Visited.insert(&I); 267 NonVolatileLoads.push_back(&I); 268 continue; 269 } 270 findRefEdges(Index, &I, RefEdges, Visited); 271 auto CS = ImmutableCallSite(&I); 272 if (!CS) 273 continue; 274 275 const auto *CI = dyn_cast<CallInst>(&I); 276 // Since we don't know exactly which local values are referenced in inline 277 // assembly, conservatively mark the function as possibly referencing 278 // a local value from inline assembly to ensure we don't export a 279 // reference (which would require renaming and promotion of the 280 // referenced value). 281 if (HasLocalsInUsedOrAsm && CI && CI->isInlineAsm()) 282 HasInlineAsmMaybeReferencingInternal = true; 283 284 auto *CalledValue = CS.getCalledValue(); 285 auto *CalledFunction = CS.getCalledFunction(); 286 if (CalledValue && !CalledFunction) { 287 CalledValue = CalledValue->stripPointerCastsNoFollowAliases(); 288 // Stripping pointer casts can reveal a called function. 289 CalledFunction = dyn_cast<Function>(CalledValue); 290 } 291 // Check if this is an alias to a function. If so, get the 292 // called aliasee for the checks below. 293 if (auto *GA = dyn_cast<GlobalAlias>(CalledValue)) { 294 assert(!CalledFunction && "Expected null called function in callsite for alias"); 295 CalledFunction = dyn_cast<Function>(GA->getBaseObject()); 296 } 297 // Check if this is a direct call to a known function or a known 298 // intrinsic, or an indirect call with profile data. 299 if (CalledFunction) { 300 if (CI && CalledFunction->isIntrinsic()) { 301 addIntrinsicToSummary( 302 CI, TypeTests, TypeTestAssumeVCalls, TypeCheckedLoadVCalls, 303 TypeTestAssumeConstVCalls, TypeCheckedLoadConstVCalls, DT); 304 continue; 305 } 306 // We should have named any anonymous globals 307 assert(CalledFunction->hasName()); 308 auto ScaledCount = PSI->getProfileCount(&I, BFI); 309 auto Hotness = ScaledCount ? getHotness(ScaledCount.getValue(), PSI) 310 : CalleeInfo::HotnessType::Unknown; 311 if (ForceSummaryEdgesCold != FunctionSummary::FSHT_None) 312 Hotness = CalleeInfo::HotnessType::Cold; 313 314 // Use the original CalledValue, in case it was an alias. We want 315 // to record the call edge to the alias in that case. Eventually 316 // an alias summary will be created to associate the alias and 317 // aliasee. 318 auto &ValueInfo = CallGraphEdges[Index.getOrInsertValueInfo( 319 cast<GlobalValue>(CalledValue))]; 320 ValueInfo.updateHotness(Hotness); 321 // Add the relative block frequency to CalleeInfo if there is no profile 322 // information. 323 if (BFI != nullptr && Hotness == CalleeInfo::HotnessType::Unknown) { 324 uint64_t BBFreq = BFI->getBlockFreq(&BB).getFrequency(); 325 uint64_t EntryFreq = BFI->getEntryFreq(); 326 ValueInfo.updateRelBlockFreq(BBFreq, EntryFreq); 327 } 328 } else { 329 // Skip inline assembly calls. 330 if (CI && CI->isInlineAsm()) 331 continue; 332 // Skip direct calls. 333 if (!CalledValue || isa<Constant>(CalledValue)) 334 continue; 335 336 // Check if the instruction has a callees metadata. If so, add callees 337 // to CallGraphEdges to reflect the references from the metadata, and 338 // to enable importing for subsequent indirect call promotion and 339 // inlining. 340 if (auto *MD = I.getMetadata(LLVMContext::MD_callees)) { 341 for (auto &Op : MD->operands()) { 342 Function *Callee = mdconst::extract_or_null<Function>(Op); 343 if (Callee) 344 CallGraphEdges[Index.getOrInsertValueInfo(Callee)]; 345 } 346 } 347 348 uint32_t NumVals, NumCandidates; 349 uint64_t TotalCount; 350 auto CandidateProfileData = 351 ICallAnalysis.getPromotionCandidatesForInstruction( 352 &I, NumVals, TotalCount, NumCandidates); 353 for (auto &Candidate : CandidateProfileData) 354 CallGraphEdges[Index.getOrInsertValueInfo(Candidate.Value)] 355 .updateHotness(getHotness(Candidate.Count, PSI)); 356 } 357 } 358 359 // By now we processed all instructions in a function, except 360 // non-volatile loads. All new refs we add in a loop below 361 // are obviously constant. All constant refs are grouped in the 362 // end of RefEdges vector, so we can use a single integer value 363 // to identify them. 364 unsigned RefCnt = RefEdges.size(); 365 for (const Instruction *I : NonVolatileLoads) { 366 Visited.erase(I); 367 findRefEdges(Index, I, RefEdges, Visited); 368 } 369 std::vector<ValueInfo> Refs = RefEdges.takeVector(); 370 // Regular LTO module doesn't participate in ThinLTO import, 371 // so no reference from it can be readonly, since this would 372 // require importing variable as local copy 373 if (IsThinLTO) 374 for (; RefCnt < Refs.size(); ++RefCnt) 375 Refs[RefCnt].setReadOnly(); 376 377 // Explicit add hot edges to enforce importing for designated GUIDs for 378 // sample PGO, to enable the same inlines as the profiled optimized binary. 379 for (auto &I : F.getImportGUIDs()) 380 CallGraphEdges[Index.getOrInsertValueInfo(I)].updateHotness( 381 ForceSummaryEdgesCold == FunctionSummary::FSHT_All 382 ? CalleeInfo::HotnessType::Cold 383 : CalleeInfo::HotnessType::Critical); 384 385 bool NonRenamableLocal = isNonRenamableLocal(F); 386 bool NotEligibleForImport = 387 NonRenamableLocal || HasInlineAsmMaybeReferencingInternal; 388 GlobalValueSummary::GVFlags Flags(F.getLinkage(), NotEligibleForImport, 389 /* Live = */ false, F.isDSOLocal()); 390 FunctionSummary::FFlags FunFlags{ 391 F.hasFnAttribute(Attribute::ReadNone), 392 F.hasFnAttribute(Attribute::ReadOnly), 393 F.hasFnAttribute(Attribute::NoRecurse), F.returnDoesNotAlias(), 394 // FIXME: refactor this to use the same code that inliner is using. 395 // Don't try to import functions with noinline attribute. 396 F.getAttributes().hasFnAttribute(Attribute::NoInline)}; 397 auto FuncSummary = llvm::make_unique<FunctionSummary>( 398 Flags, NumInsts, FunFlags, /*EntryCount=*/0, std::move(Refs), 399 CallGraphEdges.takeVector(), TypeTests.takeVector(), 400 TypeTestAssumeVCalls.takeVector(), TypeCheckedLoadVCalls.takeVector(), 401 TypeTestAssumeConstVCalls.takeVector(), 402 TypeCheckedLoadConstVCalls.takeVector()); 403 if (NonRenamableLocal) 404 CantBePromoted.insert(F.getGUID()); 405 Index.addGlobalValueSummary(F, std::move(FuncSummary)); 406 } 407 408 static void 409 computeVariableSummary(ModuleSummaryIndex &Index, const GlobalVariable &V, 410 DenseSet<GlobalValue::GUID> &CantBePromoted) { 411 SetVector<ValueInfo> RefEdges; 412 SmallPtrSet<const User *, 8> Visited; 413 bool HasBlockAddress = findRefEdges(Index, &V, RefEdges, Visited); 414 bool NonRenamableLocal = isNonRenamableLocal(V); 415 GlobalValueSummary::GVFlags Flags(V.getLinkage(), NonRenamableLocal, 416 /* Live = */ false, V.isDSOLocal()); 417 418 // Don't mark variables we won't be able to internalize as read-only. 419 GlobalVarSummary::GVarFlags VarFlags( 420 !V.hasComdat() && !V.hasAppendingLinkage() && !V.isInterposable() && 421 !V.hasAvailableExternallyLinkage() && !V.hasDLLExportStorageClass()); 422 auto GVarSummary = llvm::make_unique<GlobalVarSummary>(Flags, VarFlags, 423 RefEdges.takeVector()); 424 if (NonRenamableLocal) 425 CantBePromoted.insert(V.getGUID()); 426 if (HasBlockAddress) 427 GVarSummary->setNotEligibleToImport(); 428 Index.addGlobalValueSummary(V, std::move(GVarSummary)); 429 } 430 431 static void 432 computeAliasSummary(ModuleSummaryIndex &Index, const GlobalAlias &A, 433 DenseSet<GlobalValue::GUID> &CantBePromoted) { 434 bool NonRenamableLocal = isNonRenamableLocal(A); 435 GlobalValueSummary::GVFlags Flags(A.getLinkage(), NonRenamableLocal, 436 /* Live = */ false, A.isDSOLocal()); 437 auto AS = llvm::make_unique<AliasSummary>(Flags); 438 auto *Aliasee = A.getBaseObject(); 439 auto *AliaseeSummary = Index.getGlobalValueSummary(*Aliasee); 440 assert(AliaseeSummary && "Alias expects aliasee summary to be parsed"); 441 AS->setAliasee(AliaseeSummary); 442 if (NonRenamableLocal) 443 CantBePromoted.insert(A.getGUID()); 444 Index.addGlobalValueSummary(A, std::move(AS)); 445 } 446 447 // Set LiveRoot flag on entries matching the given value name. 448 static void setLiveRoot(ModuleSummaryIndex &Index, StringRef Name) { 449 if (ValueInfo VI = Index.getValueInfo(GlobalValue::getGUID(Name))) 450 for (auto &Summary : VI.getSummaryList()) 451 Summary->setLive(true); 452 } 453 454 ModuleSummaryIndex llvm::buildModuleSummaryIndex( 455 const Module &M, 456 std::function<BlockFrequencyInfo *(const Function &F)> GetBFICallback, 457 ProfileSummaryInfo *PSI) { 458 assert(PSI); 459 bool EnableSplitLTOUnit = false; 460 if (auto *MD = mdconst::extract_or_null<ConstantInt>( 461 M.getModuleFlag("EnableSplitLTOUnit"))) 462 EnableSplitLTOUnit = MD->getZExtValue(); 463 ModuleSummaryIndex Index(/*HaveGVs=*/true, EnableSplitLTOUnit); 464 465 // Identify the local values in the llvm.used and llvm.compiler.used sets, 466 // which should not be exported as they would then require renaming and 467 // promotion, but we may have opaque uses e.g. in inline asm. We collect them 468 // here because we use this information to mark functions containing inline 469 // assembly calls as not importable. 470 SmallPtrSet<GlobalValue *, 8> LocalsUsed; 471 SmallPtrSet<GlobalValue *, 8> Used; 472 // First collect those in the llvm.used set. 473 collectUsedGlobalVariables(M, Used, /*CompilerUsed*/ false); 474 // Next collect those in the llvm.compiler.used set. 475 collectUsedGlobalVariables(M, Used, /*CompilerUsed*/ true); 476 DenseSet<GlobalValue::GUID> CantBePromoted; 477 for (auto *V : Used) { 478 if (V->hasLocalLinkage()) { 479 LocalsUsed.insert(V); 480 CantBePromoted.insert(V->getGUID()); 481 } 482 } 483 484 bool HasLocalInlineAsmSymbol = false; 485 if (!M.getModuleInlineAsm().empty()) { 486 // Collect the local values defined by module level asm, and set up 487 // summaries for these symbols so that they can be marked as NoRename, 488 // to prevent export of any use of them in regular IR that would require 489 // renaming within the module level asm. Note we don't need to create a 490 // summary for weak or global defs, as they don't need to be flagged as 491 // NoRename, and defs in module level asm can't be imported anyway. 492 // Also, any values used but not defined within module level asm should 493 // be listed on the llvm.used or llvm.compiler.used global and marked as 494 // referenced from there. 495 ModuleSymbolTable::CollectAsmSymbols( 496 M, [&](StringRef Name, object::BasicSymbolRef::Flags Flags) { 497 // Symbols not marked as Weak or Global are local definitions. 498 if (Flags & (object::BasicSymbolRef::SF_Weak | 499 object::BasicSymbolRef::SF_Global)) 500 return; 501 HasLocalInlineAsmSymbol = true; 502 GlobalValue *GV = M.getNamedValue(Name); 503 if (!GV) 504 return; 505 assert(GV->isDeclaration() && "Def in module asm already has definition"); 506 GlobalValueSummary::GVFlags GVFlags(GlobalValue::InternalLinkage, 507 /* NotEligibleToImport = */ true, 508 /* Live = */ true, 509 /* Local */ GV->isDSOLocal()); 510 CantBePromoted.insert(GV->getGUID()); 511 // Create the appropriate summary type. 512 if (Function *F = dyn_cast<Function>(GV)) { 513 std::unique_ptr<FunctionSummary> Summary = 514 llvm::make_unique<FunctionSummary>( 515 GVFlags, /*InstCount=*/0, 516 FunctionSummary::FFlags{ 517 F->hasFnAttribute(Attribute::ReadNone), 518 F->hasFnAttribute(Attribute::ReadOnly), 519 F->hasFnAttribute(Attribute::NoRecurse), 520 F->returnDoesNotAlias(), 521 /* NoInline = */ false}, 522 /*EntryCount=*/0, ArrayRef<ValueInfo>{}, 523 ArrayRef<FunctionSummary::EdgeTy>{}, 524 ArrayRef<GlobalValue::GUID>{}, 525 ArrayRef<FunctionSummary::VFuncId>{}, 526 ArrayRef<FunctionSummary::VFuncId>{}, 527 ArrayRef<FunctionSummary::ConstVCall>{}, 528 ArrayRef<FunctionSummary::ConstVCall>{}); 529 Index.addGlobalValueSummary(*GV, std::move(Summary)); 530 } else { 531 std::unique_ptr<GlobalVarSummary> Summary = 532 llvm::make_unique<GlobalVarSummary>( 533 GVFlags, GlobalVarSummary::GVarFlags(), 534 ArrayRef<ValueInfo>{}); 535 Index.addGlobalValueSummary(*GV, std::move(Summary)); 536 } 537 }); 538 } 539 540 bool IsThinLTO = true; 541 if (auto *MD = 542 mdconst::extract_or_null<ConstantInt>(M.getModuleFlag("ThinLTO"))) 543 IsThinLTO = MD->getZExtValue(); 544 545 // Compute summaries for all functions defined in module, and save in the 546 // index. 547 for (auto &F : M) { 548 if (F.isDeclaration()) 549 continue; 550 551 DominatorTree DT(const_cast<Function &>(F)); 552 BlockFrequencyInfo *BFI = nullptr; 553 std::unique_ptr<BlockFrequencyInfo> BFIPtr; 554 if (GetBFICallback) 555 BFI = GetBFICallback(F); 556 else if (F.hasProfileData()) { 557 LoopInfo LI{DT}; 558 BranchProbabilityInfo BPI{F, LI}; 559 BFIPtr = llvm::make_unique<BlockFrequencyInfo>(F, BPI, LI); 560 BFI = BFIPtr.get(); 561 } 562 563 computeFunctionSummary(Index, M, F, BFI, PSI, DT, 564 !LocalsUsed.empty() || HasLocalInlineAsmSymbol, 565 CantBePromoted, IsThinLTO); 566 } 567 568 // Compute summaries for all variables defined in module, and save in the 569 // index. 570 for (const GlobalVariable &G : M.globals()) { 571 if (G.isDeclaration()) 572 continue; 573 computeVariableSummary(Index, G, CantBePromoted); 574 } 575 576 // Compute summaries for all aliases defined in module, and save in the 577 // index. 578 for (const GlobalAlias &A : M.aliases()) 579 computeAliasSummary(Index, A, CantBePromoted); 580 581 for (auto *V : LocalsUsed) { 582 auto *Summary = Index.getGlobalValueSummary(*V); 583 assert(Summary && "Missing summary for global value"); 584 Summary->setNotEligibleToImport(); 585 } 586 587 // The linker doesn't know about these LLVM produced values, so we need 588 // to flag them as live in the index to ensure index-based dead value 589 // analysis treats them as live roots of the analysis. 590 setLiveRoot(Index, "llvm.used"); 591 setLiveRoot(Index, "llvm.compiler.used"); 592 setLiveRoot(Index, "llvm.global_ctors"); 593 setLiveRoot(Index, "llvm.global_dtors"); 594 setLiveRoot(Index, "llvm.global.annotations"); 595 596 for (auto &GlobalList : Index) { 597 // Ignore entries for references that are undefined in the current module. 598 if (GlobalList.second.SummaryList.empty()) 599 continue; 600 601 assert(GlobalList.second.SummaryList.size() == 1 && 602 "Expected module's index to have one summary per GUID"); 603 auto &Summary = GlobalList.second.SummaryList[0]; 604 if (!IsThinLTO) { 605 Summary->setNotEligibleToImport(); 606 continue; 607 } 608 609 bool AllRefsCanBeExternallyReferenced = 610 llvm::all_of(Summary->refs(), [&](const ValueInfo &VI) { 611 return !CantBePromoted.count(VI.getGUID()); 612 }); 613 if (!AllRefsCanBeExternallyReferenced) { 614 Summary->setNotEligibleToImport(); 615 continue; 616 } 617 618 if (auto *FuncSummary = dyn_cast<FunctionSummary>(Summary.get())) { 619 bool AllCallsCanBeExternallyReferenced = llvm::all_of( 620 FuncSummary->calls(), [&](const FunctionSummary::EdgeTy &Edge) { 621 return !CantBePromoted.count(Edge.first.getGUID()); 622 }); 623 if (!AllCallsCanBeExternallyReferenced) 624 Summary->setNotEligibleToImport(); 625 } 626 } 627 628 return Index; 629 } 630 631 AnalysisKey ModuleSummaryIndexAnalysis::Key; 632 633 ModuleSummaryIndex 634 ModuleSummaryIndexAnalysis::run(Module &M, ModuleAnalysisManager &AM) { 635 ProfileSummaryInfo &PSI = AM.getResult<ProfileSummaryAnalysis>(M); 636 auto &FAM = AM.getResult<FunctionAnalysisManagerModuleProxy>(M).getManager(); 637 return buildModuleSummaryIndex( 638 M, 639 [&FAM](const Function &F) { 640 return &FAM.getResult<BlockFrequencyAnalysis>( 641 *const_cast<Function *>(&F)); 642 }, 643 &PSI); 644 } 645 646 char ModuleSummaryIndexWrapperPass::ID = 0; 647 648 INITIALIZE_PASS_BEGIN(ModuleSummaryIndexWrapperPass, "module-summary-analysis", 649 "Module Summary Analysis", false, true) 650 INITIALIZE_PASS_DEPENDENCY(BlockFrequencyInfoWrapperPass) 651 INITIALIZE_PASS_DEPENDENCY(ProfileSummaryInfoWrapperPass) 652 INITIALIZE_PASS_END(ModuleSummaryIndexWrapperPass, "module-summary-analysis", 653 "Module Summary Analysis", false, true) 654 655 ModulePass *llvm::createModuleSummaryIndexWrapperPass() { 656 return new ModuleSummaryIndexWrapperPass(); 657 } 658 659 ModuleSummaryIndexWrapperPass::ModuleSummaryIndexWrapperPass() 660 : ModulePass(ID) { 661 initializeModuleSummaryIndexWrapperPassPass(*PassRegistry::getPassRegistry()); 662 } 663 664 bool ModuleSummaryIndexWrapperPass::runOnModule(Module &M) { 665 auto *PSI = &getAnalysis<ProfileSummaryInfoWrapperPass>().getPSI(); 666 Index.emplace(buildModuleSummaryIndex( 667 M, 668 [this](const Function &F) { 669 return &(this->getAnalysis<BlockFrequencyInfoWrapperPass>( 670 *const_cast<Function *>(&F)) 671 .getBFI()); 672 }, 673 PSI)); 674 return false; 675 } 676 677 bool ModuleSummaryIndexWrapperPass::doFinalization(Module &M) { 678 Index.reset(); 679 return false; 680 } 681 682 void ModuleSummaryIndexWrapperPass::getAnalysisUsage(AnalysisUsage &AU) const { 683 AU.setPreservesAll(); 684 AU.addRequired<BlockFrequencyInfoWrapperPass>(); 685 AU.addRequired<ProfileSummaryInfoWrapperPass>(); 686 } 687