//===- LTO.cpp ------------------------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//

#include "LTO.h"
#include "COFFLinkerContext.h"
#include "Config.h"
#include "InputFiles.h"
#include "Symbols.h"
#include "lld/Common/Args.h"
#include "lld/Common/CommonLinkerContext.h"
#include "lld/Common/Filesystem.h"
#include "lld/Common/Strings.h"
#include "lld/Common/TargetOptionsCommandFlags.h"
#include "llvm/ADT/STLExtras.h"
#include "llvm/ADT/SmallString.h"
#include "llvm/ADT/StringRef.h"
#include "llvm/ADT/Twine.h"
#include "llvm/Bitcode/BitcodeWriter.h"
#include "llvm/IR/DiagnosticPrinter.h"
#include "llvm/LTO/Config.h"
#include "llvm/LTO/LTO.h"
#include "llvm/Object/SymbolicFile.h"
#include "llvm/Support/Caching.h"
#include "llvm/Support/CodeGen.h"
#include "llvm/Support/Error.h"
#include "llvm/Support/FileSystem.h"
#include "llvm/Support/MemoryBuffer.h"
#include "llvm/Support/raw_ostream.h"
#include <algorithm>
#include <cstddef>
#include <memory>
#include <string>
#include <system_error>
#include <vector>

using namespace llvm;
using namespace llvm::object;
using namespace lld;
using namespace lld::coff;

// Maps an input path to its ThinLTO output path by forwarding to
// lto::getThinLTOOutputFile with the configured old/new prefix pair.
std::string BitcodeCompiler::getThinLTOOutputFile(StringRef path) {
  const auto &cfg = ctx.config;
  return lto::getThinLTOOutputFile(path, cfg.thinLTOPrefixReplaceOld,
                                   cfg.thinLTOPrefixReplaceNew);
}

// Translates the linker configuration held in ctx.config into the lto::Config
// that is handed to the LTO driver.
lto::Config BitcodeCompiler::createConfig() {
  const auto &cfg = ctx.config;
  lto::Config conf;

  conf.Options = initTargetOptionsFromCodeGenFlags();
  conf.Options.EmitAddrsig = true;
  for (StringRef opt : cfg.mllvmOpts)
    conf.MllvmArgs.emplace_back(opt.str());

  // With LTO every function and datum gets its own section. LLVM LTO already
  // provides most of what linker GC would, but ICF can still profit from it.
  conf.Options.FunctionSections = true;
  conf.Options.DataSections = true;

  // 32-bit x86 uses the static relocation model: it usually produces more
  // compact code, and the PIC model has known code generation bugs there
  // (see PR34306). Every other machine uses PIC.
  const bool isI386 = cfg.machine == COFF::IMAGE_FILE_MACHINE_I386;
  conf.RelocModel = isI386 ? Reloc::Static : Reloc::PIC_;

  // The verifier is disabled only when NDEBUG is defined.
#ifdef NDEBUG
  conf.DisableVerify = true;
#else
  conf.DisableVerify = false;
#endif

  conf.DiagHandler = diagnosticHandler;
  conf.DwoDir = cfg.dwoDir.str();
  conf.OptLevel = cfg.ltoo;
  conf.CPU = getCPUStr();
  conf.MAttrs = getMAttrs();

  // An explicitly configured codegen level (ltoCgo) takes precedence;
  // otherwise the level is derived from the LTO optimization level.
  auto requestedCgLevel = cfg.ltoCgo.value_or(args::getCGOptLevel(cfg.ltoo));
  std::optional<CodeGenOptLevel> cgLevel =
      CodeGenOpt::getLevel(requestedCgLevel);
  assert(cgLevel && "Invalid optimization level!");
  conf.CGOptLevel = *cgLevel;

  conf.AlwaysEmitRegularLTOObj = !cfg.ltoObjPath.empty();
  conf.DebugPassManager = cfg.ltoDebugPassManager;
  conf.CSIRProfile = std::string(cfg.ltoCSProfileFile);
  conf.RunCSIRInstr = cfg.ltoCSProfileGenerate;
  conf.PGOWarnMismatch = cfg.ltoPGOWarnMismatch;
  conf.SampleProfile = cfg.ltoSampleProfileName;
  conf.TimeTraceEnabled = cfg.timeTraceEnabled;
  conf.TimeTraceGranularity = cfg.timeTraceGranularity;

  if (cfg.emit == EmitKind::ASM) {
    // Produce verbose assembly instead of object code.
    conf.CGFileType = CodeGenFileType::AssemblyFile;
    conf.Options.MCOptions.AsmVerbose = true;
  } else if (cfg.emit == EmitKind::LLVM) {
    // Write the module as bitcode to the output file from the pre-codegen
    // hook; the hook always returns false.
    conf.PreCodeGenModuleHook = [this](size_t /*task*/, const Module &m) {
      std::unique_ptr<raw_fd_ostream> out =
          openLTOOutputFile(ctx.config.outputFile);
      if (out)
        WriteBitcodeToFile(m, *out, false);
      return false;
    };
  }

  if (cfg.saveTemps) {
    std::string tempPrefix = std::string(cfg.outputFile) + ".";
    checkError(conf.addSaveTemps(tempPrefix, /*UseInputModulePath*/ true));
  }
  return conf;
}

// Opens the index file (when one was requested), selects the ThinLTO backend
// and creates the lto::LTO instance that drives the link.
BitcodeCompiler::BitcodeCompiler(COFFLinkerContext &c) : ctx(c) {
  // Set up indexFile.
  if (!ctx.config.thinLTOIndexOnlyArg.empty())
    indexFile = openFile(ctx.config.thinLTOIndexOnlyArg);

  // Set up ltoObj.
  lto::ThinBackend backend;
  if (!ctx.config.thinLTOIndexOnly) {
    backend = lto::createInProcessThinBackend(
        llvm::heavyweight_hardware_concurrency(ctx.config.thinLTOJobs));
  } else {
    // Each module whose index gets written is dropped from thinIndices.
    auto forgetWrittenIndex = [this](StringRef name) {
      thinIndices.erase(name);
    };
    backend = lto::createWriteIndexesThinBackend(
        std::string(ctx.config.thinLTOPrefixReplaceOld),
        std::string(ctx.config.thinLTOPrefixReplaceNew),
        std::string(ctx.config.thinLTOPrefixReplaceNativeObject),
        ctx.config.thinLTOEmitImportsFiles, indexFile.get(),
        forgetWrittenIndex);
  }

  ltoObj = std::make_unique<lto::LTO>(createConfig(), backend,
                                      ctx.config.ltoPartitions);
}

BitcodeCompiler::~BitcodeCompiler() = default;

// Replaces the symbol in place with an Undefined symbol of the same name.
static void undefine(Symbol *s) {
  replaceSymbol<Undefined>(s, s->getName());
}

// Registers a bitcode file with the LTO driver, supplying one resolution per
// symbol of the file.
void BitcodeCompiler::add(BitcodeFile &f) {
  lto::InputFile &input = *f.obj;
  std::vector<Symbol *> bodies = f.getSymbols();
  std::vector<lto::SymbolResolution> resolutions(bodies.size());

  if (ctx.config.thinLTOIndexOnly)
    thinIndices.insert(input.getName());

  // Hand the LTO API a resolution for every symbol.
  unsigned next = 0;
  for (const lto::InputFile::Symbol &irSym : input.symbols()) {
    const unsigned idx = next++;
    Symbol *sym = bodies[idx];
    lto::SymbolResolution &res = resolutions[idx];

    // The SF_Undefined check should not be necessary, but IRObjectFile
    // currently reports two symbols for a symbol defined in module ASM.
    // Without the check, an undefined in IR that has a definition in ASM would
    // be flagged as prevailing. The hack can go once IRObjectFile reports a
    // single symbol.
    res.Prevailing = !irSym.isUndefined() && sym->getFile() == &f;
    res.VisibleToRegularObj = sym->isUsedInRegularObj;
    if (res.Prevailing)
      undefine(sym);

    // Symbols wrapped with -wrap must not take part in interprocedural
    // optimization: LTO would otherwise inline them before their values are
    // final.
    res.LinkerRedefined = !sym->canInline;
  }
  checkError(ltoObj->add(std::move(f.obj), resolutions));
}

// Merge all the bitcode files we have seen, codegen the result
// and return the resulting objects.
173bdd1243dSDimitry Andric std::vector<InputFile *> BitcodeCompiler::compile() { 1740b57cec5SDimitry Andric unsigned maxTasks = ltoObj->getMaxTasks(); 1750b57cec5SDimitry Andric buf.resize(maxTasks); 1760b57cec5SDimitry Andric files.resize(maxTasks); 177bdd1243dSDimitry Andric file_names.resize(maxTasks); 1780b57cec5SDimitry Andric 1790b57cec5SDimitry Andric // The /lldltocache option specifies the path to a directory in which to cache 1800b57cec5SDimitry Andric // native object files for ThinLTO incremental builds. If a path was 1810b57cec5SDimitry Andric // specified, configure LTO to use it as the cache directory. 182349cc55cSDimitry Andric FileCache cache; 183bdd1243dSDimitry Andric if (!ctx.config.ltoCache.empty()) 184bdd1243dSDimitry Andric cache = check(localCache("ThinLTO", "Thin", ctx.config.ltoCache, 185bdd1243dSDimitry Andric [&](size_t task, const Twine &moduleName, 186bdd1243dSDimitry Andric std::unique_ptr<MemoryBuffer> mb) { 1870b57cec5SDimitry Andric files[task] = std::move(mb); 188bdd1243dSDimitry Andric file_names[task] = moduleName.str(); 1890b57cec5SDimitry Andric })); 1900b57cec5SDimitry Andric 1910b57cec5SDimitry Andric checkError(ltoObj->run( 192bdd1243dSDimitry Andric [&](size_t task, const Twine &moduleName) { 193bdd1243dSDimitry Andric buf[task].first = moduleName.str(); 194349cc55cSDimitry Andric return std::make_unique<CachedFileStream>( 195bdd1243dSDimitry Andric std::make_unique<raw_svector_ostream>(buf[task].second)); 1960b57cec5SDimitry Andric }, 1970b57cec5SDimitry Andric cache)); 1980b57cec5SDimitry Andric 1990b57cec5SDimitry Andric // Emit empty index files for non-indexed files 2000b57cec5SDimitry Andric for (StringRef s : thinIndices) { 2010b57cec5SDimitry Andric std::string path = getThinLTOOutputFile(s); 2020b57cec5SDimitry Andric openFile(path + ".thinlto.bc"); 203bdd1243dSDimitry Andric if (ctx.config.thinLTOEmitImportsFiles) 2040b57cec5SDimitry Andric openFile(path + ".imports"); 2050b57cec5SDimitry Andric } 
2060b57cec5SDimitry Andric 2070b57cec5SDimitry Andric // ThinLTO with index only option is required to generate only the index 2080b57cec5SDimitry Andric // files. After that, we exit from linker and ThinLTO backend runs in a 2090b57cec5SDimitry Andric // distributed environment. 210bdd1243dSDimitry Andric if (ctx.config.thinLTOIndexOnly) { 211bdd1243dSDimitry Andric if (!ctx.config.ltoObjPath.empty()) 212bdd1243dSDimitry Andric saveBuffer(buf[0].second, ctx.config.ltoObjPath); 2130b57cec5SDimitry Andric if (indexFile) 2140b57cec5SDimitry Andric indexFile->close(); 2150b57cec5SDimitry Andric return {}; 2160b57cec5SDimitry Andric } 2170b57cec5SDimitry Andric 218bdd1243dSDimitry Andric if (!ctx.config.ltoCache.empty()) 219bdd1243dSDimitry Andric pruneCache(ctx.config.ltoCache, ctx.config.ltoCachePolicy, files); 2200b57cec5SDimitry Andric 2215ffd83dbSDimitry Andric std::vector<InputFile *> ret; 2225f757f3fSDimitry Andric bool emitASM = ctx.config.emit == EmitKind::ASM; 2235f757f3fSDimitry Andric const char *Ext = emitASM ? ".s" : ".obj"; 2240b57cec5SDimitry Andric for (unsigned i = 0; i != maxTasks; ++i) { 225bdd1243dSDimitry Andric StringRef bitcodeFilePath; 2265ffd83dbSDimitry Andric // Get the native object contents either from the cache or from memory. Do 2275ffd83dbSDimitry Andric // not use the cached MemoryBuffer directly, or the PDB will not be 2285ffd83dbSDimitry Andric // deterministic. 
2295ffd83dbSDimitry Andric StringRef objBuf; 230bdd1243dSDimitry Andric if (files[i]) { 2315ffd83dbSDimitry Andric objBuf = files[i]->getBuffer(); 232bdd1243dSDimitry Andric bitcodeFilePath = file_names[i]; 233bdd1243dSDimitry Andric } else { 234bdd1243dSDimitry Andric objBuf = buf[i].second; 235bdd1243dSDimitry Andric bitcodeFilePath = buf[i].first; 236bdd1243dSDimitry Andric } 2375ffd83dbSDimitry Andric if (objBuf.empty()) 2385ffd83dbSDimitry Andric continue; 2395ffd83dbSDimitry Andric 240bdd1243dSDimitry Andric // If the input bitcode file is path/to/a.obj, then the corresponding lto 241bdd1243dSDimitry Andric // object file name will look something like: path/to/main.exe.lto.a.obj. 242bdd1243dSDimitry Andric StringRef ltoObjName; 243bdd1243dSDimitry Andric if (bitcodeFilePath == "ld-temp.o") { 244bdd1243dSDimitry Andric ltoObjName = 245bdd1243dSDimitry Andric saver().save(Twine(ctx.config.outputFile) + ".lto" + 2465f757f3fSDimitry Andric (i == 0 ? Twine("") : Twine('.') + Twine(i)) + Ext); 247bdd1243dSDimitry Andric } else { 248bdd1243dSDimitry Andric StringRef directory = sys::path::parent_path(bitcodeFilePath); 2495f757f3fSDimitry Andric StringRef baseName = sys::path::stem(bitcodeFilePath); 250bdd1243dSDimitry Andric StringRef outputFileBaseName = sys::path::filename(ctx.config.outputFile); 251bdd1243dSDimitry Andric SmallString<64> path; 252bdd1243dSDimitry Andric sys::path::append(path, directory, 2535f757f3fSDimitry Andric outputFileBaseName + ".lto." 
+ baseName + Ext); 254bdd1243dSDimitry Andric sys::path::remove_dots(path, true); 255bdd1243dSDimitry Andric ltoObjName = saver().save(path.str()); 256bdd1243dSDimitry Andric } 2575f757f3fSDimitry Andric if (ctx.config.saveTemps || emitASM) 258bdd1243dSDimitry Andric saveBuffer(buf[i].second, ltoObjName); 2595f757f3fSDimitry Andric if (!emitASM) 260349cc55cSDimitry Andric ret.push_back(make<ObjFile>(ctx, MemoryBufferRef(objBuf, ltoObjName))); 2615ffd83dbSDimitry Andric } 2620b57cec5SDimitry Andric 2630b57cec5SDimitry Andric return ret; 2640b57cec5SDimitry Andric } 265