//===-- llvm/Debuginfod/Debuginfod.cpp - Debuginfod client library --------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
///
/// \file
///
/// This file contains several definitions for the debuginfod client and server.
/// For the client, this file defines the fetchInfo function. For the server,
/// this file defines the DebuginfodLogEntry and DebuginfodServer structs, as
/// well as the DebuginfodLog, DebuginfodCollection classes. The fetchInfo
/// function retrieves any of the three supported artifact types: (executable,
/// debuginfo, source file) associated with a build-id from debuginfod servers.
/// If a source file is to be fetched, its absolute path must be specified in
/// the Description argument to fetchInfo. The DebuginfodLogEntry,
/// DebuginfodLog, and DebuginfodCollection are used by the DebuginfodServer to
/// scan the local filesystem for binaries and serve the debuginfod protocol.
210eae32dcSDimitry Andric /// 220eae32dcSDimitry Andric //===----------------------------------------------------------------------===// 230eae32dcSDimitry Andric 240eae32dcSDimitry Andric #include "llvm/Debuginfod/Debuginfod.h" 25bdd1243dSDimitry Andric #include "llvm/ADT/StringExtras.h" 260eae32dcSDimitry Andric #include "llvm/ADT/StringRef.h" 27753f127fSDimitry Andric #include "llvm/BinaryFormat/Magic.h" 28753f127fSDimitry Andric #include "llvm/DebugInfo/DWARF/DWARFContext.h" 29753f127fSDimitry Andric #include "llvm/DebugInfo/Symbolize/Symbolize.h" 300eae32dcSDimitry Andric #include "llvm/Debuginfod/HTTPClient.h" 31bdd1243dSDimitry Andric #include "llvm/Object/BuildID.h" 32753f127fSDimitry Andric #include "llvm/Object/ELFObjectFile.h" 330eae32dcSDimitry Andric #include "llvm/Support/CachePruning.h" 340eae32dcSDimitry Andric #include "llvm/Support/Caching.h" 3504eeddc0SDimitry Andric #include "llvm/Support/Errc.h" 360eae32dcSDimitry Andric #include "llvm/Support/Error.h" 370eae32dcSDimitry Andric #include "llvm/Support/FileUtilities.h" 38bdd1243dSDimitry Andric #include "llvm/Support/MemoryBuffer.h" 3904eeddc0SDimitry Andric #include "llvm/Support/Path.h" 40753f127fSDimitry Andric #include "llvm/Support/ThreadPool.h" 410eae32dcSDimitry Andric #include "llvm/Support/xxhash.h" 420eae32dcSDimitry Andric 43753f127fSDimitry Andric #include <atomic> 44*5f757f3fSDimitry Andric #include <optional> 45bdd1243dSDimitry Andric #include <thread> 46753f127fSDimitry Andric 470eae32dcSDimitry Andric namespace llvm { 48bdd1243dSDimitry Andric 49bdd1243dSDimitry Andric using llvm::object::BuildIDRef; 50bdd1243dSDimitry Andric 51*5f757f3fSDimitry Andric namespace { 52*5f757f3fSDimitry Andric std::optional<SmallVector<StringRef>> DebuginfodUrls; 53*5f757f3fSDimitry Andric // Many Readers/Single Writer lock protecting the global debuginfod URL list. 
54*5f757f3fSDimitry Andric llvm::sys::RWMutex UrlsMutex; 55*5f757f3fSDimitry Andric } // namespace 56*5f757f3fSDimitry Andric 57*5f757f3fSDimitry Andric static std::string uniqueKey(llvm::StringRef S) { 58*5f757f3fSDimitry Andric return utostr(xxh3_64bits(S)); 59*5f757f3fSDimitry Andric } 600eae32dcSDimitry Andric 610eae32dcSDimitry Andric // Returns a binary BuildID as a normalized hex string. 620eae32dcSDimitry Andric // Uses lowercase for compatibility with common debuginfod servers. 630eae32dcSDimitry Andric static std::string buildIDToString(BuildIDRef ID) { 640eae32dcSDimitry Andric return llvm::toHex(ID, /*LowerCase=*/true); 650eae32dcSDimitry Andric } 660eae32dcSDimitry Andric 671ac55f4cSDimitry Andric bool canUseDebuginfod() { 681ac55f4cSDimitry Andric return HTTPClient::isAvailable() && !getDefaultDebuginfodUrls().empty(); 691ac55f4cSDimitry Andric } 701ac55f4cSDimitry Andric 711ac55f4cSDimitry Andric SmallVector<StringRef> getDefaultDebuginfodUrls() { 72*5f757f3fSDimitry Andric std::shared_lock<llvm::sys::RWMutex> ReadGuard(UrlsMutex); 73*5f757f3fSDimitry Andric if (!DebuginfodUrls) { 74*5f757f3fSDimitry Andric // Only read from the environment variable if the user hasn't already 75*5f757f3fSDimitry Andric // set the value 76*5f757f3fSDimitry Andric ReadGuard.unlock(); 77*5f757f3fSDimitry Andric std::unique_lock<llvm::sys::RWMutex> WriteGuard(UrlsMutex); 78*5f757f3fSDimitry Andric DebuginfodUrls = SmallVector<StringRef>(); 79*5f757f3fSDimitry Andric if (const char *DebuginfodUrlsEnv = std::getenv("DEBUGINFOD_URLS")) { 80*5f757f3fSDimitry Andric StringRef(DebuginfodUrlsEnv) 81*5f757f3fSDimitry Andric .split(DebuginfodUrls.value(), " ", -1, false); 82*5f757f3fSDimitry Andric } 83*5f757f3fSDimitry Andric WriteGuard.unlock(); 84*5f757f3fSDimitry Andric ReadGuard.lock(); 85*5f757f3fSDimitry Andric } 86*5f757f3fSDimitry Andric return DebuginfodUrls.value(); 87*5f757f3fSDimitry Andric } 880eae32dcSDimitry Andric 89*5f757f3fSDimitry Andric // Set the default 
debuginfod URL list, override the environment variable 90*5f757f3fSDimitry Andric void setDefaultDebuginfodUrls(const SmallVector<StringRef> &URLs) { 91*5f757f3fSDimitry Andric std::unique_lock<llvm::sys::RWMutex> WriteGuard(UrlsMutex); 92*5f757f3fSDimitry Andric DebuginfodUrls = URLs; 930eae32dcSDimitry Andric } 940eae32dcSDimitry Andric 95753f127fSDimitry Andric /// Finds a default local file caching directory for the debuginfod client, 96753f127fSDimitry Andric /// first checking DEBUGINFOD_CACHE_PATH. 970eae32dcSDimitry Andric Expected<std::string> getDefaultDebuginfodCacheDirectory() { 980eae32dcSDimitry Andric if (const char *CacheDirectoryEnv = std::getenv("DEBUGINFOD_CACHE_PATH")) 990eae32dcSDimitry Andric return CacheDirectoryEnv; 1000eae32dcSDimitry Andric 1010eae32dcSDimitry Andric SmallString<64> CacheDirectory; 1020eae32dcSDimitry Andric if (!sys::path::cache_directory(CacheDirectory)) 1030eae32dcSDimitry Andric return createStringError( 1040eae32dcSDimitry Andric errc::io_error, "Unable to determine appropriate cache directory."); 10504eeddc0SDimitry Andric sys::path::append(CacheDirectory, "llvm-debuginfod", "client"); 1060eae32dcSDimitry Andric return std::string(CacheDirectory); 1070eae32dcSDimitry Andric } 1080eae32dcSDimitry Andric 1090eae32dcSDimitry Andric std::chrono::milliseconds getDefaultDebuginfodTimeout() { 1100eae32dcSDimitry Andric long Timeout; 1110eae32dcSDimitry Andric const char *DebuginfodTimeoutEnv = std::getenv("DEBUGINFOD_TIMEOUT"); 1120eae32dcSDimitry Andric if (DebuginfodTimeoutEnv && 1130eae32dcSDimitry Andric to_integer(StringRef(DebuginfodTimeoutEnv).trim(), Timeout, 10)) 1140eae32dcSDimitry Andric return std::chrono::milliseconds(Timeout * 1000); 1150eae32dcSDimitry Andric 1160eae32dcSDimitry Andric return std::chrono::milliseconds(90 * 1000); 1170eae32dcSDimitry Andric } 1180eae32dcSDimitry Andric 1190eae32dcSDimitry Andric /// The following functions fetch a debuginfod artifact to a file in a local 1200eae32dcSDimitry 
Andric /// cache and return the cached file path. They first search the local cache, 1210eae32dcSDimitry Andric /// followed by the debuginfod servers. 1220eae32dcSDimitry Andric 1230eae32dcSDimitry Andric Expected<std::string> getCachedOrDownloadSource(BuildIDRef ID, 1240eae32dcSDimitry Andric StringRef SourceFilePath) { 1250eae32dcSDimitry Andric SmallString<64> UrlPath; 1260eae32dcSDimitry Andric sys::path::append(UrlPath, sys::path::Style::posix, "buildid", 1270eae32dcSDimitry Andric buildIDToString(ID), "source", 1280eae32dcSDimitry Andric sys::path::convert_to_slash(SourceFilePath)); 1290eae32dcSDimitry Andric return getCachedOrDownloadArtifact(uniqueKey(UrlPath), UrlPath); 1300eae32dcSDimitry Andric } 1310eae32dcSDimitry Andric 1320eae32dcSDimitry Andric Expected<std::string> getCachedOrDownloadExecutable(BuildIDRef ID) { 1330eae32dcSDimitry Andric SmallString<64> UrlPath; 1340eae32dcSDimitry Andric sys::path::append(UrlPath, sys::path::Style::posix, "buildid", 1350eae32dcSDimitry Andric buildIDToString(ID), "executable"); 1360eae32dcSDimitry Andric return getCachedOrDownloadArtifact(uniqueKey(UrlPath), UrlPath); 1370eae32dcSDimitry Andric } 1380eae32dcSDimitry Andric 1390eae32dcSDimitry Andric Expected<std::string> getCachedOrDownloadDebuginfo(BuildIDRef ID) { 1400eae32dcSDimitry Andric SmallString<64> UrlPath; 1410eae32dcSDimitry Andric sys::path::append(UrlPath, sys::path::Style::posix, "buildid", 1420eae32dcSDimitry Andric buildIDToString(ID), "debuginfo"); 1430eae32dcSDimitry Andric return getCachedOrDownloadArtifact(uniqueKey(UrlPath), UrlPath); 1440eae32dcSDimitry Andric } 1450eae32dcSDimitry Andric 1460eae32dcSDimitry Andric // General fetching function. 
1470eae32dcSDimitry Andric Expected<std::string> getCachedOrDownloadArtifact(StringRef UniqueKey, 1480eae32dcSDimitry Andric StringRef UrlPath) { 1490eae32dcSDimitry Andric SmallString<10> CacheDir; 1500eae32dcSDimitry Andric 1510eae32dcSDimitry Andric Expected<std::string> CacheDirOrErr = getDefaultDebuginfodCacheDirectory(); 1520eae32dcSDimitry Andric if (!CacheDirOrErr) 1530eae32dcSDimitry Andric return CacheDirOrErr.takeError(); 1540eae32dcSDimitry Andric CacheDir = *CacheDirOrErr; 1550eae32dcSDimitry Andric 1560eae32dcSDimitry Andric return getCachedOrDownloadArtifact(UniqueKey, UrlPath, CacheDir, 1571ac55f4cSDimitry Andric getDefaultDebuginfodUrls(), 1580eae32dcSDimitry Andric getDefaultDebuginfodTimeout()); 1590eae32dcSDimitry Andric } 1600eae32dcSDimitry Andric 16181ad6265SDimitry Andric namespace { 16281ad6265SDimitry Andric 16381ad6265SDimitry Andric /// A simple handler which streams the returned data to a cache file. The cache 16481ad6265SDimitry Andric /// file is only created if a 200 OK status is observed. 
16581ad6265SDimitry Andric class StreamedHTTPResponseHandler : public HTTPResponseHandler { 16681ad6265SDimitry Andric using CreateStreamFn = 16781ad6265SDimitry Andric std::function<Expected<std::unique_ptr<CachedFileStream>>()>; 16881ad6265SDimitry Andric CreateStreamFn CreateStream; 16981ad6265SDimitry Andric HTTPClient &Client; 17081ad6265SDimitry Andric std::unique_ptr<CachedFileStream> FileStream; 17181ad6265SDimitry Andric 17281ad6265SDimitry Andric public: 17381ad6265SDimitry Andric StreamedHTTPResponseHandler(CreateStreamFn CreateStream, HTTPClient &Client) 17481ad6265SDimitry Andric : CreateStream(CreateStream), Client(Client) {} 17581ad6265SDimitry Andric virtual ~StreamedHTTPResponseHandler() = default; 17681ad6265SDimitry Andric 17781ad6265SDimitry Andric Error handleBodyChunk(StringRef BodyChunk) override; 17881ad6265SDimitry Andric }; 17981ad6265SDimitry Andric 18081ad6265SDimitry Andric } // namespace 18181ad6265SDimitry Andric 18281ad6265SDimitry Andric Error StreamedHTTPResponseHandler::handleBodyChunk(StringRef BodyChunk) { 18381ad6265SDimitry Andric if (!FileStream) { 1841ac55f4cSDimitry Andric unsigned Code = Client.responseCode(); 1851ac55f4cSDimitry Andric if (Code && Code != 200) 18681ad6265SDimitry Andric return Error::success(); 18781ad6265SDimitry Andric Expected<std::unique_ptr<CachedFileStream>> FileStreamOrError = 18881ad6265SDimitry Andric CreateStream(); 18981ad6265SDimitry Andric if (!FileStreamOrError) 19081ad6265SDimitry Andric return FileStreamOrError.takeError(); 19181ad6265SDimitry Andric FileStream = std::move(*FileStreamOrError); 19281ad6265SDimitry Andric } 19381ad6265SDimitry Andric *FileStream->OS << BodyChunk; 19481ad6265SDimitry Andric return Error::success(); 19581ad6265SDimitry Andric } 19681ad6265SDimitry Andric 197bdd1243dSDimitry Andric // An over-accepting simplification of the HTTP RFC 7230 spec. 
198bdd1243dSDimitry Andric static bool isHeader(StringRef S) { 199bdd1243dSDimitry Andric StringRef Name; 200bdd1243dSDimitry Andric StringRef Value; 201bdd1243dSDimitry Andric std::tie(Name, Value) = S.split(':'); 202bdd1243dSDimitry Andric if (Name.empty() || Value.empty()) 203bdd1243dSDimitry Andric return false; 204bdd1243dSDimitry Andric return all_of(Name, [](char C) { return llvm::isPrint(C) && C != ' '; }) && 205bdd1243dSDimitry Andric all_of(Value, [](char C) { return llvm::isPrint(C) || C == '\t'; }); 206bdd1243dSDimitry Andric } 207bdd1243dSDimitry Andric 208bdd1243dSDimitry Andric static SmallVector<std::string, 0> getHeaders() { 209bdd1243dSDimitry Andric const char *Filename = getenv("DEBUGINFOD_HEADERS_FILE"); 210bdd1243dSDimitry Andric if (!Filename) 211bdd1243dSDimitry Andric return {}; 212bdd1243dSDimitry Andric ErrorOr<std::unique_ptr<MemoryBuffer>> HeadersFile = 213bdd1243dSDimitry Andric MemoryBuffer::getFile(Filename, /*IsText=*/true); 214bdd1243dSDimitry Andric if (!HeadersFile) 215bdd1243dSDimitry Andric return {}; 216bdd1243dSDimitry Andric 217bdd1243dSDimitry Andric SmallVector<std::string, 0> Headers; 218bdd1243dSDimitry Andric uint64_t LineNumber = 0; 219bdd1243dSDimitry Andric for (StringRef Line : llvm::split((*HeadersFile)->getBuffer(), '\n')) { 220bdd1243dSDimitry Andric LineNumber++; 221bdd1243dSDimitry Andric if (!Line.empty() && Line.back() == '\r') 222bdd1243dSDimitry Andric Line = Line.drop_back(); 223bdd1243dSDimitry Andric if (!isHeader(Line)) { 224bdd1243dSDimitry Andric if (!all_of(Line, llvm::isSpace)) 225bdd1243dSDimitry Andric WithColor::warning() 226bdd1243dSDimitry Andric << "could not parse debuginfod header: " << Filename << ':' 227bdd1243dSDimitry Andric << LineNumber << '\n'; 228bdd1243dSDimitry Andric continue; 229bdd1243dSDimitry Andric } 230bdd1243dSDimitry Andric Headers.emplace_back(Line); 231bdd1243dSDimitry Andric } 232bdd1243dSDimitry Andric return Headers; 233bdd1243dSDimitry Andric } 234bdd1243dSDimitry 
Andric 2350eae32dcSDimitry Andric Expected<std::string> getCachedOrDownloadArtifact( 2360eae32dcSDimitry Andric StringRef UniqueKey, StringRef UrlPath, StringRef CacheDirectoryPath, 2370eae32dcSDimitry Andric ArrayRef<StringRef> DebuginfodUrls, std::chrono::milliseconds Timeout) { 2380eae32dcSDimitry Andric SmallString<64> AbsCachedArtifactPath; 2390eae32dcSDimitry Andric sys::path::append(AbsCachedArtifactPath, CacheDirectoryPath, 2400eae32dcSDimitry Andric "llvmcache-" + UniqueKey); 2410eae32dcSDimitry Andric 2420eae32dcSDimitry Andric Expected<FileCache> CacheOrErr = 2430eae32dcSDimitry Andric localCache("Debuginfod-client", ".debuginfod-client", CacheDirectoryPath); 2440eae32dcSDimitry Andric if (!CacheOrErr) 2450eae32dcSDimitry Andric return CacheOrErr.takeError(); 2460eae32dcSDimitry Andric 2470eae32dcSDimitry Andric FileCache Cache = *CacheOrErr; 2480eae32dcSDimitry Andric // We choose an arbitrary Task parameter as we do not make use of it. 2490eae32dcSDimitry Andric unsigned Task = 0; 250bdd1243dSDimitry Andric Expected<AddStreamFn> CacheAddStreamOrErr = Cache(Task, UniqueKey, ""); 2510eae32dcSDimitry Andric if (!CacheAddStreamOrErr) 2520eae32dcSDimitry Andric return CacheAddStreamOrErr.takeError(); 2530eae32dcSDimitry Andric AddStreamFn &CacheAddStream = *CacheAddStreamOrErr; 2540eae32dcSDimitry Andric if (!CacheAddStream) 2550eae32dcSDimitry Andric return std::string(AbsCachedArtifactPath); 2560eae32dcSDimitry Andric // The artifact was not found in the local cache, query the debuginfod 2570eae32dcSDimitry Andric // servers. 
2580eae32dcSDimitry Andric if (!HTTPClient::isAvailable()) 2590eae32dcSDimitry Andric return createStringError(errc::io_error, 2600eae32dcSDimitry Andric "No working HTTP client is available."); 2610eae32dcSDimitry Andric 2620eae32dcSDimitry Andric if (!HTTPClient::IsInitialized) 2630eae32dcSDimitry Andric return createStringError( 2640eae32dcSDimitry Andric errc::io_error, 2650eae32dcSDimitry Andric "A working HTTP client is available, but it is not initialized. To " 2660eae32dcSDimitry Andric "allow Debuginfod to make HTTP requests, call HTTPClient::initialize() " 2670eae32dcSDimitry Andric "at the beginning of main."); 2680eae32dcSDimitry Andric 2690eae32dcSDimitry Andric HTTPClient Client; 2700eae32dcSDimitry Andric Client.setTimeout(Timeout); 2710eae32dcSDimitry Andric for (StringRef ServerUrl : DebuginfodUrls) { 2720eae32dcSDimitry Andric SmallString<64> ArtifactUrl; 2730eae32dcSDimitry Andric sys::path::append(ArtifactUrl, sys::path::Style::posix, ServerUrl, UrlPath); 2740eae32dcSDimitry Andric 27581ad6265SDimitry Andric // Perform the HTTP request and if successful, write the response body to 27681ad6265SDimitry Andric // the cache. 
27706c3fb27SDimitry Andric { 278bdd1243dSDimitry Andric StreamedHTTPResponseHandler Handler( 279bdd1243dSDimitry Andric [&]() { return CacheAddStream(Task, ""); }, Client); 28081ad6265SDimitry Andric HTTPRequest Request(ArtifactUrl); 281bdd1243dSDimitry Andric Request.Headers = getHeaders(); 28281ad6265SDimitry Andric Error Err = Client.perform(Request, Handler); 28381ad6265SDimitry Andric if (Err) 28481ad6265SDimitry Andric return std::move(Err); 2850eae32dcSDimitry Andric 2861ac55f4cSDimitry Andric unsigned Code = Client.responseCode(); 2871ac55f4cSDimitry Andric if (Code && Code != 200) 2880eae32dcSDimitry Andric continue; 28906c3fb27SDimitry Andric } 29006c3fb27SDimitry Andric 29106c3fb27SDimitry Andric Expected<CachePruningPolicy> PruningPolicyOrErr = 29206c3fb27SDimitry Andric parseCachePruningPolicy(std::getenv("DEBUGINFOD_CACHE_POLICY")); 29306c3fb27SDimitry Andric if (!PruningPolicyOrErr) 29406c3fb27SDimitry Andric return PruningPolicyOrErr.takeError(); 29506c3fb27SDimitry Andric pruneCache(CacheDirectoryPath, *PruningPolicyOrErr); 2960eae32dcSDimitry Andric 2970eae32dcSDimitry Andric // Return the path to the artifact on disk. 
2980eae32dcSDimitry Andric return std::string(AbsCachedArtifactPath); 2990eae32dcSDimitry Andric } 3000eae32dcSDimitry Andric 3010eae32dcSDimitry Andric return createStringError(errc::argument_out_of_domain, "build id not found"); 3020eae32dcSDimitry Andric } 303753f127fSDimitry Andric 304753f127fSDimitry Andric DebuginfodLogEntry::DebuginfodLogEntry(const Twine &Message) 305753f127fSDimitry Andric : Message(Message.str()) {} 306753f127fSDimitry Andric 307753f127fSDimitry Andric void DebuginfodLog::push(const Twine &Message) { 308753f127fSDimitry Andric push(DebuginfodLogEntry(Message)); 309753f127fSDimitry Andric } 310753f127fSDimitry Andric 311753f127fSDimitry Andric void DebuginfodLog::push(DebuginfodLogEntry Entry) { 312753f127fSDimitry Andric { 313753f127fSDimitry Andric std::lock_guard<std::mutex> Guard(QueueMutex); 314753f127fSDimitry Andric LogEntryQueue.push(Entry); 315753f127fSDimitry Andric } 316753f127fSDimitry Andric QueueCondition.notify_one(); 317753f127fSDimitry Andric } 318753f127fSDimitry Andric 319753f127fSDimitry Andric DebuginfodLogEntry DebuginfodLog::pop() { 320753f127fSDimitry Andric { 321753f127fSDimitry Andric std::unique_lock<std::mutex> Guard(QueueMutex); 322753f127fSDimitry Andric // Wait for messages to be pushed into the queue. 
323753f127fSDimitry Andric QueueCondition.wait(Guard, [&] { return !LogEntryQueue.empty(); }); 324753f127fSDimitry Andric } 325753f127fSDimitry Andric std::lock_guard<std::mutex> Guard(QueueMutex); 326753f127fSDimitry Andric if (!LogEntryQueue.size()) 327753f127fSDimitry Andric llvm_unreachable("Expected message in the queue."); 328753f127fSDimitry Andric 329753f127fSDimitry Andric DebuginfodLogEntry Entry = LogEntryQueue.front(); 330753f127fSDimitry Andric LogEntryQueue.pop(); 331753f127fSDimitry Andric return Entry; 332753f127fSDimitry Andric } 333753f127fSDimitry Andric 334753f127fSDimitry Andric DebuginfodCollection::DebuginfodCollection(ArrayRef<StringRef> PathsRef, 335753f127fSDimitry Andric DebuginfodLog &Log, ThreadPool &Pool, 336753f127fSDimitry Andric double MinInterval) 337753f127fSDimitry Andric : Log(Log), Pool(Pool), MinInterval(MinInterval) { 338753f127fSDimitry Andric for (StringRef Path : PathsRef) 339753f127fSDimitry Andric Paths.push_back(Path.str()); 340753f127fSDimitry Andric } 341753f127fSDimitry Andric 342753f127fSDimitry Andric Error DebuginfodCollection::update() { 343753f127fSDimitry Andric std::lock_guard<sys::Mutex> Guard(UpdateMutex); 344753f127fSDimitry Andric if (UpdateTimer.isRunning()) 345753f127fSDimitry Andric UpdateTimer.stopTimer(); 346753f127fSDimitry Andric UpdateTimer.clear(); 347753f127fSDimitry Andric for (const std::string &Path : Paths) { 348753f127fSDimitry Andric Log.push("Updating binaries at path " + Path); 349753f127fSDimitry Andric if (Error Err = findBinaries(Path)) 350753f127fSDimitry Andric return Err; 351753f127fSDimitry Andric } 352753f127fSDimitry Andric Log.push("Updated collection"); 353753f127fSDimitry Andric UpdateTimer.startTimer(); 354753f127fSDimitry Andric return Error::success(); 355753f127fSDimitry Andric } 356753f127fSDimitry Andric 357753f127fSDimitry Andric Expected<bool> DebuginfodCollection::updateIfStale() { 358753f127fSDimitry Andric if (!UpdateTimer.isRunning()) 359753f127fSDimitry Andric 
return false; 360753f127fSDimitry Andric UpdateTimer.stopTimer(); 361753f127fSDimitry Andric double Time = UpdateTimer.getTotalTime().getWallTime(); 362753f127fSDimitry Andric UpdateTimer.startTimer(); 363753f127fSDimitry Andric if (Time < MinInterval) 364753f127fSDimitry Andric return false; 365753f127fSDimitry Andric if (Error Err = update()) 366753f127fSDimitry Andric return std::move(Err); 367753f127fSDimitry Andric return true; 368753f127fSDimitry Andric } 369753f127fSDimitry Andric 370753f127fSDimitry Andric Error DebuginfodCollection::updateForever(std::chrono::milliseconds Interval) { 371753f127fSDimitry Andric while (true) { 372753f127fSDimitry Andric if (Error Err = update()) 373753f127fSDimitry Andric return Err; 374753f127fSDimitry Andric std::this_thread::sleep_for(Interval); 375753f127fSDimitry Andric } 376753f127fSDimitry Andric llvm_unreachable("updateForever loop should never end"); 377753f127fSDimitry Andric } 378753f127fSDimitry Andric 379753f127fSDimitry Andric static bool hasELFMagic(StringRef FilePath) { 380753f127fSDimitry Andric file_magic Type; 381753f127fSDimitry Andric std::error_code EC = identify_magic(FilePath, Type); 382753f127fSDimitry Andric if (EC) 383753f127fSDimitry Andric return false; 384753f127fSDimitry Andric switch (Type) { 385753f127fSDimitry Andric case file_magic::elf: 386753f127fSDimitry Andric case file_magic::elf_relocatable: 387753f127fSDimitry Andric case file_magic::elf_executable: 388753f127fSDimitry Andric case file_magic::elf_shared_object: 389753f127fSDimitry Andric case file_magic::elf_core: 390753f127fSDimitry Andric return true; 391753f127fSDimitry Andric default: 392753f127fSDimitry Andric return false; 393753f127fSDimitry Andric } 394753f127fSDimitry Andric } 395753f127fSDimitry Andric 396753f127fSDimitry Andric Error DebuginfodCollection::findBinaries(StringRef Path) { 397753f127fSDimitry Andric std::error_code EC; 398753f127fSDimitry Andric sys::fs::recursive_directory_iterator I(Twine(Path), EC), E; 
399753f127fSDimitry Andric std::mutex IteratorMutex; 400753f127fSDimitry Andric ThreadPoolTaskGroup IteratorGroup(Pool); 401753f127fSDimitry Andric for (unsigned WorkerIndex = 0; WorkerIndex < Pool.getThreadCount(); 402753f127fSDimitry Andric WorkerIndex++) { 403753f127fSDimitry Andric IteratorGroup.async([&, this]() -> void { 404753f127fSDimitry Andric std::string FilePath; 405753f127fSDimitry Andric while (true) { 406753f127fSDimitry Andric { 407753f127fSDimitry Andric // Check if iteration is over or there is an error during iteration 408753f127fSDimitry Andric std::lock_guard<std::mutex> Guard(IteratorMutex); 409753f127fSDimitry Andric if (I == E || EC) 410753f127fSDimitry Andric return; 411753f127fSDimitry Andric // Grab a file path from the directory iterator and advance the 412753f127fSDimitry Andric // iterator. 413753f127fSDimitry Andric FilePath = I->path(); 414753f127fSDimitry Andric I.increment(EC); 415753f127fSDimitry Andric } 416753f127fSDimitry Andric 417753f127fSDimitry Andric // Inspect the file at this path to determine if it is debuginfo. 
418753f127fSDimitry Andric if (!hasELFMagic(FilePath)) 419753f127fSDimitry Andric continue; 420753f127fSDimitry Andric 421753f127fSDimitry Andric Expected<object::OwningBinary<object::Binary>> BinOrErr = 422753f127fSDimitry Andric object::createBinary(FilePath); 423753f127fSDimitry Andric 424753f127fSDimitry Andric if (!BinOrErr) { 425753f127fSDimitry Andric consumeError(BinOrErr.takeError()); 426753f127fSDimitry Andric continue; 427753f127fSDimitry Andric } 428753f127fSDimitry Andric object::Binary *Bin = std::move(BinOrErr.get().getBinary()); 429753f127fSDimitry Andric if (!Bin->isObject()) 430753f127fSDimitry Andric continue; 431753f127fSDimitry Andric 432753f127fSDimitry Andric // TODO: Support non-ELF binaries 433753f127fSDimitry Andric object::ELFObjectFileBase *Object = 434753f127fSDimitry Andric dyn_cast<object::ELFObjectFileBase>(Bin); 435753f127fSDimitry Andric if (!Object) 436753f127fSDimitry Andric continue; 437753f127fSDimitry Andric 43806c3fb27SDimitry Andric BuildIDRef ID = getBuildID(Object); 43906c3fb27SDimitry Andric if (ID.empty()) 440753f127fSDimitry Andric continue; 441753f127fSDimitry Andric 44206c3fb27SDimitry Andric std::string IDString = buildIDToString(ID); 443bdd1243dSDimitry Andric if (Object->hasDebugInfo()) { 444753f127fSDimitry Andric std::lock_guard<sys::RWMutex> DebugBinariesGuard(DebugBinariesMutex); 445bdd1243dSDimitry Andric (void)DebugBinaries.try_emplace(IDString, std::move(FilePath)); 446753f127fSDimitry Andric } else { 447753f127fSDimitry Andric std::lock_guard<sys::RWMutex> BinariesGuard(BinariesMutex); 448bdd1243dSDimitry Andric (void)Binaries.try_emplace(IDString, std::move(FilePath)); 449753f127fSDimitry Andric } 450753f127fSDimitry Andric } 451753f127fSDimitry Andric }); 452753f127fSDimitry Andric } 453753f127fSDimitry Andric IteratorGroup.wait(); 454753f127fSDimitry Andric std::unique_lock<std::mutex> Guard(IteratorMutex); 455753f127fSDimitry Andric if (EC) 456753f127fSDimitry Andric return errorCodeToError(EC); 
457753f127fSDimitry Andric return Error::success(); 458753f127fSDimitry Andric } 459753f127fSDimitry Andric 460bdd1243dSDimitry Andric Expected<std::optional<std::string>> 461753f127fSDimitry Andric DebuginfodCollection::getBinaryPath(BuildIDRef ID) { 462753f127fSDimitry Andric Log.push("getting binary path of ID " + buildIDToString(ID)); 463753f127fSDimitry Andric std::shared_lock<sys::RWMutex> Guard(BinariesMutex); 464753f127fSDimitry Andric auto Loc = Binaries.find(buildIDToString(ID)); 465753f127fSDimitry Andric if (Loc != Binaries.end()) { 466753f127fSDimitry Andric std::string Path = Loc->getValue(); 467753f127fSDimitry Andric return Path; 468753f127fSDimitry Andric } 469bdd1243dSDimitry Andric return std::nullopt; 470753f127fSDimitry Andric } 471753f127fSDimitry Andric 472bdd1243dSDimitry Andric Expected<std::optional<std::string>> 473753f127fSDimitry Andric DebuginfodCollection::getDebugBinaryPath(BuildIDRef ID) { 474753f127fSDimitry Andric Log.push("getting debug binary path of ID " + buildIDToString(ID)); 475753f127fSDimitry Andric std::shared_lock<sys::RWMutex> Guard(DebugBinariesMutex); 476753f127fSDimitry Andric auto Loc = DebugBinaries.find(buildIDToString(ID)); 477753f127fSDimitry Andric if (Loc != DebugBinaries.end()) { 478753f127fSDimitry Andric std::string Path = Loc->getValue(); 479753f127fSDimitry Andric return Path; 480753f127fSDimitry Andric } 481bdd1243dSDimitry Andric return std::nullopt; 482753f127fSDimitry Andric } 483753f127fSDimitry Andric 484753f127fSDimitry Andric Expected<std::string> DebuginfodCollection::findBinaryPath(BuildIDRef ID) { 485753f127fSDimitry Andric { 486753f127fSDimitry Andric // Check collection; perform on-demand update if stale. 
487bdd1243dSDimitry Andric Expected<std::optional<std::string>> PathOrErr = getBinaryPath(ID); 488753f127fSDimitry Andric if (!PathOrErr) 489753f127fSDimitry Andric return PathOrErr.takeError(); 490bdd1243dSDimitry Andric std::optional<std::string> Path = *PathOrErr; 491753f127fSDimitry Andric if (!Path) { 492753f127fSDimitry Andric Expected<bool> UpdatedOrErr = updateIfStale(); 493753f127fSDimitry Andric if (!UpdatedOrErr) 494753f127fSDimitry Andric return UpdatedOrErr.takeError(); 495753f127fSDimitry Andric if (*UpdatedOrErr) { 496753f127fSDimitry Andric // Try once more. 497753f127fSDimitry Andric PathOrErr = getBinaryPath(ID); 498753f127fSDimitry Andric if (!PathOrErr) 499753f127fSDimitry Andric return PathOrErr.takeError(); 500753f127fSDimitry Andric Path = *PathOrErr; 501753f127fSDimitry Andric } 502753f127fSDimitry Andric } 503753f127fSDimitry Andric if (Path) 504bdd1243dSDimitry Andric return *Path; 505753f127fSDimitry Andric } 506753f127fSDimitry Andric 507753f127fSDimitry Andric // Try federation. 508753f127fSDimitry Andric Expected<std::string> PathOrErr = getCachedOrDownloadExecutable(ID); 509753f127fSDimitry Andric if (!PathOrErr) 510753f127fSDimitry Andric consumeError(PathOrErr.takeError()); 511753f127fSDimitry Andric 512753f127fSDimitry Andric // Fall back to debug binary. 513753f127fSDimitry Andric return findDebugBinaryPath(ID); 514753f127fSDimitry Andric } 515753f127fSDimitry Andric 516753f127fSDimitry Andric Expected<std::string> DebuginfodCollection::findDebugBinaryPath(BuildIDRef ID) { 517753f127fSDimitry Andric // Check collection; perform on-demand update if stale. 
518bdd1243dSDimitry Andric Expected<std::optional<std::string>> PathOrErr = getDebugBinaryPath(ID); 519753f127fSDimitry Andric if (!PathOrErr) 520753f127fSDimitry Andric return PathOrErr.takeError(); 521bdd1243dSDimitry Andric std::optional<std::string> Path = *PathOrErr; 522753f127fSDimitry Andric if (!Path) { 523753f127fSDimitry Andric Expected<bool> UpdatedOrErr = updateIfStale(); 524753f127fSDimitry Andric if (!UpdatedOrErr) 525753f127fSDimitry Andric return UpdatedOrErr.takeError(); 526753f127fSDimitry Andric if (*UpdatedOrErr) { 527753f127fSDimitry Andric // Try once more. 528753f127fSDimitry Andric PathOrErr = getBinaryPath(ID); 529753f127fSDimitry Andric if (!PathOrErr) 530753f127fSDimitry Andric return PathOrErr.takeError(); 531753f127fSDimitry Andric Path = *PathOrErr; 532753f127fSDimitry Andric } 533753f127fSDimitry Andric } 534753f127fSDimitry Andric if (Path) 535bdd1243dSDimitry Andric return *Path; 536753f127fSDimitry Andric 537753f127fSDimitry Andric // Try federation. 538753f127fSDimitry Andric return getCachedOrDownloadDebuginfo(ID); 539753f127fSDimitry Andric } 540753f127fSDimitry Andric 541753f127fSDimitry Andric DebuginfodServer::DebuginfodServer(DebuginfodLog &Log, 542753f127fSDimitry Andric DebuginfodCollection &Collection) 543753f127fSDimitry Andric : Log(Log), Collection(Collection) { 544753f127fSDimitry Andric cantFail( 545753f127fSDimitry Andric Server.get(R"(/buildid/(.*)/debuginfo)", [&](HTTPServerRequest Request) { 546753f127fSDimitry Andric Log.push("GET " + Request.UrlPath); 547753f127fSDimitry Andric std::string IDString; 548753f127fSDimitry Andric if (!tryGetFromHex(Request.UrlPathMatches[0], IDString)) { 549753f127fSDimitry Andric Request.setResponse( 550753f127fSDimitry Andric {404, "text/plain", "Build ID is not a hex string\n"}); 551753f127fSDimitry Andric return; 552753f127fSDimitry Andric } 553bdd1243dSDimitry Andric object::BuildID ID(IDString.begin(), IDString.end()); 554753f127fSDimitry Andric Expected<std::string> 
PathOrErr = Collection.findDebugBinaryPath(ID); 555753f127fSDimitry Andric if (Error Err = PathOrErr.takeError()) { 556753f127fSDimitry Andric consumeError(std::move(Err)); 557753f127fSDimitry Andric Request.setResponse({404, "text/plain", "Build ID not found\n"}); 558753f127fSDimitry Andric return; 559753f127fSDimitry Andric } 560753f127fSDimitry Andric streamFile(Request, *PathOrErr); 561753f127fSDimitry Andric })); 562753f127fSDimitry Andric cantFail( 563753f127fSDimitry Andric Server.get(R"(/buildid/(.*)/executable)", [&](HTTPServerRequest Request) { 564753f127fSDimitry Andric Log.push("GET " + Request.UrlPath); 565753f127fSDimitry Andric std::string IDString; 566753f127fSDimitry Andric if (!tryGetFromHex(Request.UrlPathMatches[0], IDString)) { 567753f127fSDimitry Andric Request.setResponse( 568753f127fSDimitry Andric {404, "text/plain", "Build ID is not a hex string\n"}); 569753f127fSDimitry Andric return; 570753f127fSDimitry Andric } 571bdd1243dSDimitry Andric object::BuildID ID(IDString.begin(), IDString.end()); 572753f127fSDimitry Andric Expected<std::string> PathOrErr = Collection.findBinaryPath(ID); 573753f127fSDimitry Andric if (Error Err = PathOrErr.takeError()) { 574753f127fSDimitry Andric consumeError(std::move(Err)); 575753f127fSDimitry Andric Request.setResponse({404, "text/plain", "Build ID not found\n"}); 576753f127fSDimitry Andric return; 577753f127fSDimitry Andric } 578753f127fSDimitry Andric streamFile(Request, *PathOrErr); 579753f127fSDimitry Andric })); 580753f127fSDimitry Andric } 581753f127fSDimitry Andric 5820eae32dcSDimitry Andric } // namespace llvm 583