xref: /openbsd-src/gnu/llvm/compiler-rt/lib/sanitizer_common/sanitizer_symbolizer_mac.cpp (revision 810390e339a5425391477d5d41c78d7cab2424ac)
13cab2bb3Spatrick //===-- sanitizer_symbolizer_mac.cpp --------------------------------------===//
23cab2bb3Spatrick //
33cab2bb3Spatrick // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
43cab2bb3Spatrick // See https://llvm.org/LICENSE.txt for license information.
53cab2bb3Spatrick // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
63cab2bb3Spatrick //
73cab2bb3Spatrick //===----------------------------------------------------------------------===//
83cab2bb3Spatrick //
93cab2bb3Spatrick // This file is shared between various sanitizers' runtime libraries.
103cab2bb3Spatrick //
113cab2bb3Spatrick // Implementation of Mac-specific "atos" symbolizer.
123cab2bb3Spatrick //===----------------------------------------------------------------------===//
133cab2bb3Spatrick 
143cab2bb3Spatrick #include "sanitizer_platform.h"
15*810390e3Srobert #if SANITIZER_APPLE
163cab2bb3Spatrick 
173cab2bb3Spatrick #include "sanitizer_allocator_internal.h"
183cab2bb3Spatrick #include "sanitizer_mac.h"
193cab2bb3Spatrick #include "sanitizer_symbolizer_mac.h"
203cab2bb3Spatrick 
213cab2bb3Spatrick #include <dlfcn.h>
223cab2bb3Spatrick #include <errno.h>
233cab2bb3Spatrick #include <stdlib.h>
243cab2bb3Spatrick #include <sys/wait.h>
253cab2bb3Spatrick #include <unistd.h>
263cab2bb3Spatrick #include <util.h>
273cab2bb3Spatrick 
283cab2bb3Spatrick namespace __sanitizer {
293cab2bb3Spatrick 
SymbolizePC(uptr addr,SymbolizedStack * stack)303cab2bb3Spatrick bool DlAddrSymbolizer::SymbolizePC(uptr addr, SymbolizedStack *stack) {
313cab2bb3Spatrick   Dl_info info;
323cab2bb3Spatrick   int result = dladdr((const void *)addr, &info);
333cab2bb3Spatrick   if (!result) return false;
343cab2bb3Spatrick 
35d89ec533Spatrick   // Compute offset if possible. `dladdr()` doesn't always ensure that `addr >=
36d89ec533Spatrick   // sym_addr` so only compute the offset when this holds. Failure to find the
37d89ec533Spatrick   // function offset is not treated as a failure because it might still be
38d89ec533Spatrick   // possible to get the symbol name.
39d89ec533Spatrick   uptr sym_addr = reinterpret_cast<uptr>(info.dli_saddr);
40d89ec533Spatrick   if (addr >= sym_addr) {
41d89ec533Spatrick     stack->info.function_offset = addr - sym_addr;
42d89ec533Spatrick   }
43d89ec533Spatrick 
443cab2bb3Spatrick   const char *demangled = DemangleSwiftAndCXX(info.dli_sname);
453cab2bb3Spatrick   if (!demangled) return false;
463cab2bb3Spatrick   stack->info.function = internal_strdup(demangled);
473cab2bb3Spatrick   return true;
483cab2bb3Spatrick }
493cab2bb3Spatrick 
SymbolizeData(uptr addr,DataInfo * datainfo)503cab2bb3Spatrick bool DlAddrSymbolizer::SymbolizeData(uptr addr, DataInfo *datainfo) {
513cab2bb3Spatrick   Dl_info info;
523cab2bb3Spatrick   int result = dladdr((const void *)addr, &info);
533cab2bb3Spatrick   if (!result) return false;
543cab2bb3Spatrick   const char *demangled = DemangleSwiftAndCXX(info.dli_sname);
553cab2bb3Spatrick   datainfo->name = internal_strdup(demangled);
563cab2bb3Spatrick   datainfo->start = (uptr)info.dli_saddr;
573cab2bb3Spatrick   return true;
583cab2bb3Spatrick }
593cab2bb3Spatrick 
60d89ec533Spatrick class AtosSymbolizerProcess final : public SymbolizerProcess {
613cab2bb3Spatrick  public:
AtosSymbolizerProcess(const char * path)621f9cb04fSpatrick   explicit AtosSymbolizerProcess(const char *path)
633cab2bb3Spatrick       : SymbolizerProcess(path, /*use_posix_spawn*/ true) {
641f9cb04fSpatrick     pid_str_[0] = '\0';
651f9cb04fSpatrick   }
661f9cb04fSpatrick 
673cab2bb3Spatrick  private:
StartSymbolizerSubprocess()683cab2bb3Spatrick   bool StartSymbolizerSubprocess() override {
691f9cb04fSpatrick     // Put the string command line argument in the object so that it outlives
701f9cb04fSpatrick     // the call to GetArgV.
71*810390e3Srobert     internal_snprintf(pid_str_, sizeof(pid_str_), "%d", (int)internal_getpid());
721f9cb04fSpatrick 
73*810390e3Srobert     // Configure sandbox before starting atos process.
743cab2bb3Spatrick     return SymbolizerProcess::StartSymbolizerSubprocess();
753cab2bb3Spatrick   }
763cab2bb3Spatrick 
ReachedEndOfOutput(const char * buffer,uptr length) const773cab2bb3Spatrick   bool ReachedEndOfOutput(const char *buffer, uptr length) const override {
783cab2bb3Spatrick     return (length >= 1 && buffer[length - 1] == '\n');
793cab2bb3Spatrick   }
803cab2bb3Spatrick 
GetArgV(const char * path_to_binary,const char * (& argv)[kArgVMax]) const813cab2bb3Spatrick   void GetArgV(const char *path_to_binary,
823cab2bb3Spatrick                const char *(&argv)[kArgVMax]) const override {
833cab2bb3Spatrick     int i = 0;
843cab2bb3Spatrick     argv[i++] = path_to_binary;
853cab2bb3Spatrick     argv[i++] = "-p";
863cab2bb3Spatrick     argv[i++] = &pid_str_[0];
871f9cb04fSpatrick     if (GetMacosAlignedVersion() == MacosVersion(10, 9)) {
883cab2bb3Spatrick       // On Mavericks atos prints a deprecation warning which we suppress by
893cab2bb3Spatrick       // passing -d. The warning isn't present on other OSX versions, even the
903cab2bb3Spatrick       // newer ones.
913cab2bb3Spatrick       argv[i++] = "-d";
923cab2bb3Spatrick     }
933cab2bb3Spatrick     argv[i++] = nullptr;
94*810390e3Srobert     CHECK_LE(i, kArgVMax);
953cab2bb3Spatrick   }
963cab2bb3Spatrick 
973cab2bb3Spatrick   char pid_str_[16];
983cab2bb3Spatrick };
993cab2bb3Spatrick 
1001f9cb04fSpatrick #undef K_ATOS_ENV_VAR
1011f9cb04fSpatrick 
ParseCommandOutput(const char * str,uptr addr,char ** out_name,char ** out_module,char ** out_file,uptr * line,uptr * start_address)1023cab2bb3Spatrick static bool ParseCommandOutput(const char *str, uptr addr, char **out_name,
1033cab2bb3Spatrick                                char **out_module, char **out_file, uptr *line,
1043cab2bb3Spatrick                                uptr *start_address) {
1053cab2bb3Spatrick   // Trim ending newlines.
1063cab2bb3Spatrick   char *trim;
1073cab2bb3Spatrick   ExtractTokenUpToDelimiter(str, "\n", &trim);
1083cab2bb3Spatrick 
1093cab2bb3Spatrick   // The line from `atos` is in one of these formats:
1103cab2bb3Spatrick   //   myfunction (in library.dylib) (sourcefile.c:17)
1113cab2bb3Spatrick   //   myfunction (in library.dylib) + 0x1fe
1123cab2bb3Spatrick   //   myfunction (in library.dylib) + 15
1133cab2bb3Spatrick   //   0xdeadbeef (in library.dylib) + 0x1fe
1143cab2bb3Spatrick   //   0xdeadbeef (in library.dylib) + 15
1153cab2bb3Spatrick   //   0xdeadbeef (in library.dylib)
1163cab2bb3Spatrick   //   0xdeadbeef
1173cab2bb3Spatrick 
1183cab2bb3Spatrick   const char *rest = trim;
1193cab2bb3Spatrick   char *symbol_name;
1203cab2bb3Spatrick   rest = ExtractTokenUpToDelimiter(rest, " (in ", &symbol_name);
1213cab2bb3Spatrick   if (rest[0] == '\0') {
1223cab2bb3Spatrick     InternalFree(symbol_name);
1233cab2bb3Spatrick     InternalFree(trim);
1243cab2bb3Spatrick     return false;
1253cab2bb3Spatrick   }
1263cab2bb3Spatrick 
1273cab2bb3Spatrick   if (internal_strncmp(symbol_name, "0x", 2) != 0)
1283cab2bb3Spatrick     *out_name = symbol_name;
1293cab2bb3Spatrick   else
1303cab2bb3Spatrick     InternalFree(symbol_name);
1313cab2bb3Spatrick   rest = ExtractTokenUpToDelimiter(rest, ") ", out_module);
1323cab2bb3Spatrick 
1333cab2bb3Spatrick   if (rest[0] == '(') {
1343cab2bb3Spatrick     if (out_file) {
1353cab2bb3Spatrick       rest++;
1363cab2bb3Spatrick       rest = ExtractTokenUpToDelimiter(rest, ":", out_file);
1373cab2bb3Spatrick       char *extracted_line_number;
1383cab2bb3Spatrick       rest = ExtractTokenUpToDelimiter(rest, ")", &extracted_line_number);
1393cab2bb3Spatrick       if (line) *line = (uptr)internal_atoll(extracted_line_number);
1403cab2bb3Spatrick       InternalFree(extracted_line_number);
1413cab2bb3Spatrick     }
1423cab2bb3Spatrick   } else if (rest[0] == '+') {
1433cab2bb3Spatrick     rest += 2;
1443cab2bb3Spatrick     uptr offset = internal_atoll(rest);
1453cab2bb3Spatrick     if (start_address) *start_address = addr - offset;
1463cab2bb3Spatrick   }
1473cab2bb3Spatrick 
1483cab2bb3Spatrick   InternalFree(trim);
1493cab2bb3Spatrick   return true;
1503cab2bb3Spatrick }
1513cab2bb3Spatrick 
AtosSymbolizer(const char * path,LowLevelAllocator * allocator)1523cab2bb3Spatrick AtosSymbolizer::AtosSymbolizer(const char *path, LowLevelAllocator *allocator)
1531f9cb04fSpatrick     : process_(new (*allocator) AtosSymbolizerProcess(path)) {}
1543cab2bb3Spatrick 
SymbolizePC(uptr addr,SymbolizedStack * stack)1553cab2bb3Spatrick bool AtosSymbolizer::SymbolizePC(uptr addr, SymbolizedStack *stack) {
1563cab2bb3Spatrick   if (!process_) return false;
1573cab2bb3Spatrick   if (addr == 0) return false;
1583cab2bb3Spatrick   char command[32];
1593cab2bb3Spatrick   internal_snprintf(command, sizeof(command), "0x%zx\n", addr);
1603cab2bb3Spatrick   const char *buf = process_->SendCommand(command);
1613cab2bb3Spatrick   if (!buf) return false;
1623cab2bb3Spatrick   uptr line;
1633cab2bb3Spatrick   uptr start_address = AddressInfo::kUnknown;
1643cab2bb3Spatrick   if (!ParseCommandOutput(buf, addr, &stack->info.function, &stack->info.module,
1653cab2bb3Spatrick                           &stack->info.file, &line, &start_address)) {
1663cab2bb3Spatrick     process_ = nullptr;
1673cab2bb3Spatrick     return false;
1683cab2bb3Spatrick   }
1693cab2bb3Spatrick   stack->info.line = (int)line;
1703cab2bb3Spatrick 
1713cab2bb3Spatrick   if (start_address == AddressInfo::kUnknown) {
1723cab2bb3Spatrick     // Fallback to dladdr() to get function start address if atos doesn't report
1733cab2bb3Spatrick     // it.
1743cab2bb3Spatrick     Dl_info info;
1753cab2bb3Spatrick     int result = dladdr((const void *)addr, &info);
1763cab2bb3Spatrick     if (result)
1773cab2bb3Spatrick       start_address = reinterpret_cast<uptr>(info.dli_saddr);
1783cab2bb3Spatrick   }
1793cab2bb3Spatrick 
180d89ec533Spatrick   // Only assign to `function_offset` if we were able to get the function's
181d89ec533Spatrick   // start address and we got a sensible `start_address` (dladdr doesn't always
182d89ec533Spatrick   // ensure that `addr >= sym_addr`).
183d89ec533Spatrick   if (start_address != AddressInfo::kUnknown && addr >= start_address) {
1843cab2bb3Spatrick     stack->info.function_offset = addr - start_address;
1853cab2bb3Spatrick   }
1863cab2bb3Spatrick   return true;
1873cab2bb3Spatrick }
1883cab2bb3Spatrick 
SymbolizeData(uptr addr,DataInfo * info)1893cab2bb3Spatrick bool AtosSymbolizer::SymbolizeData(uptr addr, DataInfo *info) {
1903cab2bb3Spatrick   if (!process_) return false;
1913cab2bb3Spatrick   char command[32];
1923cab2bb3Spatrick   internal_snprintf(command, sizeof(command), "0x%zx\n", addr);
1933cab2bb3Spatrick   const char *buf = process_->SendCommand(command);
1943cab2bb3Spatrick   if (!buf) return false;
1953cab2bb3Spatrick   if (!ParseCommandOutput(buf, addr, &info->name, &info->module, nullptr,
1963cab2bb3Spatrick                           nullptr, &info->start)) {
1973cab2bb3Spatrick     process_ = nullptr;
1983cab2bb3Spatrick     return false;
1993cab2bb3Spatrick   }
2003cab2bb3Spatrick   return true;
2013cab2bb3Spatrick }
2023cab2bb3Spatrick 
2033cab2bb3Spatrick }  // namespace __sanitizer
2043cab2bb3Spatrick 
205*810390e3Srobert #endif  // SANITIZER_APPLE
206