xref: /openbsd-src/gnu/llvm/compiler-rt/lib/sanitizer_common/sanitizer_procmaps_common.cpp (revision 810390e339a5425391477d5d41c78d7cab2424ac)
13cab2bb3Spatrick //===-- sanitizer_procmaps_common.cpp -------------------------------------===//
23cab2bb3Spatrick //
33cab2bb3Spatrick // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
43cab2bb3Spatrick // See https://llvm.org/LICENSE.txt for license information.
53cab2bb3Spatrick // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
63cab2bb3Spatrick //
73cab2bb3Spatrick //===----------------------------------------------------------------------===//
83cab2bb3Spatrick //
93cab2bb3Spatrick // Information about the process mappings (common parts).
103cab2bb3Spatrick //===----------------------------------------------------------------------===//
113cab2bb3Spatrick 
123cab2bb3Spatrick #include "sanitizer_platform.h"
133cab2bb3Spatrick 
143cab2bb3Spatrick #if SANITIZER_FREEBSD || SANITIZER_LINUX || SANITIZER_NETBSD ||                \
15d89ec533Spatrick     SANITIZER_SOLARIS
163cab2bb3Spatrick 
173cab2bb3Spatrick #include "sanitizer_common.h"
183cab2bb3Spatrick #include "sanitizer_placement_new.h"
193cab2bb3Spatrick #include "sanitizer_procmaps.h"
203cab2bb3Spatrick 
213cab2bb3Spatrick namespace __sanitizer {
223cab2bb3Spatrick 
// Process-wide cached copy of the process-maps buffer. It is replaced by
// MemoryMappingLayout::CacheMemoryMappings() and copied into a layout object
// by MemoryMappingLayout::LoadFromCache().
233cab2bb3Spatrick static ProcSelfMapsBuff cached_proc_self_maps;
// Held while the cache is replaced or copied. Note that
// ~MemoryMappingLayout() compares against cached_proc_self_maps.data without
// taking this lock.
243cab2bb3Spatrick static StaticSpinMutex cache_lock;
253cab2bb3Spatrick 
// Maps a single character to its numeric value as a digit:
//   '0'..'9' -> 0..9, 'a'..'f' and 'A'..'F' -> 10..15.
// Returns -1 for every other character.
static int TranslateDigit(char c) {
  int value = -1;
  if ('0' <= c && c <= '9')
    value = c - '0';
  else if ('a' <= c && c <= 'f')
    value = 10 + (c - 'a');
  else if ('A' <= c && c <= 'F')
    value = 10 + (c - 'A');
  return value;
}
353cab2bb3Spatrick 
363cab2bb3Spatrick // Parse a number and promote 'p' up to the first non-digit character.
ParseNumber(const char ** p,int base)373cab2bb3Spatrick static uptr ParseNumber(const char **p, int base) {
383cab2bb3Spatrick   uptr n = 0;
393cab2bb3Spatrick   int d;
403cab2bb3Spatrick   CHECK(base >= 2 && base <= 16);
413cab2bb3Spatrick   while ((d = TranslateDigit(**p)) >= 0 && d < base) {
423cab2bb3Spatrick     n = n * base + d;
433cab2bb3Spatrick     (*p)++;
443cab2bb3Spatrick   }
453cab2bb3Spatrick   return n;
463cab2bb3Spatrick }
473cab2bb3Spatrick 
IsDecimal(char c)483cab2bb3Spatrick bool IsDecimal(char c) {
493cab2bb3Spatrick   int d = TranslateDigit(c);
503cab2bb3Spatrick   return d >= 0 && d < 10;
513cab2bb3Spatrick }
523cab2bb3Spatrick 
ParseDecimal(const char ** p)533cab2bb3Spatrick uptr ParseDecimal(const char **p) {
543cab2bb3Spatrick   return ParseNumber(p, 10);
553cab2bb3Spatrick }
563cab2bb3Spatrick 
IsHex(char c)573cab2bb3Spatrick bool IsHex(char c) {
583cab2bb3Spatrick   int d = TranslateDigit(c);
593cab2bb3Spatrick   return d >= 0 && d < 16;
603cab2bb3Spatrick }
613cab2bb3Spatrick 
ParseHex(const char ** p)623cab2bb3Spatrick uptr ParseHex(const char **p) {
633cab2bb3Spatrick   return ParseNumber(p, 16);
643cab2bb3Spatrick }
653cab2bb3Spatrick 
AddAddressRanges(LoadedModule * module)663cab2bb3Spatrick void MemoryMappedSegment::AddAddressRanges(LoadedModule *module) {
673cab2bb3Spatrick   // data_ should be unused on this platform
683cab2bb3Spatrick   CHECK(!data_);
693cab2bb3Spatrick   module->addAddressRange(start, end, IsExecutable(), IsWritable());
703cab2bb3Spatrick }
713cab2bb3Spatrick 
MemoryMappingLayout(bool cache_enabled)723cab2bb3Spatrick MemoryMappingLayout::MemoryMappingLayout(bool cache_enabled) {
733cab2bb3Spatrick   // FIXME: in the future we may want to cache the mappings on demand only.
743cab2bb3Spatrick   if (cache_enabled)
753cab2bb3Spatrick     CacheMemoryMappings();
763cab2bb3Spatrick 
773cab2bb3Spatrick   // Read maps after the cache update to capture the maps/unmaps happening in
783cab2bb3Spatrick   // the process of updating.
793cab2bb3Spatrick   ReadProcMaps(&data_.proc_self_maps);
803cab2bb3Spatrick   if (cache_enabled && data_.proc_self_maps.mmaped_size == 0)
813cab2bb3Spatrick     LoadFromCache();
823cab2bb3Spatrick 
833cab2bb3Spatrick   Reset();
843cab2bb3Spatrick }
853cab2bb3Spatrick 
Error() const863cab2bb3Spatrick bool MemoryMappingLayout::Error() const {
873cab2bb3Spatrick   return data_.current == nullptr;
883cab2bb3Spatrick }
893cab2bb3Spatrick 
~MemoryMappingLayout()903cab2bb3Spatrick MemoryMappingLayout::~MemoryMappingLayout() {
913cab2bb3Spatrick   // Only unmap the buffer if it is different from the cached one. Otherwise
923cab2bb3Spatrick   // it will be unmapped when the cache is refreshed.
933cab2bb3Spatrick   if (data_.proc_self_maps.data != cached_proc_self_maps.data)
943cab2bb3Spatrick     UnmapOrDie(data_.proc_self_maps.data, data_.proc_self_maps.mmaped_size);
953cab2bb3Spatrick }
963cab2bb3Spatrick 
Reset()973cab2bb3Spatrick void MemoryMappingLayout::Reset() {
983cab2bb3Spatrick   data_.current = data_.proc_self_maps.data;
993cab2bb3Spatrick }
1003cab2bb3Spatrick 
1013cab2bb3Spatrick // static
CacheMemoryMappings()1023cab2bb3Spatrick void MemoryMappingLayout::CacheMemoryMappings() {
1033cab2bb3Spatrick   ProcSelfMapsBuff new_proc_self_maps;
1043cab2bb3Spatrick   ReadProcMaps(&new_proc_self_maps);
1053cab2bb3Spatrick   // Don't invalidate the cache if the mappings are unavailable.
1063cab2bb3Spatrick   if (new_proc_self_maps.mmaped_size == 0)
1073cab2bb3Spatrick     return;
1083cab2bb3Spatrick   SpinMutexLock l(&cache_lock);
1093cab2bb3Spatrick   if (cached_proc_self_maps.mmaped_size)
1103cab2bb3Spatrick     UnmapOrDie(cached_proc_self_maps.data, cached_proc_self_maps.mmaped_size);
1113cab2bb3Spatrick   cached_proc_self_maps = new_proc_self_maps;
1123cab2bb3Spatrick }
1133cab2bb3Spatrick 
LoadFromCache()1143cab2bb3Spatrick void MemoryMappingLayout::LoadFromCache() {
1153cab2bb3Spatrick   SpinMutexLock l(&cache_lock);
1163cab2bb3Spatrick   if (cached_proc_self_maps.data)
1173cab2bb3Spatrick     data_.proc_self_maps = cached_proc_self_maps;
1183cab2bb3Spatrick }
1193cab2bb3Spatrick 
DumpListOfModules(InternalMmapVectorNoCtor<LoadedModule> * modules)1203cab2bb3Spatrick void MemoryMappingLayout::DumpListOfModules(
1213cab2bb3Spatrick     InternalMmapVectorNoCtor<LoadedModule> *modules) {
1223cab2bb3Spatrick   Reset();
123d89ec533Spatrick   InternalMmapVector<char> module_name(kMaxPathLength);
1243cab2bb3Spatrick   MemoryMappedSegment segment(module_name.data(), module_name.size());
1253cab2bb3Spatrick   for (uptr i = 0; Next(&segment); i++) {
1263cab2bb3Spatrick     const char *cur_name = segment.filename;
1273cab2bb3Spatrick     if (cur_name[0] == '\0')
1283cab2bb3Spatrick       continue;
1293cab2bb3Spatrick     // Don't subtract 'cur_beg' from the first entry:
1303cab2bb3Spatrick     // * If a binary is compiled w/o -pie, then the first entry in
1313cab2bb3Spatrick     //   process maps is likely the binary itself (all dynamic libs
1323cab2bb3Spatrick     //   are mapped higher in address space). For such a binary,
1333cab2bb3Spatrick     //   instruction offset in binary coincides with the actual
1343cab2bb3Spatrick     //   instruction address in virtual memory (as code section
1353cab2bb3Spatrick     //   is mapped to a fixed memory range).
1363cab2bb3Spatrick     // * If a binary is compiled with -pie, all the modules are
1373cab2bb3Spatrick     //   mapped high at address space (in particular, higher than
1383cab2bb3Spatrick     //   shadow memory of the tool), so the module can't be the
1393cab2bb3Spatrick     //   first entry.
1403cab2bb3Spatrick     uptr base_address = (i ? segment.start : 0) - segment.offset;
1413cab2bb3Spatrick     LoadedModule cur_module;
1423cab2bb3Spatrick     cur_module.set(cur_name, base_address);
1433cab2bb3Spatrick     segment.AddAddressRanges(&cur_module);
1443cab2bb3Spatrick     modules->push_back(cur_module);
1453cab2bb3Spatrick   }
1463cab2bb3Spatrick }
1473cab2bb3Spatrick 
148*810390e3Srobert #if SANITIZER_LINUX || SANITIZER_ANDROID || SANITIZER_SOLARIS || SANITIZER_NETBSD
GetMemoryProfile(fill_profile_f cb,uptr * stats)149*810390e3Srobert void GetMemoryProfile(fill_profile_f cb, uptr *stats) {
1503cab2bb3Spatrick   char *smaps = nullptr;
1513cab2bb3Spatrick   uptr smaps_cap = 0;
1523cab2bb3Spatrick   uptr smaps_len = 0;
1533cab2bb3Spatrick   if (!ReadFileToBuffer("/proc/self/smaps", &smaps, &smaps_cap, &smaps_len))
1543cab2bb3Spatrick     return;
155*810390e3Srobert   ParseUnixMemoryProfile(cb, stats, smaps, smaps_len);
156*810390e3Srobert   UnmapOrDie(smaps, smaps_cap);
157*810390e3Srobert }
158*810390e3Srobert 
ParseUnixMemoryProfile(fill_profile_f cb,uptr * stats,char * smaps,uptr smaps_len)159*810390e3Srobert void ParseUnixMemoryProfile(fill_profile_f cb, uptr *stats, char *smaps,
160*810390e3Srobert                             uptr smaps_len) {
1613cab2bb3Spatrick   uptr start = 0;
1623cab2bb3Spatrick   bool file = false;
1633cab2bb3Spatrick   const char *pos = smaps;
164*810390e3Srobert   char *end = smaps + smaps_len;
165*810390e3Srobert   if (smaps_len < 2)
166*810390e3Srobert     return;
167*810390e3Srobert   // The following parsing can crash on almost every line
168*810390e3Srobert   // in the case of malformed/truncated input.
169*810390e3Srobert   // Fixing that is hard b/c e.g. ParseDecimal does not
170*810390e3Srobert   // even accept end of the buffer and assumes well-formed input.
171*810390e3Srobert   // So instead we patch end of the input a bit,
172*810390e3Srobert   // it does not affect well-formed complete inputs.
173*810390e3Srobert   *--end = 0;
174*810390e3Srobert   *--end = '\n';
175*810390e3Srobert   while (pos < end) {
1763cab2bb3Spatrick     if (IsHex(pos[0])) {
1773cab2bb3Spatrick       start = ParseHex(&pos);
1783cab2bb3Spatrick       for (; *pos != '/' && *pos > '\n'; pos++) {}
1793cab2bb3Spatrick       file = *pos == '/';
1803cab2bb3Spatrick     } else if (internal_strncmp(pos, "Rss:", 4) == 0) {
181*810390e3Srobert       while (pos < end && !IsDecimal(*pos)) pos++;
1823cab2bb3Spatrick       uptr rss = ParseDecimal(&pos) * 1024;
183*810390e3Srobert       cb(start, rss, file, stats);
1843cab2bb3Spatrick     }
1853cab2bb3Spatrick     while (*pos++ != '\n') {}
1863cab2bb3Spatrick   }
1873cab2bb3Spatrick }
188*810390e3Srobert #endif
1893cab2bb3Spatrick 
1903cab2bb3Spatrick } // namespace __sanitizer
1913cab2bb3Spatrick 
1923cab2bb3Spatrick #endif
193