xref: /openbsd-src/gnu/llvm/compiler-rt/lib/fuzzer/FuzzerUtil.cpp (revision 810390e339a5425391477d5d41c78d7cab2424ac)
13cab2bb3Spatrick //===- FuzzerUtil.cpp - Misc utils ----------------------------------------===//
23cab2bb3Spatrick //
33cab2bb3Spatrick // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
43cab2bb3Spatrick // See https://llvm.org/LICENSE.txt for license information.
53cab2bb3Spatrick // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
63cab2bb3Spatrick //
73cab2bb3Spatrick //===----------------------------------------------------------------------===//
83cab2bb3Spatrick // Misc utils.
93cab2bb3Spatrick //===----------------------------------------------------------------------===//
103cab2bb3Spatrick 
113cab2bb3Spatrick #include "FuzzerUtil.h"
123cab2bb3Spatrick #include "FuzzerIO.h"
133cab2bb3Spatrick #include "FuzzerInternal.h"
143cab2bb3Spatrick #include <cassert>
153cab2bb3Spatrick #include <chrono>
163cab2bb3Spatrick #include <cstring>
173cab2bb3Spatrick #include <errno.h>
183cab2bb3Spatrick #include <mutex>
193cab2bb3Spatrick #include <signal.h>
203cab2bb3Spatrick #include <sstream>
213cab2bb3Spatrick #include <stdio.h>
223cab2bb3Spatrick #include <sys/types.h>
233cab2bb3Spatrick #include <thread>
243cab2bb3Spatrick 
253cab2bb3Spatrick namespace fuzzer {
263cab2bb3Spatrick 
PrintHexArray(const uint8_t * Data,size_t Size,const char * PrintAfter)273cab2bb3Spatrick void PrintHexArray(const uint8_t *Data, size_t Size,
283cab2bb3Spatrick                    const char *PrintAfter) {
293cab2bb3Spatrick   for (size_t i = 0; i < Size; i++)
303cab2bb3Spatrick     Printf("0x%x,", (unsigned)Data[i]);
313cab2bb3Spatrick   Printf("%s", PrintAfter);
323cab2bb3Spatrick }
333cab2bb3Spatrick 
Print(const Unit & v,const char * PrintAfter)343cab2bb3Spatrick void Print(const Unit &v, const char *PrintAfter) {
353cab2bb3Spatrick   PrintHexArray(v.data(), v.size(), PrintAfter);
363cab2bb3Spatrick }
373cab2bb3Spatrick 
PrintASCIIByte(uint8_t Byte)383cab2bb3Spatrick void PrintASCIIByte(uint8_t Byte) {
393cab2bb3Spatrick   if (Byte == '\\')
403cab2bb3Spatrick     Printf("\\\\");
413cab2bb3Spatrick   else if (Byte == '"')
423cab2bb3Spatrick     Printf("\\\"");
433cab2bb3Spatrick   else if (Byte >= 32 && Byte < 127)
443cab2bb3Spatrick     Printf("%c", Byte);
453cab2bb3Spatrick   else
46*810390e3Srobert     Printf("\\%03o", Byte);
473cab2bb3Spatrick }
483cab2bb3Spatrick 
PrintASCII(const uint8_t * Data,size_t Size,const char * PrintAfter)493cab2bb3Spatrick void PrintASCII(const uint8_t *Data, size_t Size, const char *PrintAfter) {
503cab2bb3Spatrick   for (size_t i = 0; i < Size; i++)
513cab2bb3Spatrick     PrintASCIIByte(Data[i]);
523cab2bb3Spatrick   Printf("%s", PrintAfter);
533cab2bb3Spatrick }
543cab2bb3Spatrick 
PrintASCII(const Unit & U,const char * PrintAfter)553cab2bb3Spatrick void PrintASCII(const Unit &U, const char *PrintAfter) {
563cab2bb3Spatrick   PrintASCII(U.data(), U.size(), PrintAfter);
573cab2bb3Spatrick }
583cab2bb3Spatrick 
// Rewrites Data[0..Size) in place: the top bit of every byte is cleared, and
// any resulting byte that is neither isspace() nor isprint() becomes ' '.
// Returns true if at least one byte was modified.
bool ToASCII(uint8_t *Data, size_t Size) {
  bool Modified = false;
  for (size_t Idx = 0; Idx != Size; ++Idx) {
    const uint8_t Old = Data[Idx];
    const uint8_t Masked = static_cast<uint8_t>(Old & 127);
    const bool Acceptable = isspace(Masked) || isprint(Masked);
    const uint8_t Replacement = Acceptable ? Masked : static_cast<uint8_t>(' ');
    if (Replacement != Old)
      Modified = true;
    Data[Idx] = Replacement;
  }
  return Modified;
}
723cab2bb3Spatrick 
IsASCII(const Unit & U)733cab2bb3Spatrick bool IsASCII(const Unit &U) { return IsASCII(U.data(), U.size()); }
743cab2bb3Spatrick 
// Returns true when every one of the Size bytes at Data is accepted by
// isprint() or isspace(); returns false at the first byte that is not.
// An empty range yields true.
bool IsASCII(const uint8_t *Data, size_t Size) {
  size_t Idx = 0;
  while (Idx < Size) {
    const uint8_t Ch = Data[Idx++];
    if (isprint(Ch))
      continue;
    if (isspace(Ch))
      continue;
    return false;
  }
  return true;
}
803cab2bb3Spatrick 
ParseOneDictionaryEntry(const std::string & Str,Unit * U)813cab2bb3Spatrick bool ParseOneDictionaryEntry(const std::string &Str, Unit *U) {
823cab2bb3Spatrick   U->clear();
833cab2bb3Spatrick   if (Str.empty()) return false;
843cab2bb3Spatrick   size_t L = 0, R = Str.size() - 1;  // We are parsing the range [L,R].
853cab2bb3Spatrick   // Skip spaces from both sides.
863cab2bb3Spatrick   while (L < R && isspace(Str[L])) L++;
873cab2bb3Spatrick   while (R > L && isspace(Str[R])) R--;
883cab2bb3Spatrick   if (R - L < 2) return false;
893cab2bb3Spatrick   // Check the closing "
903cab2bb3Spatrick   if (Str[R] != '"') return false;
913cab2bb3Spatrick   R--;
923cab2bb3Spatrick   // Find the opening "
933cab2bb3Spatrick   while (L < R && Str[L] != '"') L++;
943cab2bb3Spatrick   if (L >= R) return false;
953cab2bb3Spatrick   assert(Str[L] == '\"');
963cab2bb3Spatrick   L++;
973cab2bb3Spatrick   assert(L <= R);
983cab2bb3Spatrick   for (size_t Pos = L; Pos <= R; Pos++) {
993cab2bb3Spatrick     uint8_t V = (uint8_t)Str[Pos];
1003cab2bb3Spatrick     if (!isprint(V) && !isspace(V)) return false;
1013cab2bb3Spatrick     if (V =='\\') {
1023cab2bb3Spatrick       // Handle '\\'
1033cab2bb3Spatrick       if (Pos + 1 <= R && (Str[Pos + 1] == '\\' || Str[Pos + 1] == '"')) {
1043cab2bb3Spatrick         U->push_back(Str[Pos + 1]);
1053cab2bb3Spatrick         Pos++;
1063cab2bb3Spatrick         continue;
1073cab2bb3Spatrick       }
1083cab2bb3Spatrick       // Handle '\xAB'
1093cab2bb3Spatrick       if (Pos + 3 <= R && Str[Pos + 1] == 'x'
1103cab2bb3Spatrick            && isxdigit(Str[Pos + 2]) && isxdigit(Str[Pos + 3])) {
1113cab2bb3Spatrick         char Hex[] = "0xAA";
1123cab2bb3Spatrick         Hex[2] = Str[Pos + 2];
1133cab2bb3Spatrick         Hex[3] = Str[Pos + 3];
114d89ec533Spatrick         U->push_back(static_cast<uint8_t>(strtol(Hex, nullptr, 16)));
1153cab2bb3Spatrick         Pos += 3;
1163cab2bb3Spatrick         continue;
1173cab2bb3Spatrick       }
1183cab2bb3Spatrick       return false;  // Invalid escape.
1193cab2bb3Spatrick     } else {
1203cab2bb3Spatrick       // Any other character.
1213cab2bb3Spatrick       U->push_back(V);
1223cab2bb3Spatrick     }
1233cab2bb3Spatrick   }
1243cab2bb3Spatrick   return true;
1253cab2bb3Spatrick }
1263cab2bb3Spatrick 
ParseDictionaryFile(const std::string & Text,std::vector<Unit> * Units)127*810390e3Srobert bool ParseDictionaryFile(const std::string &Text, std::vector<Unit> *Units) {
1283cab2bb3Spatrick   if (Text.empty()) {
1293cab2bb3Spatrick     Printf("ParseDictionaryFile: file does not exist or is empty\n");
1303cab2bb3Spatrick     return false;
1313cab2bb3Spatrick   }
1323cab2bb3Spatrick   std::istringstream ISS(Text);
1333cab2bb3Spatrick   Units->clear();
1343cab2bb3Spatrick   Unit U;
1353cab2bb3Spatrick   int LineNo = 0;
1363cab2bb3Spatrick   std::string S;
1373cab2bb3Spatrick   while (std::getline(ISS, S, '\n')) {
1383cab2bb3Spatrick     LineNo++;
1393cab2bb3Spatrick     size_t Pos = 0;
1403cab2bb3Spatrick     while (Pos < S.size() && isspace(S[Pos])) Pos++;  // Skip spaces.
1413cab2bb3Spatrick     if (Pos == S.size()) continue;  // Empty line.
1423cab2bb3Spatrick     if (S[Pos] == '#') continue;  // Comment line.
1433cab2bb3Spatrick     if (ParseOneDictionaryEntry(S, &U)) {
1443cab2bb3Spatrick       Units->push_back(U);
1453cab2bb3Spatrick     } else {
1463cab2bb3Spatrick       Printf("ParseDictionaryFile: error in line %d\n\t\t%s\n", LineNo,
1473cab2bb3Spatrick              S.c_str());
1483cab2bb3Spatrick       return false;
1493cab2bb3Spatrick     }
1503cab2bb3Spatrick   }
1513cab2bb3Spatrick   return true;
1523cab2bb3Spatrick }
1533cab2bb3Spatrick 
1541f9cb04fSpatrick // Code duplicated (and tested) in llvm/include/llvm/Support/Base64.h
Base64(const Unit & U)1553cab2bb3Spatrick std::string Base64(const Unit &U) {
1563cab2bb3Spatrick   static const char Table[] = "ABCDEFGHIJKLMNOPQRSTUVWXYZ"
1573cab2bb3Spatrick                               "abcdefghijklmnopqrstuvwxyz"
1583cab2bb3Spatrick                               "0123456789+/";
1591f9cb04fSpatrick   std::string Buffer;
1601f9cb04fSpatrick   Buffer.resize(((U.size() + 2) / 3) * 4);
1611f9cb04fSpatrick 
1621f9cb04fSpatrick   size_t i = 0, j = 0;
1631f9cb04fSpatrick   for (size_t n = U.size() / 3 * 3; i < n; i += 3, j += 4) {
1641f9cb04fSpatrick     uint32_t x = ((unsigned char)U[i] << 16) | ((unsigned char)U[i + 1] << 8) |
1651f9cb04fSpatrick                  (unsigned char)U[i + 2];
1661f9cb04fSpatrick     Buffer[j + 0] = Table[(x >> 18) & 63];
1671f9cb04fSpatrick     Buffer[j + 1] = Table[(x >> 12) & 63];
1681f9cb04fSpatrick     Buffer[j + 2] = Table[(x >> 6) & 63];
1691f9cb04fSpatrick     Buffer[j + 3] = Table[x & 63];
1703cab2bb3Spatrick   }
1713cab2bb3Spatrick   if (i + 1 == U.size()) {
1721f9cb04fSpatrick     uint32_t x = ((unsigned char)U[i] << 16);
1731f9cb04fSpatrick     Buffer[j + 0] = Table[(x >> 18) & 63];
1741f9cb04fSpatrick     Buffer[j + 1] = Table[(x >> 12) & 63];
1751f9cb04fSpatrick     Buffer[j + 2] = '=';
1761f9cb04fSpatrick     Buffer[j + 3] = '=';
1773cab2bb3Spatrick   } else if (i + 2 == U.size()) {
1781f9cb04fSpatrick     uint32_t x = ((unsigned char)U[i] << 16) | ((unsigned char)U[i + 1] << 8);
1791f9cb04fSpatrick     Buffer[j + 0] = Table[(x >> 18) & 63];
1801f9cb04fSpatrick     Buffer[j + 1] = Table[(x >> 12) & 63];
1811f9cb04fSpatrick     Buffer[j + 2] = Table[(x >> 6) & 63];
1821f9cb04fSpatrick     Buffer[j + 3] = '=';
1833cab2bb3Spatrick   }
1841f9cb04fSpatrick   return Buffer;
1853cab2bb3Spatrick }
1863cab2bb3Spatrick 
1873cab2bb3Spatrick static std::mutex SymbolizeMutex;
1883cab2bb3Spatrick 
DescribePC(const char * SymbolizedFMT,uintptr_t PC)1893cab2bb3Spatrick std::string DescribePC(const char *SymbolizedFMT, uintptr_t PC) {
1903cab2bb3Spatrick   std::unique_lock<std::mutex> l(SymbolizeMutex, std::try_to_lock);
1913cab2bb3Spatrick   if (!EF->__sanitizer_symbolize_pc || !l.owns_lock())
1923cab2bb3Spatrick     return "<can not symbolize>";
1933cab2bb3Spatrick   char PcDescr[1024] = {};
1943cab2bb3Spatrick   EF->__sanitizer_symbolize_pc(reinterpret_cast<void*>(PC),
1953cab2bb3Spatrick                                SymbolizedFMT, PcDescr, sizeof(PcDescr));
1963cab2bb3Spatrick   PcDescr[sizeof(PcDescr) - 1] = 0;  // Just in case.
1973cab2bb3Spatrick   return PcDescr;
1983cab2bb3Spatrick }
1993cab2bb3Spatrick 
PrintPC(const char * SymbolizedFMT,const char * FallbackFMT,uintptr_t PC)2003cab2bb3Spatrick void PrintPC(const char *SymbolizedFMT, const char *FallbackFMT, uintptr_t PC) {
2013cab2bb3Spatrick   if (EF->__sanitizer_symbolize_pc)
2023cab2bb3Spatrick     Printf("%s", DescribePC(SymbolizedFMT, PC).c_str());
2033cab2bb3Spatrick   else
2043cab2bb3Spatrick     Printf(FallbackFMT, PC);
2053cab2bb3Spatrick }
2063cab2bb3Spatrick 
PrintStackTrace()2073cab2bb3Spatrick void PrintStackTrace() {
2083cab2bb3Spatrick   std::unique_lock<std::mutex> l(SymbolizeMutex, std::try_to_lock);
2093cab2bb3Spatrick   if (EF->__sanitizer_print_stack_trace && l.owns_lock())
2103cab2bb3Spatrick     EF->__sanitizer_print_stack_trace();
2113cab2bb3Spatrick }
2123cab2bb3Spatrick 
PrintMemoryProfile()2133cab2bb3Spatrick void PrintMemoryProfile() {
2143cab2bb3Spatrick   std::unique_lock<std::mutex> l(SymbolizeMutex, std::try_to_lock);
2153cab2bb3Spatrick   if (EF->__sanitizer_print_memory_profile && l.owns_lock())
2163cab2bb3Spatrick     EF->__sanitizer_print_memory_profile(95, 8);
2173cab2bb3Spatrick }
2183cab2bb3Spatrick 
NumberOfCpuCores()2193cab2bb3Spatrick unsigned NumberOfCpuCores() {
2203cab2bb3Spatrick   unsigned N = std::thread::hardware_concurrency();
2213cab2bb3Spatrick   if (!N) {
2223cab2bb3Spatrick     Printf("WARNING: std::thread::hardware_concurrency not well defined for "
2233cab2bb3Spatrick            "your platform. Assuming CPU count of 1.\n");
2243cab2bb3Spatrick     N = 1;
2253cab2bb3Spatrick   }
2263cab2bb3Spatrick   return N;
2273cab2bb3Spatrick }
2283cab2bb3Spatrick 
// Folds the Size bytes at Data into a 64-bit value: starting from Initial,
// each byte updates the state as State = State * 11 + byte (unsigned 64-bit
// arithmetic). With Size == 0 the result is Initial.
uint64_t SimpleFastHash(const void *Data, size_t Size, uint64_t Initial) {
  const uint8_t *Cursor = static_cast<const uint8_t *>(Data);
  uint64_t Hash = Initial;
  for (size_t Remaining = Size; Remaining != 0; --Remaining) {
    Hash = Hash * 11 + *Cursor;
    ++Cursor;
  }
  return Hash;
}
2363cab2bb3Spatrick 
2373cab2bb3Spatrick }  // namespace fuzzer
238