//===-- FuzzerInterceptors.cpp --------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
// Intercept certain libc functions to aid fuzzing.
// Linked only when other RTs that define their own interceptors are not linked.
//===----------------------------------------------------------------------===//
11*d89ec533Spatrick
12*d89ec533Spatrick #include "FuzzerPlatform.h"
13*d89ec533Spatrick
14*d89ec533Spatrick #if LIBFUZZER_LINUX
15*d89ec533Spatrick
// Return address of the function this is expanded in; the interceptors pass
// it to the weak hooks as the PC of the intercepted call.
#define GET_CALLER_PC() __builtin_return_address(0)

// PTR_TO_REAL(x) -> real_x                  name of the pointer variable
// REAL(x)        -> __interception::real_x  qualified access to that pointer
// FUNC_TYPE(x)   -> x_type                  name of the function-pointer typedef
#define PTR_TO_REAL(x) real_##x
#define REAL(x) __interception::PTR_TO_REAL(x)
#define FUNC_TYPE(x) x##_type

// Emits the typedef `<func>_type` for a pointer to
// `ret_type (*)(__VA_ARGS__)` and defines the variable
// `__interception::real_<func>` of that type.
#define DEFINE_REAL(ret_type, func, ...)                                       \
  typedef ret_type (*FUNC_TYPE(func))(__VA_ARGS__);                            \
  namespace __interception {                                                   \
  FUNC_TYPE(func) PTR_TO_REAL(func);                                           \
  }
26*d89ec533Spatrick
27*d89ec533Spatrick #include <cassert>
28*d89ec533Spatrick #include <cstddef> // for size_t
29*d89ec533Spatrick #include <cstdint>
30*d89ec533Spatrick #include <dlfcn.h> // for dlsym()
31*d89ec533Spatrick
// Resolves the address of the real implementation of `name`.
//
// `wrapper_addr` is the address of our own interceptor for `name`; it is only
// used to detect a lookup that resolved back to the interceptor itself.
// Returns nullptr when no usable definition was found.
static void *getFuncAddr(const char *name, uintptr_t wrapper_addr) {
  // Preferred: the next definition after this one in the search order.
  if (void *next = dlsym(RTLD_NEXT, name))
    return next;

  // If the lookup using RTLD_NEXT failed, the sanitizer runtime library is
  // later in the library search order than the DSO that we are trying to
  // intercept, which means that we cannot intercept this function. We still
  // want the address of the real definition, though, so look it up using
  // RTLD_DEFAULT.
  void *fallback = dlsym(RTLD_DEFAULT, name);

  // In case `name' is not loaded, dlsym ends up finding the actual wrapper.
  // We don't want to intercept the wrapper and have it point to itself.
  const bool resolvedToWrapper =
      reinterpret_cast<uintptr_t>(fallback) == wrapper_addr;
  return resolvedToWrapper ? nullptr : fallback;
}
49*d89ec533Spatrick
// Non-zero once fuzzerInit() has finished assigning the REAL(...) pointers.
static int FuzzerInited = 0;
// True only while fuzzerInit() is in the middle of assigning them.
static bool FuzzerInitIsRunning = false;

// Defined at the end of the file, after the interceptors whose addresses it
// takes.
static void fuzzerInit();
54*d89ec533Spatrick
ensureFuzzerInited()55*d89ec533Spatrick static void ensureFuzzerInited() {
56*d89ec533Spatrick assert(!FuzzerInitIsRunning);
57*d89ec533Spatrick if (!FuzzerInited) {
58*d89ec533Spatrick fuzzerInit();
59*d89ec533Spatrick }
60*d89ec533Spatrick }
61*d89ec533Spatrick
// Shared implementation behind internal_strcmp() and internal_strncmp().
//
// Compares the NUL-terminated strings `s1` and `s2` character by character.
// When `strncmp` is true at most `n` characters are examined; when it is
// false `n` is ignored. Returns -1, 0 or 1.
static int internal_strcmp_strncmp(const char *s1, const char *s2, bool strncmp,
                                   size_t n) {
  for (size_t remaining = n;; ++s1, ++s2) {
    if (strncmp) {
      // Budget exhausted: everything examined so far was equal.
      if (remaining == 0)
        return 0;
      --remaining;
    }
    const unsigned lhs = *s1;
    const unsigned rhs = *s2;
    if (lhs != rhs)
      return lhs < rhs ? -1 : 1;
    // Both strings ended at the same position.
    if (lhs == 0)
      return 0;
  }
}
82*d89ec533Spatrick
internal_strncmp(const char * s1,const char * s2,size_t n)83*d89ec533Spatrick static int internal_strncmp(const char *s1, const char *s2, size_t n) {
84*d89ec533Spatrick return internal_strcmp_strncmp(s1, s2, true, n);
85*d89ec533Spatrick }
86*d89ec533Spatrick
internal_strcmp(const char * s1,const char * s2)87*d89ec533Spatrick static int internal_strcmp(const char *s1, const char *s2) {
88*d89ec533Spatrick return internal_strcmp_strncmp(s1, s2, false, 0);
89*d89ec533Spatrick }
90*d89ec533Spatrick
// Local memcmp: compares the first `n` bytes of `s1` and `s2` as unsigned
// bytes. Returns -1 or 1 at the first differing byte, 0 if there is none.
static int internal_memcmp(const void *s1, const void *s2, size_t n) {
  const auto *lhs = static_cast<const uint8_t *>(s1);
  const auto *rhs = static_cast<const uint8_t *>(s2);
  size_t idx = 0;
  while (idx != n) {
    const uint8_t a = lhs[idx];
    const uint8_t b = rhs[idx];
    if (a != b)
      return a < b ? -1 : 1;
    ++idx;
  }
  return 0;
}
99*d89ec533Spatrick
// Local strlen: number of characters in `s` before the terminating NUL.
static size_t internal_strlen(const char *s) {
  const char *cursor = s;
  while (*cursor != '\0')
    ++cursor;
  return static_cast<size_t>(cursor - s);
}
106*d89ec533Spatrick
internal_strstr(const char * haystack,const char * needle)107*d89ec533Spatrick static char *internal_strstr(const char *haystack, const char *needle) {
108*d89ec533Spatrick // This is O(N^2), but we are not using it in hot places.
109*d89ec533Spatrick size_t len1 = internal_strlen(haystack);
110*d89ec533Spatrick size_t len2 = internal_strlen(needle);
111*d89ec533Spatrick if (len1 < len2)
112*d89ec533Spatrick return nullptr;
113*d89ec533Spatrick for (size_t pos = 0; pos <= len1 - len2; pos++) {
114*d89ec533Spatrick if (internal_memcmp(haystack + pos, needle, len2) == 0)
115*d89ec533Spatrick return const_cast<char *>(haystack) + pos;
116*d89ec533Spatrick }
117*d89ec533Spatrick return nullptr;
118*d89ec533Spatrick }
119*d89ec533Spatrick
120*d89ec533Spatrick extern "C" {
121*d89ec533Spatrick
// Weak hooks forward-declared to avoid dependency on
// <sanitizer/common_interface_defs.h>.
// Each hook receives the caller PC, the arguments of the intercepted call and
// the value that call returned.

// Memory and string comparisons.
void __sanitizer_weak_hook_memcmp(void *called_pc, const void *s1,
                                  const void *s2, size_t n, int result);
void __sanitizer_weak_hook_strncmp(void *called_pc, const char *s1,
                                   const char *s2, size_t n, int result);
void __sanitizer_weak_hook_strncasecmp(void *called_pc, const char *s1,
                                       const char *s2, size_t n, int result);
void __sanitizer_weak_hook_strcmp(void *called_pc, const char *s1,
                                  const char *s2, int result);
void __sanitizer_weak_hook_strcasecmp(void *called_pc, const char *s1,
                                      const char *s2, int result);

// Substring and sub-buffer searches.
void __sanitizer_weak_hook_strstr(void *called_pc, const char *s1,
                                  const char *s2, char *result);
void __sanitizer_weak_hook_strcasestr(void *called_pc, const char *s1,
                                      const char *s2, char *result);
void __sanitizer_weak_hook_memmem(void *called_pc, const void *s1, size_t len1,
                                  const void *s2, size_t len2, void *result);
140*d89ec533Spatrick
DEFINE_REAL(int,bcmp,const void *,const void *,size_t)141*d89ec533Spatrick DEFINE_REAL(int, bcmp, const void *, const void *, size_t)
142*d89ec533Spatrick DEFINE_REAL(int, memcmp, const void *, const void *, size_t)
143*d89ec533Spatrick DEFINE_REAL(int, strncmp, const char *, const char *, size_t)
144*d89ec533Spatrick DEFINE_REAL(int, strcmp, const char *, const char *)
145*d89ec533Spatrick DEFINE_REAL(int, strncasecmp, const char *, const char *, size_t)
146*d89ec533Spatrick DEFINE_REAL(int, strcasecmp, const char *, const char *)
147*d89ec533Spatrick DEFINE_REAL(char *, strstr, const char *, const char *)
148*d89ec533Spatrick DEFINE_REAL(char *, strcasestr, const char *, const char *)
149*d89ec533Spatrick DEFINE_REAL(void *, memmem, const void *, size_t, const void *, size_t)
150*d89ec533Spatrick
151*d89ec533Spatrick ATTRIBUTE_INTERFACE int bcmp(const char *s1, const char *s2, size_t n) {
152*d89ec533Spatrick if (!FuzzerInited)
153*d89ec533Spatrick return internal_memcmp(s1, s2, n);
154*d89ec533Spatrick int result = REAL(bcmp)(s1, s2, n);
155*d89ec533Spatrick __sanitizer_weak_hook_memcmp(GET_CALLER_PC(), s1, s2, n, result);
156*d89ec533Spatrick return result;
157*d89ec533Spatrick }
158*d89ec533Spatrick
memcmp(const void * s1,const void * s2,size_t n)159*d89ec533Spatrick ATTRIBUTE_INTERFACE int memcmp(const void *s1, const void *s2, size_t n) {
160*d89ec533Spatrick if (!FuzzerInited)
161*d89ec533Spatrick return internal_memcmp(s1, s2, n);
162*d89ec533Spatrick int result = REAL(memcmp)(s1, s2, n);
163*d89ec533Spatrick __sanitizer_weak_hook_memcmp(GET_CALLER_PC(), s1, s2, n, result);
164*d89ec533Spatrick return result;
165*d89ec533Spatrick }
166*d89ec533Spatrick
strncmp(const char * s1,const char * s2,size_t n)167*d89ec533Spatrick ATTRIBUTE_INTERFACE int strncmp(const char *s1, const char *s2, size_t n) {
168*d89ec533Spatrick if (!FuzzerInited)
169*d89ec533Spatrick return internal_strncmp(s1, s2, n);
170*d89ec533Spatrick int result = REAL(strncmp)(s1, s2, n);
171*d89ec533Spatrick __sanitizer_weak_hook_strncmp(GET_CALLER_PC(), s1, s2, n, result);
172*d89ec533Spatrick return result;
173*d89ec533Spatrick }
174*d89ec533Spatrick
strcmp(const char * s1,const char * s2)175*d89ec533Spatrick ATTRIBUTE_INTERFACE int strcmp(const char *s1, const char *s2) {
176*d89ec533Spatrick if (!FuzzerInited)
177*d89ec533Spatrick return internal_strcmp(s1, s2);
178*d89ec533Spatrick int result = REAL(strcmp)(s1, s2);
179*d89ec533Spatrick __sanitizer_weak_hook_strcmp(GET_CALLER_PC(), s1, s2, result);
180*d89ec533Spatrick return result;
181*d89ec533Spatrick }
182*d89ec533Spatrick
strncasecmp(const char * s1,const char * s2,size_t n)183*d89ec533Spatrick ATTRIBUTE_INTERFACE int strncasecmp(const char *s1, const char *s2, size_t n) {
184*d89ec533Spatrick ensureFuzzerInited();
185*d89ec533Spatrick int result = REAL(strncasecmp)(s1, s2, n);
186*d89ec533Spatrick __sanitizer_weak_hook_strncasecmp(GET_CALLER_PC(), s1, s2, n, result);
187*d89ec533Spatrick return result;
188*d89ec533Spatrick }
189*d89ec533Spatrick
strcasecmp(const char * s1,const char * s2)190*d89ec533Spatrick ATTRIBUTE_INTERFACE int strcasecmp(const char *s1, const char *s2) {
191*d89ec533Spatrick ensureFuzzerInited();
192*d89ec533Spatrick int result = REAL(strcasecmp)(s1, s2);
193*d89ec533Spatrick __sanitizer_weak_hook_strcasecmp(GET_CALLER_PC(), s1, s2, result);
194*d89ec533Spatrick return result;
195*d89ec533Spatrick }
196*d89ec533Spatrick
strstr(const char * s1,const char * s2)197*d89ec533Spatrick ATTRIBUTE_INTERFACE char *strstr(const char *s1, const char *s2) {
198*d89ec533Spatrick if (!FuzzerInited)
199*d89ec533Spatrick return internal_strstr(s1, s2);
200*d89ec533Spatrick char *result = REAL(strstr)(s1, s2);
201*d89ec533Spatrick __sanitizer_weak_hook_strstr(GET_CALLER_PC(), s1, s2, result);
202*d89ec533Spatrick return result;
203*d89ec533Spatrick }
204*d89ec533Spatrick
strcasestr(const char * s1,const char * s2)205*d89ec533Spatrick ATTRIBUTE_INTERFACE char *strcasestr(const char *s1, const char *s2) {
206*d89ec533Spatrick ensureFuzzerInited();
207*d89ec533Spatrick char *result = REAL(strcasestr)(s1, s2);
208*d89ec533Spatrick __sanitizer_weak_hook_strcasestr(GET_CALLER_PC(), s1, s2, result);
209*d89ec533Spatrick return result;
210*d89ec533Spatrick }
211*d89ec533Spatrick
212*d89ec533Spatrick ATTRIBUTE_INTERFACE
memmem(const void * s1,size_t len1,const void * s2,size_t len2)213*d89ec533Spatrick void *memmem(const void *s1, size_t len1, const void *s2, size_t len2) {
214*d89ec533Spatrick ensureFuzzerInited();
215*d89ec533Spatrick void *result = REAL(memmem)(s1, len1, s2, len2);
216*d89ec533Spatrick __sanitizer_weak_hook_memmem(GET_CALLER_PC(), s1, len1, s2, len2, result);
217*d89ec533Spatrick return result;
218*d89ec533Spatrick }
219*d89ec533Spatrick
220*d89ec533Spatrick __attribute__((section(".preinit_array"),
221*d89ec533Spatrick used)) static void (*__local_fuzzer_preinit)(void) = fuzzerInit;
222*d89ec533Spatrick
223*d89ec533Spatrick } // extern "C"
224*d89ec533Spatrick
fuzzerInit()225*d89ec533Spatrick static void fuzzerInit() {
226*d89ec533Spatrick assert(!FuzzerInitIsRunning);
227*d89ec533Spatrick if (FuzzerInited)
228*d89ec533Spatrick return;
229*d89ec533Spatrick FuzzerInitIsRunning = true;
230*d89ec533Spatrick
231*d89ec533Spatrick REAL(bcmp) = reinterpret_cast<memcmp_type>(
232*d89ec533Spatrick getFuncAddr("bcmp", reinterpret_cast<uintptr_t>(&bcmp)));
233*d89ec533Spatrick REAL(memcmp) = reinterpret_cast<memcmp_type>(
234*d89ec533Spatrick getFuncAddr("memcmp", reinterpret_cast<uintptr_t>(&memcmp)));
235*d89ec533Spatrick REAL(strncmp) = reinterpret_cast<strncmp_type>(
236*d89ec533Spatrick getFuncAddr("strncmp", reinterpret_cast<uintptr_t>(&strncmp)));
237*d89ec533Spatrick REAL(strcmp) = reinterpret_cast<strcmp_type>(
238*d89ec533Spatrick getFuncAddr("strcmp", reinterpret_cast<uintptr_t>(&strcmp)));
239*d89ec533Spatrick REAL(strncasecmp) = reinterpret_cast<strncasecmp_type>(
240*d89ec533Spatrick getFuncAddr("strncasecmp", reinterpret_cast<uintptr_t>(&strncasecmp)));
241*d89ec533Spatrick REAL(strcasecmp) = reinterpret_cast<strcasecmp_type>(
242*d89ec533Spatrick getFuncAddr("strcasecmp", reinterpret_cast<uintptr_t>(&strcasecmp)));
243*d89ec533Spatrick REAL(strstr) = reinterpret_cast<strstr_type>(
244*d89ec533Spatrick getFuncAddr("strstr", reinterpret_cast<uintptr_t>(&strstr)));
245*d89ec533Spatrick REAL(strcasestr) = reinterpret_cast<strcasestr_type>(
246*d89ec533Spatrick getFuncAddr("strcasestr", reinterpret_cast<uintptr_t>(&strcasestr)));
247*d89ec533Spatrick REAL(memmem) = reinterpret_cast<memmem_type>(
248*d89ec533Spatrick getFuncAddr("memmem", reinterpret_cast<uintptr_t>(&memmem)));
249*d89ec533Spatrick
250*d89ec533Spatrick FuzzerInitIsRunning = false;
251*d89ec533Spatrick FuzzerInited = 1;
252*d89ec533Spatrick }
253*d89ec533Spatrick
254*d89ec533Spatrick #endif
255