xref: /freebsd-src/contrib/jemalloc/src/hook.c (revision c5ad81420c495d1d5de04209b0ec4fcb435c322c)
1*c5ad8142SEric van Gyzen #include "jemalloc/internal/jemalloc_preamble.h"
2*c5ad8142SEric van Gyzen 
3*c5ad8142SEric van Gyzen #include "jemalloc/internal/hook.h"
4*c5ad8142SEric van Gyzen 
5*c5ad8142SEric van Gyzen #include "jemalloc/internal/atomic.h"
6*c5ad8142SEric van Gyzen #include "jemalloc/internal/mutex.h"
7*c5ad8142SEric van Gyzen #include "jemalloc/internal/seq.h"
8*c5ad8142SEric van Gyzen 
9*c5ad8142SEric van Gyzen typedef struct hooks_internal_s hooks_internal_t;
10*c5ad8142SEric van Gyzen struct hooks_internal_s {
11*c5ad8142SEric van Gyzen 	hooks_t hooks;
12*c5ad8142SEric van Gyzen 	bool in_use;
13*c5ad8142SEric van Gyzen };
14*c5ad8142SEric van Gyzen 
15*c5ad8142SEric van Gyzen seq_define(hooks_internal_t, hooks)
16*c5ad8142SEric van Gyzen 
17*c5ad8142SEric van Gyzen static atomic_u_t nhooks = ATOMIC_INIT(0);
18*c5ad8142SEric van Gyzen static seq_hooks_t hooks[HOOK_MAX];
19*c5ad8142SEric van Gyzen static malloc_mutex_t hooks_mu;
20*c5ad8142SEric van Gyzen 
21*c5ad8142SEric van Gyzen bool
hook_boot()22*c5ad8142SEric van Gyzen hook_boot() {
23*c5ad8142SEric van Gyzen 	return malloc_mutex_init(&hooks_mu, "hooks", WITNESS_RANK_HOOK,
24*c5ad8142SEric van Gyzen 	    malloc_mutex_rank_exclusive);
25*c5ad8142SEric van Gyzen }
26*c5ad8142SEric van Gyzen 
27*c5ad8142SEric van Gyzen static void *
hook_install_locked(hooks_t * to_install)28*c5ad8142SEric van Gyzen hook_install_locked(hooks_t *to_install) {
29*c5ad8142SEric van Gyzen 	hooks_internal_t hooks_internal;
30*c5ad8142SEric van Gyzen 	for (int i = 0; i < HOOK_MAX; i++) {
31*c5ad8142SEric van Gyzen 		bool success = seq_try_load_hooks(&hooks_internal, &hooks[i]);
32*c5ad8142SEric van Gyzen 		/* We hold mu; no concurrent access. */
33*c5ad8142SEric van Gyzen 		assert(success);
34*c5ad8142SEric van Gyzen 		if (!hooks_internal.in_use) {
35*c5ad8142SEric van Gyzen 			hooks_internal.hooks = *to_install;
36*c5ad8142SEric van Gyzen 			hooks_internal.in_use = true;
37*c5ad8142SEric van Gyzen 			seq_store_hooks(&hooks[i], &hooks_internal);
38*c5ad8142SEric van Gyzen 			atomic_store_u(&nhooks,
39*c5ad8142SEric van Gyzen 			    atomic_load_u(&nhooks, ATOMIC_RELAXED) + 1,
40*c5ad8142SEric van Gyzen 			    ATOMIC_RELAXED);
41*c5ad8142SEric van Gyzen 			return &hooks[i];
42*c5ad8142SEric van Gyzen 		}
43*c5ad8142SEric van Gyzen 	}
44*c5ad8142SEric van Gyzen 	return NULL;
45*c5ad8142SEric van Gyzen }
46*c5ad8142SEric van Gyzen 
47*c5ad8142SEric van Gyzen void *
hook_install(tsdn_t * tsdn,hooks_t * to_install)48*c5ad8142SEric van Gyzen hook_install(tsdn_t *tsdn, hooks_t *to_install) {
49*c5ad8142SEric van Gyzen 	malloc_mutex_lock(tsdn, &hooks_mu);
50*c5ad8142SEric van Gyzen 	void *ret = hook_install_locked(to_install);
51*c5ad8142SEric van Gyzen 	if (ret != NULL) {
52*c5ad8142SEric van Gyzen 		tsd_global_slow_inc(tsdn);
53*c5ad8142SEric van Gyzen 	}
54*c5ad8142SEric van Gyzen 	malloc_mutex_unlock(tsdn, &hooks_mu);
55*c5ad8142SEric van Gyzen 	return ret;
56*c5ad8142SEric van Gyzen }
57*c5ad8142SEric van Gyzen 
58*c5ad8142SEric van Gyzen static void
hook_remove_locked(seq_hooks_t * to_remove)59*c5ad8142SEric van Gyzen hook_remove_locked(seq_hooks_t *to_remove) {
60*c5ad8142SEric van Gyzen 	hooks_internal_t hooks_internal;
61*c5ad8142SEric van Gyzen 	bool success = seq_try_load_hooks(&hooks_internal, to_remove);
62*c5ad8142SEric van Gyzen 	/* We hold mu; no concurrent access. */
63*c5ad8142SEric van Gyzen 	assert(success);
64*c5ad8142SEric van Gyzen 	/* Should only remove hooks that were added. */
65*c5ad8142SEric van Gyzen 	assert(hooks_internal.in_use);
66*c5ad8142SEric van Gyzen 	hooks_internal.in_use = false;
67*c5ad8142SEric van Gyzen 	seq_store_hooks(to_remove, &hooks_internal);
68*c5ad8142SEric van Gyzen 	atomic_store_u(&nhooks, atomic_load_u(&nhooks, ATOMIC_RELAXED) - 1,
69*c5ad8142SEric van Gyzen 	    ATOMIC_RELAXED);
70*c5ad8142SEric van Gyzen }
71*c5ad8142SEric van Gyzen 
72*c5ad8142SEric van Gyzen void
hook_remove(tsdn_t * tsdn,void * opaque)73*c5ad8142SEric van Gyzen hook_remove(tsdn_t *tsdn, void *opaque) {
74*c5ad8142SEric van Gyzen 	if (config_debug) {
75*c5ad8142SEric van Gyzen 		char *hooks_begin = (char *)&hooks[0];
76*c5ad8142SEric van Gyzen 		char *hooks_end = (char *)&hooks[HOOK_MAX];
77*c5ad8142SEric van Gyzen 		char *hook = (char *)opaque;
78*c5ad8142SEric van Gyzen 		assert(hooks_begin <= hook && hook < hooks_end
79*c5ad8142SEric van Gyzen 		    && (hook - hooks_begin) % sizeof(seq_hooks_t) == 0);
80*c5ad8142SEric van Gyzen 	}
81*c5ad8142SEric van Gyzen 	malloc_mutex_lock(tsdn, &hooks_mu);
82*c5ad8142SEric van Gyzen 	hook_remove_locked((seq_hooks_t *)opaque);
83*c5ad8142SEric van Gyzen 	tsd_global_slow_dec(tsdn);
84*c5ad8142SEric van Gyzen 	malloc_mutex_unlock(tsdn, &hooks_mu);
85*c5ad8142SEric van Gyzen }
86*c5ad8142SEric van Gyzen 
87*c5ad8142SEric van Gyzen #define FOR_EACH_HOOK_BEGIN(hooks_internal_ptr)				\
88*c5ad8142SEric van Gyzen for (int for_each_hook_counter = 0;					\
89*c5ad8142SEric van Gyzen     for_each_hook_counter < HOOK_MAX;					\
90*c5ad8142SEric van Gyzen     for_each_hook_counter++) {						\
91*c5ad8142SEric van Gyzen 	bool for_each_hook_success = seq_try_load_hooks(		\
92*c5ad8142SEric van Gyzen 	    (hooks_internal_ptr), &hooks[for_each_hook_counter]);	\
93*c5ad8142SEric van Gyzen 	if (!for_each_hook_success) {					\
94*c5ad8142SEric van Gyzen 		continue;						\
95*c5ad8142SEric van Gyzen 	}								\
96*c5ad8142SEric van Gyzen 	if (!(hooks_internal_ptr)->in_use) {				\
97*c5ad8142SEric van Gyzen 		continue;						\
98*c5ad8142SEric van Gyzen 	}
99*c5ad8142SEric van Gyzen #define FOR_EACH_HOOK_END						\
100*c5ad8142SEric van Gyzen }
101*c5ad8142SEric van Gyzen 
102*c5ad8142SEric van Gyzen static bool *
hook_reentrantp()103*c5ad8142SEric van Gyzen hook_reentrantp() {
104*c5ad8142SEric van Gyzen 	/*
105*c5ad8142SEric van Gyzen 	 * We prevent user reentrancy within hooks.  This is basically just a
106*c5ad8142SEric van Gyzen 	 * thread-local bool that triggers an early-exit.
107*c5ad8142SEric van Gyzen 	 *
108*c5ad8142SEric van Gyzen 	 * We don't fold in_hook into reentrancy.  There are two reasons for
109*c5ad8142SEric van Gyzen 	 * this:
110*c5ad8142SEric van Gyzen 	 * - Right now, we turn on reentrancy during things like extent hook
111*c5ad8142SEric van Gyzen 	 *   execution.  Allocating during extent hooks is not officially
112*c5ad8142SEric van Gyzen 	 *   supported, but we don't want to break it for the time being.  These
113*c5ad8142SEric van Gyzen 	 *   sorts of allocations should probably still be hooked, though.
114*c5ad8142SEric van Gyzen 	 * - If a hook allocates, we may want it to be relatively fast (after
115*c5ad8142SEric van Gyzen 	 *   all, it executes on every allocator operation).  Turning on
116*c5ad8142SEric van Gyzen 	 *   reentrancy is a fairly heavyweight mode (disabling tcache,
117*c5ad8142SEric van Gyzen 	 *   redirecting to arena 0, etc.).  It's possible we may one day want
118*c5ad8142SEric van Gyzen 	 *   to turn on reentrant mode here, if it proves too difficult to keep
119*c5ad8142SEric van Gyzen 	 *   this working.  But that's fairly easy for us to see; OTOH, people
120*c5ad8142SEric van Gyzen 	 *   not using hooks because they're too slow is easy for us to miss.
121*c5ad8142SEric van Gyzen 	 *
122*c5ad8142SEric van Gyzen 	 * The tricky part is
123*c5ad8142SEric van Gyzen 	 * that this code might get invoked even if we don't have access to tsd.
124*c5ad8142SEric van Gyzen 	 * This function mimics getting a pointer to thread-local data, except
125*c5ad8142SEric van Gyzen 	 * that it might secretly return a pointer to some global data if we
126*c5ad8142SEric van Gyzen 	 * know that the caller will take the early-exit path.
127*c5ad8142SEric van Gyzen 	 * If we return a bool that indicates that we are reentrant, then the
128*c5ad8142SEric van Gyzen 	 * caller will go down the early exit path, leaving the global
129*c5ad8142SEric van Gyzen 	 * untouched.
130*c5ad8142SEric van Gyzen 	 */
131*c5ad8142SEric van Gyzen 	static bool in_hook_global = true;
132*c5ad8142SEric van Gyzen 	tsdn_t *tsdn = tsdn_fetch();
133*c5ad8142SEric van Gyzen 	tcache_t *tcache = tsdn_tcachep_get(tsdn);
134*c5ad8142SEric van Gyzen 	if (tcache != NULL) {
135*c5ad8142SEric van Gyzen 		return &tcache->in_hook;
136*c5ad8142SEric van Gyzen 	}
137*c5ad8142SEric van Gyzen 	return &in_hook_global;
138*c5ad8142SEric van Gyzen }
139*c5ad8142SEric van Gyzen 
140*c5ad8142SEric van Gyzen #define HOOK_PROLOGUE							\
141*c5ad8142SEric van Gyzen 	if (likely(atomic_load_u(&nhooks, ATOMIC_RELAXED) == 0)) {	\
142*c5ad8142SEric van Gyzen 		return;							\
143*c5ad8142SEric van Gyzen 	}								\
144*c5ad8142SEric van Gyzen 	bool *in_hook = hook_reentrantp();				\
145*c5ad8142SEric van Gyzen 	if (*in_hook) {							\
146*c5ad8142SEric van Gyzen 		return;							\
147*c5ad8142SEric van Gyzen 	}								\
148*c5ad8142SEric van Gyzen 	*in_hook = true;
149*c5ad8142SEric van Gyzen 
150*c5ad8142SEric van Gyzen #define HOOK_EPILOGUE							\
151*c5ad8142SEric van Gyzen 	*in_hook = false;
152*c5ad8142SEric van Gyzen 
153*c5ad8142SEric van Gyzen void
hook_invoke_alloc(hook_alloc_t type,void * result,uintptr_t result_raw,uintptr_t args_raw[3])154*c5ad8142SEric van Gyzen hook_invoke_alloc(hook_alloc_t type, void *result, uintptr_t result_raw,
155*c5ad8142SEric van Gyzen     uintptr_t args_raw[3]) {
156*c5ad8142SEric van Gyzen 	HOOK_PROLOGUE
157*c5ad8142SEric van Gyzen 
158*c5ad8142SEric van Gyzen 	hooks_internal_t hook;
159*c5ad8142SEric van Gyzen 	FOR_EACH_HOOK_BEGIN(&hook)
160*c5ad8142SEric van Gyzen 		hook_alloc h = hook.hooks.alloc_hook;
161*c5ad8142SEric van Gyzen 		if (h != NULL) {
162*c5ad8142SEric van Gyzen 			h(hook.hooks.extra, type, result, result_raw, args_raw);
163*c5ad8142SEric van Gyzen 		}
164*c5ad8142SEric van Gyzen 	FOR_EACH_HOOK_END
165*c5ad8142SEric van Gyzen 
166*c5ad8142SEric van Gyzen 	HOOK_EPILOGUE
167*c5ad8142SEric van Gyzen }
168*c5ad8142SEric van Gyzen 
169*c5ad8142SEric van Gyzen void
hook_invoke_dalloc(hook_dalloc_t type,void * address,uintptr_t args_raw[3])170*c5ad8142SEric van Gyzen hook_invoke_dalloc(hook_dalloc_t type, void *address, uintptr_t args_raw[3]) {
171*c5ad8142SEric van Gyzen 	HOOK_PROLOGUE
172*c5ad8142SEric van Gyzen 	hooks_internal_t hook;
173*c5ad8142SEric van Gyzen 	FOR_EACH_HOOK_BEGIN(&hook)
174*c5ad8142SEric van Gyzen 		hook_dalloc h = hook.hooks.dalloc_hook;
175*c5ad8142SEric van Gyzen 		if (h != NULL) {
176*c5ad8142SEric van Gyzen 			h(hook.hooks.extra, type, address, args_raw);
177*c5ad8142SEric van Gyzen 		}
178*c5ad8142SEric van Gyzen 	FOR_EACH_HOOK_END
179*c5ad8142SEric van Gyzen 	HOOK_EPILOGUE
180*c5ad8142SEric van Gyzen }
181*c5ad8142SEric van Gyzen 
182*c5ad8142SEric van Gyzen void
hook_invoke_expand(hook_expand_t type,void * address,size_t old_usize,size_t new_usize,uintptr_t result_raw,uintptr_t args_raw[4])183*c5ad8142SEric van Gyzen hook_invoke_expand(hook_expand_t type, void *address, size_t old_usize,
184*c5ad8142SEric van Gyzen     size_t new_usize, uintptr_t result_raw, uintptr_t args_raw[4]) {
185*c5ad8142SEric van Gyzen 	HOOK_PROLOGUE
186*c5ad8142SEric van Gyzen 	hooks_internal_t hook;
187*c5ad8142SEric van Gyzen 	FOR_EACH_HOOK_BEGIN(&hook)
188*c5ad8142SEric van Gyzen 		hook_expand h = hook.hooks.expand_hook;
189*c5ad8142SEric van Gyzen 		if (h != NULL) {
190*c5ad8142SEric van Gyzen 			h(hook.hooks.extra, type, address, old_usize, new_usize,
191*c5ad8142SEric van Gyzen 			    result_raw, args_raw);
192*c5ad8142SEric van Gyzen 		}
193*c5ad8142SEric van Gyzen 	FOR_EACH_HOOK_END
194*c5ad8142SEric van Gyzen 	HOOK_EPILOGUE
195*c5ad8142SEric van Gyzen }
196