xref: /freebsd-src/contrib/jemalloc/src/tsd.c (revision c5ad81420c495d1d5de04209b0ec4fcb435c322c)
1a4bd5210SJason Evans #define JEMALLOC_TSD_C_
2b7eaed25SJason Evans #include "jemalloc/internal/jemalloc_preamble.h"
3b7eaed25SJason Evans #include "jemalloc/internal/jemalloc_internal_includes.h"
4b7eaed25SJason Evans 
5b7eaed25SJason Evans #include "jemalloc/internal/assert.h"
6b7eaed25SJason Evans #include "jemalloc/internal/mutex.h"
7b7eaed25SJason Evans #include "jemalloc/internal/rtree.h"
8a4bd5210SJason Evans 
9a4bd5210SJason Evans /******************************************************************************/
10a4bd5210SJason Evans /* Data. */
11a4bd5210SJason Evans 
12a4bd5210SJason Evans static unsigned ncleanups;
13a4bd5210SJason Evans static malloc_tsd_cleanup_t cleanups[MALLOC_TSD_CLEANUPS_MAX];
14a4bd5210SJason Evans 
15*c5ad8142SEric van Gyzen /* TSD_INITIALIZER triggers "-Wmissing-field-initializer" */
16*c5ad8142SEric van Gyzen JEMALLOC_DIAGNOSTIC_PUSH
17*c5ad8142SEric van Gyzen JEMALLOC_DIAGNOSTIC_IGNORE_MISSING_STRUCT_FIELD_INITIALIZERS
18*c5ad8142SEric van Gyzen 
19b7eaed25SJason Evans #ifdef JEMALLOC_MALLOC_THREAD_CLEANUP
20*c5ad8142SEric van Gyzen JEMALLOC_TSD_TYPE_ATTR(tsd_t) tsd_tls = TSD_INITIALIZER;
21*c5ad8142SEric van Gyzen JEMALLOC_TSD_TYPE_ATTR(bool) JEMALLOC_TLS_MODEL tsd_initialized = false;
22b7eaed25SJason Evans bool tsd_booted = false;
23b7eaed25SJason Evans #elif (defined(JEMALLOC_TLS))
24*c5ad8142SEric van Gyzen JEMALLOC_TSD_TYPE_ATTR(tsd_t) tsd_tls = TSD_INITIALIZER;
25b7eaed25SJason Evans pthread_key_t tsd_tsd;
26b7eaed25SJason Evans bool tsd_booted = false;
27b7eaed25SJason Evans #elif (defined(_WIN32))
28b7eaed25SJason Evans DWORD tsd_tsd;
29b7eaed25SJason Evans tsd_wrapper_t tsd_boot_wrapper = {false, TSD_INITIALIZER};
30b7eaed25SJason Evans bool tsd_booted = false;
31b7eaed25SJason Evans #else
32b7eaed25SJason Evans 
33b7eaed25SJason Evans /*
34b7eaed25SJason Evans  * This contains a mutex, but it's pretty convenient to allow the mutex code to
35b7eaed25SJason Evans  * have a dependency on tsd.  So we define the struct here, and only refer to it
36b7eaed25SJason Evans  * by pointer in the header.
37b7eaed25SJason Evans  */
38b7eaed25SJason Evans struct tsd_init_head_s {
39b7eaed25SJason Evans 	ql_head(tsd_init_block_t) blocks;
40b7eaed25SJason Evans 	malloc_mutex_t lock;
41b7eaed25SJason Evans };
42b7eaed25SJason Evans 
43b7eaed25SJason Evans pthread_key_t tsd_tsd;
44b7eaed25SJason Evans tsd_init_head_t	tsd_init_head = {
45b7eaed25SJason Evans 	ql_head_initializer(blocks),
46b7eaed25SJason Evans 	MALLOC_MUTEX_INITIALIZER
47b7eaed25SJason Evans };
48*c5ad8142SEric van Gyzen 
49b7eaed25SJason Evans tsd_wrapper_t tsd_boot_wrapper = {
50b7eaed25SJason Evans 	false,
51b7eaed25SJason Evans 	TSD_INITIALIZER
52b7eaed25SJason Evans };
53b7eaed25SJason Evans bool tsd_booted = false;
54b7eaed25SJason Evans #endif
55b7eaed25SJason Evans 
56*c5ad8142SEric van Gyzen JEMALLOC_DIAGNOSTIC_POP
57d0e79aa3SJason Evans 
58a4bd5210SJason Evans /******************************************************************************/
59a4bd5210SJason Evans 
60*c5ad8142SEric van Gyzen /* A list of all the tsds in the nominal state. */
61*c5ad8142SEric van Gyzen typedef ql_head(tsd_t) tsd_list_t;
62*c5ad8142SEric van Gyzen static tsd_list_t tsd_nominal_tsds = ql_head_initializer(tsd_nominal_tsds);
63*c5ad8142SEric van Gyzen static malloc_mutex_t tsd_nominal_tsds_lock;
64*c5ad8142SEric van Gyzen 
65*c5ad8142SEric van Gyzen /* How many slow-path-enabling features are turned on. */
66*c5ad8142SEric van Gyzen static atomic_u32_t tsd_global_slow_count = ATOMIC_INIT(0);
67*c5ad8142SEric van Gyzen 
68*c5ad8142SEric van Gyzen static bool
tsd_in_nominal_list(tsd_t * tsd)69*c5ad8142SEric van Gyzen tsd_in_nominal_list(tsd_t *tsd) {
70*c5ad8142SEric van Gyzen 	tsd_t *tsd_list;
71*c5ad8142SEric van Gyzen 	bool found = false;
72*c5ad8142SEric van Gyzen 	/*
73*c5ad8142SEric van Gyzen 	 * We don't know that tsd is nominal; it might not be safe to get data
74*c5ad8142SEric van Gyzen 	 * out of it here.
75*c5ad8142SEric van Gyzen 	 */
76*c5ad8142SEric van Gyzen 	malloc_mutex_lock(TSDN_NULL, &tsd_nominal_tsds_lock);
77*c5ad8142SEric van Gyzen 	ql_foreach(tsd_list, &tsd_nominal_tsds, TSD_MANGLE(tcache).tsd_link) {
78*c5ad8142SEric van Gyzen 		if (tsd == tsd_list) {
79*c5ad8142SEric van Gyzen 			found = true;
80*c5ad8142SEric van Gyzen 			break;
81*c5ad8142SEric van Gyzen 		}
82*c5ad8142SEric van Gyzen 	}
83*c5ad8142SEric van Gyzen 	malloc_mutex_unlock(TSDN_NULL, &tsd_nominal_tsds_lock);
84*c5ad8142SEric van Gyzen 	return found;
85*c5ad8142SEric van Gyzen }
86*c5ad8142SEric van Gyzen 
87*c5ad8142SEric van Gyzen static void
tsd_add_nominal(tsd_t * tsd)88*c5ad8142SEric van Gyzen tsd_add_nominal(tsd_t *tsd) {
89*c5ad8142SEric van Gyzen 	assert(!tsd_in_nominal_list(tsd));
90*c5ad8142SEric van Gyzen 	assert(tsd_state_get(tsd) <= tsd_state_nominal_max);
91*c5ad8142SEric van Gyzen 	ql_elm_new(tsd, TSD_MANGLE(tcache).tsd_link);
92*c5ad8142SEric van Gyzen 	malloc_mutex_lock(tsd_tsdn(tsd), &tsd_nominal_tsds_lock);
93*c5ad8142SEric van Gyzen 	ql_tail_insert(&tsd_nominal_tsds, tsd, TSD_MANGLE(tcache).tsd_link);
94*c5ad8142SEric van Gyzen 	malloc_mutex_unlock(tsd_tsdn(tsd), &tsd_nominal_tsds_lock);
95*c5ad8142SEric van Gyzen }
96*c5ad8142SEric van Gyzen 
97*c5ad8142SEric van Gyzen static void
tsd_remove_nominal(tsd_t * tsd)98*c5ad8142SEric van Gyzen tsd_remove_nominal(tsd_t *tsd) {
99*c5ad8142SEric van Gyzen 	assert(tsd_in_nominal_list(tsd));
100*c5ad8142SEric van Gyzen 	assert(tsd_state_get(tsd) <= tsd_state_nominal_max);
101*c5ad8142SEric van Gyzen 	malloc_mutex_lock(tsd_tsdn(tsd), &tsd_nominal_tsds_lock);
102*c5ad8142SEric van Gyzen 	ql_remove(&tsd_nominal_tsds, tsd, TSD_MANGLE(tcache).tsd_link);
103*c5ad8142SEric van Gyzen 	malloc_mutex_unlock(tsd_tsdn(tsd), &tsd_nominal_tsds_lock);
104*c5ad8142SEric van Gyzen }
105*c5ad8142SEric van Gyzen 
106*c5ad8142SEric van Gyzen static void
tsd_force_recompute(tsdn_t * tsdn)107*c5ad8142SEric van Gyzen tsd_force_recompute(tsdn_t *tsdn) {
108*c5ad8142SEric van Gyzen 	/*
109*c5ad8142SEric van Gyzen 	 * The stores to tsd->state here need to synchronize with the exchange
110*c5ad8142SEric van Gyzen 	 * in tsd_slow_update.
111*c5ad8142SEric van Gyzen 	 */
112*c5ad8142SEric van Gyzen 	atomic_fence(ATOMIC_RELEASE);
113*c5ad8142SEric van Gyzen 	malloc_mutex_lock(tsdn, &tsd_nominal_tsds_lock);
114*c5ad8142SEric van Gyzen 	tsd_t *remote_tsd;
115*c5ad8142SEric van Gyzen 	ql_foreach(remote_tsd, &tsd_nominal_tsds, TSD_MANGLE(tcache).tsd_link) {
116*c5ad8142SEric van Gyzen 		assert(tsd_atomic_load(&remote_tsd->state, ATOMIC_RELAXED)
117*c5ad8142SEric van Gyzen 		    <= tsd_state_nominal_max);
118*c5ad8142SEric van Gyzen 		tsd_atomic_store(&remote_tsd->state, tsd_state_nominal_recompute,
119*c5ad8142SEric van Gyzen 		    ATOMIC_RELAXED);
120*c5ad8142SEric van Gyzen 	}
121*c5ad8142SEric van Gyzen 	malloc_mutex_unlock(tsdn, &tsd_nominal_tsds_lock);
122*c5ad8142SEric van Gyzen }
123*c5ad8142SEric van Gyzen 
124*c5ad8142SEric van Gyzen void
tsd_global_slow_inc(tsdn_t * tsdn)125*c5ad8142SEric van Gyzen tsd_global_slow_inc(tsdn_t *tsdn) {
126*c5ad8142SEric van Gyzen 	atomic_fetch_add_u32(&tsd_global_slow_count, 1, ATOMIC_RELAXED);
127*c5ad8142SEric van Gyzen 	/*
128*c5ad8142SEric van Gyzen 	 * We unconditionally force a recompute, even if the global slow count
129*c5ad8142SEric van Gyzen 	 * was already positive.  If we didn't, then it would be possible for us
130*c5ad8142SEric van Gyzen 	 * to return to the user, have the user synchronize externally with some
131*c5ad8142SEric van Gyzen 	 * other thread, and then have that other thread not have picked up the
132*c5ad8142SEric van Gyzen 	 * update yet (since the original incrementing thread might still be
133*c5ad8142SEric van Gyzen 	 * making its way through the tsd list).
134*c5ad8142SEric van Gyzen 	 */
135*c5ad8142SEric van Gyzen 	tsd_force_recompute(tsdn);
136*c5ad8142SEric van Gyzen }
137*c5ad8142SEric van Gyzen 
/*
 * Record that one slow-path-enabling feature was turned off, then force every
 * nominal tsd to recompute its state.
 */
void
tsd_global_slow_dec(tsdn_t *tsdn) {
	atomic_fetch_sub_u32(&tsd_global_slow_count, 1, ATOMIC_RELAXED);
	/* Forced unconditionally; see the note in tsd_global_slow_inc(). */
	tsd_force_recompute(tsdn);
}
143*c5ad8142SEric van Gyzen 
144*c5ad8142SEric van Gyzen static bool
tsd_local_slow(tsd_t * tsd)145*c5ad8142SEric van Gyzen tsd_local_slow(tsd_t *tsd) {
146*c5ad8142SEric van Gyzen 	return !tsd_tcache_enabled_get(tsd)
147*c5ad8142SEric van Gyzen 	    || tsd_reentrancy_level_get(tsd) > 0;
148*c5ad8142SEric van Gyzen }
149*c5ad8142SEric van Gyzen 
150*c5ad8142SEric van Gyzen bool
tsd_global_slow()151*c5ad8142SEric van Gyzen tsd_global_slow() {
152*c5ad8142SEric van Gyzen 	return atomic_load_u32(&tsd_global_slow_count, ATOMIC_RELAXED) > 0;
153*c5ad8142SEric van Gyzen }
154*c5ad8142SEric van Gyzen 
155*c5ad8142SEric van Gyzen /******************************************************************************/
156*c5ad8142SEric van Gyzen 
157*c5ad8142SEric van Gyzen static uint8_t
tsd_state_compute(tsd_t * tsd)158*c5ad8142SEric van Gyzen tsd_state_compute(tsd_t *tsd) {
159*c5ad8142SEric van Gyzen 	if (!tsd_nominal(tsd)) {
160*c5ad8142SEric van Gyzen 		return tsd_state_get(tsd);
161*c5ad8142SEric van Gyzen 	}
162*c5ad8142SEric van Gyzen 	/* We're in *a* nominal state; but which one? */
163*c5ad8142SEric van Gyzen 	if (malloc_slow || tsd_local_slow(tsd) || tsd_global_slow()) {
164*c5ad8142SEric van Gyzen 		return tsd_state_nominal_slow;
165*c5ad8142SEric van Gyzen 	} else {
166*c5ad8142SEric van Gyzen 		return tsd_state_nominal;
167*c5ad8142SEric van Gyzen 	}
168*c5ad8142SEric van Gyzen }
169*c5ad8142SEric van Gyzen 
170b7eaed25SJason Evans void
tsd_slow_update(tsd_t * tsd)171b7eaed25SJason Evans tsd_slow_update(tsd_t *tsd) {
172*c5ad8142SEric van Gyzen 	uint8_t old_state;
173*c5ad8142SEric van Gyzen 	do {
174*c5ad8142SEric van Gyzen 		uint8_t new_state = tsd_state_compute(tsd);
175*c5ad8142SEric van Gyzen 		old_state = tsd_atomic_exchange(&tsd->state, new_state,
176*c5ad8142SEric van Gyzen 		    ATOMIC_ACQUIRE);
177*c5ad8142SEric van Gyzen 	} while (old_state == tsd_state_nominal_recompute);
178*c5ad8142SEric van Gyzen }
179*c5ad8142SEric van Gyzen 
180*c5ad8142SEric van Gyzen void
tsd_state_set(tsd_t * tsd,uint8_t new_state)181*c5ad8142SEric van Gyzen tsd_state_set(tsd_t *tsd, uint8_t new_state) {
182*c5ad8142SEric van Gyzen 	/* Only the tsd module can change the state *to* recompute. */
183*c5ad8142SEric van Gyzen 	assert(new_state != tsd_state_nominal_recompute);
184*c5ad8142SEric van Gyzen 	uint8_t old_state = tsd_atomic_load(&tsd->state, ATOMIC_RELAXED);
185*c5ad8142SEric van Gyzen 	if (old_state > tsd_state_nominal_max) {
186*c5ad8142SEric van Gyzen 		/*
187*c5ad8142SEric van Gyzen 		 * Not currently in the nominal list, but it might need to be
188*c5ad8142SEric van Gyzen 		 * inserted there.
189*c5ad8142SEric van Gyzen 		 */
190*c5ad8142SEric van Gyzen 		assert(!tsd_in_nominal_list(tsd));
191*c5ad8142SEric van Gyzen 		tsd_atomic_store(&tsd->state, new_state, ATOMIC_RELAXED);
192*c5ad8142SEric van Gyzen 		if (new_state <= tsd_state_nominal_max) {
193*c5ad8142SEric van Gyzen 			tsd_add_nominal(tsd);
194*c5ad8142SEric van Gyzen 		}
195b7eaed25SJason Evans 	} else {
196*c5ad8142SEric van Gyzen 		/*
197*c5ad8142SEric van Gyzen 		 * We're currently nominal.  If the new state is non-nominal,
198*c5ad8142SEric van Gyzen 		 * great; we take ourselves off the list and just enter the new
199*c5ad8142SEric van Gyzen 		 * state.
200*c5ad8142SEric van Gyzen 		 */
201*c5ad8142SEric van Gyzen 		assert(tsd_in_nominal_list(tsd));
202*c5ad8142SEric van Gyzen 		if (new_state > tsd_state_nominal_max) {
203*c5ad8142SEric van Gyzen 			tsd_remove_nominal(tsd);
204*c5ad8142SEric van Gyzen 			tsd_atomic_store(&tsd->state, new_state,
205*c5ad8142SEric van Gyzen 			    ATOMIC_RELAXED);
206*c5ad8142SEric van Gyzen 		} else {
207*c5ad8142SEric van Gyzen 			/*
208*c5ad8142SEric van Gyzen 			 * This is the tricky case.  We're transitioning from
209*c5ad8142SEric van Gyzen 			 * one nominal state to another.  The caller can't know
210*c5ad8142SEric van Gyzen 			 * about any races that are occuring at the same time,
211*c5ad8142SEric van Gyzen 			 * so we always have to recompute no matter what.
212*c5ad8142SEric van Gyzen 			 */
213*c5ad8142SEric van Gyzen 			tsd_slow_update(tsd);
214b7eaed25SJason Evans 		}
215b7eaed25SJason Evans 	}
216b7eaed25SJason Evans }
217b7eaed25SJason Evans 
218b7eaed25SJason Evans static bool
tsd_data_init(tsd_t * tsd)219b7eaed25SJason Evans tsd_data_init(tsd_t *tsd) {
220b7eaed25SJason Evans 	/*
221b7eaed25SJason Evans 	 * We initialize the rtree context first (before the tcache), since the
222b7eaed25SJason Evans 	 * tcache initialization depends on it.
223b7eaed25SJason Evans 	 */
224b7eaed25SJason Evans 	rtree_ctx_data_init(tsd_rtree_ctxp_get_unsafe(tsd));
225b7eaed25SJason Evans 
2260ef50b4eSJason Evans 	/*
2270ef50b4eSJason Evans 	 * A nondeterministic seed based on the address of tsd reduces
2280ef50b4eSJason Evans 	 * the likelihood of lockstep non-uniform cache index
2290ef50b4eSJason Evans 	 * utilization among identical concurrent processes, but at the
2300ef50b4eSJason Evans 	 * cost of test repeatability.  For debug builds, instead use a
2310ef50b4eSJason Evans 	 * deterministic seed.
2320ef50b4eSJason Evans 	 */
2330ef50b4eSJason Evans 	*tsd_offset_statep_get(tsd) = config_debug ? 0 :
2340ef50b4eSJason Evans 	    (uint64_t)(uintptr_t)tsd;
2350ef50b4eSJason Evans 
236b7eaed25SJason Evans 	return tsd_tcache_enabled_data_init(tsd);
237b7eaed25SJason Evans }
238b7eaed25SJason Evans 
239b7eaed25SJason Evans static void
assert_tsd_data_cleanup_done(tsd_t * tsd)240b7eaed25SJason Evans assert_tsd_data_cleanup_done(tsd_t *tsd) {
241b7eaed25SJason Evans 	assert(!tsd_nominal(tsd));
242*c5ad8142SEric van Gyzen 	assert(!tsd_in_nominal_list(tsd));
243b7eaed25SJason Evans 	assert(*tsd_arenap_get_unsafe(tsd) == NULL);
244b7eaed25SJason Evans 	assert(*tsd_iarenap_get_unsafe(tsd) == NULL);
245b7eaed25SJason Evans 	assert(*tsd_arenas_tdata_bypassp_get_unsafe(tsd) == true);
246b7eaed25SJason Evans 	assert(*tsd_arenas_tdatap_get_unsafe(tsd) == NULL);
247b7eaed25SJason Evans 	assert(*tsd_tcache_enabledp_get_unsafe(tsd) == false);
248b7eaed25SJason Evans 	assert(*tsd_prof_tdatap_get_unsafe(tsd) == NULL);
249b7eaed25SJason Evans }
250b7eaed25SJason Evans 
251b7eaed25SJason Evans static bool
tsd_data_init_nocleanup(tsd_t * tsd)252b7eaed25SJason Evans tsd_data_init_nocleanup(tsd_t *tsd) {
253*c5ad8142SEric van Gyzen 	assert(tsd_state_get(tsd) == tsd_state_reincarnated ||
254*c5ad8142SEric van Gyzen 	    tsd_state_get(tsd) == tsd_state_minimal_initialized);
255b7eaed25SJason Evans 	/*
256b7eaed25SJason Evans 	 * During reincarnation, there is no guarantee that the cleanup function
257b7eaed25SJason Evans 	 * will be called (deallocation may happen after all tsd destructors).
258b7eaed25SJason Evans 	 * We set up tsd in a way that no cleanup is needed.
259b7eaed25SJason Evans 	 */
260b7eaed25SJason Evans 	rtree_ctx_data_init(tsd_rtree_ctxp_get_unsafe(tsd));
261b7eaed25SJason Evans 	*tsd_arenas_tdata_bypassp_get(tsd) = true;
262b7eaed25SJason Evans 	*tsd_tcache_enabledp_get_unsafe(tsd) = false;
263b7eaed25SJason Evans 	*tsd_reentrancy_levelp_get(tsd) = 1;
264b7eaed25SJason Evans 	assert_tsd_data_cleanup_done(tsd);
265b7eaed25SJason Evans 
266b7eaed25SJason Evans 	return false;
267b7eaed25SJason Evans }
268b7eaed25SJason Evans 
269b7eaed25SJason Evans tsd_t *
tsd_fetch_slow(tsd_t * tsd,bool minimal)2708b2f5aafSJason Evans tsd_fetch_slow(tsd_t *tsd, bool minimal) {
2718b2f5aafSJason Evans 	assert(!tsd_fast(tsd));
272b7eaed25SJason Evans 
273*c5ad8142SEric van Gyzen 	if (tsd_state_get(tsd) == tsd_state_nominal_slow) {
274*c5ad8142SEric van Gyzen 		/*
275*c5ad8142SEric van Gyzen 		 * On slow path but no work needed.  Note that we can't
276*c5ad8142SEric van Gyzen 		 * necessarily *assert* that we're slow, because we might be
277*c5ad8142SEric van Gyzen 		 * slow because of an asynchronous modification to global state,
278*c5ad8142SEric van Gyzen 		 * which might be asynchronously modified *back*.
279*c5ad8142SEric van Gyzen 		 */
280*c5ad8142SEric van Gyzen 	} else if (tsd_state_get(tsd) == tsd_state_nominal_recompute) {
281*c5ad8142SEric van Gyzen 		tsd_slow_update(tsd);
282*c5ad8142SEric van Gyzen 	} else if (tsd_state_get(tsd) == tsd_state_uninitialized) {
2838b2f5aafSJason Evans 		if (!minimal) {
284*c5ad8142SEric van Gyzen 			if (tsd_booted) {
285*c5ad8142SEric van Gyzen 				tsd_state_set(tsd, tsd_state_nominal);
286b7eaed25SJason Evans 				tsd_slow_update(tsd);
287b7eaed25SJason Evans 				/* Trigger cleanup handler registration. */
288b7eaed25SJason Evans 				tsd_set(tsd);
289b7eaed25SJason Evans 				tsd_data_init(tsd);
290*c5ad8142SEric van Gyzen 			}
2918b2f5aafSJason Evans 		} else {
292*c5ad8142SEric van Gyzen 			tsd_state_set(tsd, tsd_state_minimal_initialized);
2938b2f5aafSJason Evans 			tsd_set(tsd);
2948b2f5aafSJason Evans 			tsd_data_init_nocleanup(tsd);
2958b2f5aafSJason Evans 		}
296*c5ad8142SEric van Gyzen 	} else if (tsd_state_get(tsd) == tsd_state_minimal_initialized) {
2978b2f5aafSJason Evans 		if (!minimal) {
2988b2f5aafSJason Evans 			/* Switch to fully initialized. */
299*c5ad8142SEric van Gyzen 			tsd_state_set(tsd, tsd_state_nominal);
3008b2f5aafSJason Evans 			assert(*tsd_reentrancy_levelp_get(tsd) >= 1);
3018b2f5aafSJason Evans 			(*tsd_reentrancy_levelp_get(tsd))--;
3028b2f5aafSJason Evans 			tsd_slow_update(tsd);
3038b2f5aafSJason Evans 			tsd_data_init(tsd);
3048b2f5aafSJason Evans 		} else {
3058b2f5aafSJason Evans 			assert_tsd_data_cleanup_done(tsd);
3068b2f5aafSJason Evans 		}
307*c5ad8142SEric van Gyzen 	} else if (tsd_state_get(tsd) == tsd_state_purgatory) {
308*c5ad8142SEric van Gyzen 		tsd_state_set(tsd, tsd_state_reincarnated);
309b7eaed25SJason Evans 		tsd_set(tsd);
310b7eaed25SJason Evans 		tsd_data_init_nocleanup(tsd);
311b7eaed25SJason Evans 	} else {
312*c5ad8142SEric van Gyzen 		assert(tsd_state_get(tsd) == tsd_state_reincarnated);
313b7eaed25SJason Evans 	}
314b7eaed25SJason Evans 
315b7eaed25SJason Evans 	return tsd;
316b7eaed25SJason Evans }
317b7eaed25SJason Evans 
/*
 * Allocate size bytes, rounded up with CACHELINE_CEILING(), through
 * a0malloc().
 */
void *
malloc_tsd_malloc(size_t size) {
	size_t padded = CACHELINE_CEILING(size);

	return a0malloc(padded);
}
322a4bd5210SJason Evans 
/* Hand wrapper back through a0dalloc(). */
void
malloc_tsd_dalloc(void *wrapper)
{
	a0dalloc(wrapper);
}
327a4bd5210SJason Evans 
#if defined(JEMALLOC_MALLOC_THREAD_CLEANUP) || defined(_WIN32)
#ifndef _WIN32
JEMALLOC_EXPORT
#endif
/*
 * Run the registered cleanup callbacks.
 *
 * Each callback reports whether it wants to be called again.  Passes over the
 * callbacks are repeated, skipping those that already reported false, until
 * no callback asks for another round.
 */
void
_malloc_thread_cleanup(void) {
	bool pending[MALLOC_TSD_CLEANUPS_MAX];
	bool another_pass;
	unsigned idx;

	for (idx = 0; idx < ncleanups; idx++) {
		pending[idx] = true;
	}

	do {
		another_pass = false;
		for (idx = 0; idx < ncleanups; idx++) {
			if (!pending[idx]) {
				continue;
			}
			pending[idx] = cleanups[idx]();
			if (pending[idx]) {
				another_pass = true;
			}
		}
	} while (another_pass);
}
#endif
354a4bd5210SJason Evans 
355a4bd5210SJason Evans void
malloc_tsd_cleanup_register(bool (* f)(void))356b7eaed25SJason Evans malloc_tsd_cleanup_register(bool (*f)(void)) {
357a4bd5210SJason Evans 	assert(ncleanups < MALLOC_TSD_CLEANUPS_MAX);
3588ed34ab0SJason Evans 	cleanups[ncleanups] = f;
359a4bd5210SJason Evans 	ncleanups++;
360a4bd5210SJason Evans }
361a4bd5210SJason Evans 
362b7eaed25SJason Evans static void
tsd_do_data_cleanup(tsd_t * tsd)363b7eaed25SJason Evans tsd_do_data_cleanup(tsd_t *tsd) {
364b7eaed25SJason Evans 	prof_tdata_cleanup(tsd);
365b7eaed25SJason Evans 	iarena_cleanup(tsd);
366b7eaed25SJason Evans 	arena_cleanup(tsd);
367b7eaed25SJason Evans 	arenas_tdata_cleanup(tsd);
368b7eaed25SJason Evans 	tcache_cleanup(tsd);
369b7eaed25SJason Evans 	witnesses_cleanup(tsd_witness_tsdp_get_unsafe(tsd));
370b7eaed25SJason Evans }
371b7eaed25SJason Evans 
372a4bd5210SJason Evans void
tsd_cleanup(void * arg)373b7eaed25SJason Evans tsd_cleanup(void *arg) {
374d0e79aa3SJason Evans 	tsd_t *tsd = (tsd_t *)arg;
375d0e79aa3SJason Evans 
376*c5ad8142SEric van Gyzen 	switch (tsd_state_get(tsd)) {
377ba4f5cc0SJason Evans 	case tsd_state_uninitialized:
378ba4f5cc0SJason Evans 		/* Do nothing. */
379ba4f5cc0SJason Evans 		break;
3808b2f5aafSJason Evans 	case tsd_state_minimal_initialized:
3818b2f5aafSJason Evans 		/* This implies the thread only did free() in its life time. */
3828b2f5aafSJason Evans 		/* Fall through. */
383b7eaed25SJason Evans 	case tsd_state_reincarnated:
384b7eaed25SJason Evans 		/*
385b7eaed25SJason Evans 		 * Reincarnated means another destructor deallocated memory
386b7eaed25SJason Evans 		 * after the destructor was called.  Cleanup isn't required but
387b7eaed25SJason Evans 		 * is still called for testing and completeness.
388b7eaed25SJason Evans 		 */
389b7eaed25SJason Evans 		assert_tsd_data_cleanup_done(tsd);
390b7eaed25SJason Evans 		/* Fall through. */
391d0e79aa3SJason Evans 	case tsd_state_nominal:
392b7eaed25SJason Evans 	case tsd_state_nominal_slow:
393b7eaed25SJason Evans 		tsd_do_data_cleanup(tsd);
394*c5ad8142SEric van Gyzen 		tsd_state_set(tsd, tsd_state_purgatory);
395d0e79aa3SJason Evans 		tsd_set(tsd);
396d0e79aa3SJason Evans 		break;
397d0e79aa3SJason Evans 	case tsd_state_purgatory:
398d0e79aa3SJason Evans 		/*
399d0e79aa3SJason Evans 		 * The previous time this destructor was called, we set the
400d0e79aa3SJason Evans 		 * state to tsd_state_purgatory so that other destructors
401d0e79aa3SJason Evans 		 * wouldn't cause re-creation of the tsd.  This time, do
402d0e79aa3SJason Evans 		 * nothing, and do not request another callback.
403d0e79aa3SJason Evans 		 */
404d0e79aa3SJason Evans 		break;
405d0e79aa3SJason Evans 	default:
406d0e79aa3SJason Evans 		not_reached();
407d0e79aa3SJason Evans 	}
408b7eaed25SJason Evans #ifdef JEMALLOC_JET
409b7eaed25SJason Evans 	test_callback_t test_callback = *tsd_test_callbackp_get_unsafe(tsd);
410b7eaed25SJason Evans 	int *data = tsd_test_datap_get_unsafe(tsd);
411b7eaed25SJason Evans 	if (test_callback != NULL) {
412b7eaed25SJason Evans 		test_callback(data);
413b7eaed25SJason Evans 	}
414b7eaed25SJason Evans #endif
415d0e79aa3SJason Evans }
416d0e79aa3SJason Evans 
4171f0a49e8SJason Evans tsd_t *
malloc_tsd_boot0(void)418b7eaed25SJason Evans malloc_tsd_boot0(void) {
4191f0a49e8SJason Evans 	tsd_t *tsd;
420a4bd5210SJason Evans 
421a4bd5210SJason Evans 	ncleanups = 0;
422*c5ad8142SEric van Gyzen 	if (malloc_mutex_init(&tsd_nominal_tsds_lock, "tsd_nominal_tsds_lock",
423*c5ad8142SEric van Gyzen 	    WITNESS_RANK_OMIT, malloc_mutex_rank_exclusive)) {
424*c5ad8142SEric van Gyzen 		return NULL;
425*c5ad8142SEric van Gyzen 	}
426b7eaed25SJason Evans 	if (tsd_boot0()) {
427b7eaed25SJason Evans 		return NULL;
428b7eaed25SJason Evans 	}
4291f0a49e8SJason Evans 	tsd = tsd_fetch();
4301f0a49e8SJason Evans 	*tsd_arenas_tdata_bypassp_get(tsd) = true;
431b7eaed25SJason Evans 	return tsd;
432d0e79aa3SJason Evans }
433d0e79aa3SJason Evans 
434d0e79aa3SJason Evans void
malloc_tsd_boot1(void)435b7eaed25SJason Evans malloc_tsd_boot1(void) {
436d0e79aa3SJason Evans 	tsd_boot1();
437b7eaed25SJason Evans 	tsd_t *tsd = tsd_fetch();
438b7eaed25SJason Evans 	/* malloc_slow has been set properly.  Update tsd_slow. */
439b7eaed25SJason Evans 	tsd_slow_update(tsd);
440b7eaed25SJason Evans 	*tsd_arenas_tdata_bypassp_get(tsd) = false;
441a4bd5210SJason Evans }
442e722f8f8SJason Evans 
443e722f8f8SJason Evans #ifdef _WIN32
444e722f8f8SJason Evans static BOOL WINAPI
_tls_callback(HINSTANCE hinstDLL,DWORD fdwReason,LPVOID lpvReserved)445b7eaed25SJason Evans _tls_callback(HINSTANCE hinstDLL, DWORD fdwReason, LPVOID lpvReserved) {
446e722f8f8SJason Evans 	switch (fdwReason) {
447e722f8f8SJason Evans #ifdef JEMALLOC_LAZY_LOCK
448e722f8f8SJason Evans 	case DLL_THREAD_ATTACH:
449e722f8f8SJason Evans 		isthreaded = true;
450e722f8f8SJason Evans 		break;
451e722f8f8SJason Evans #endif
452e722f8f8SJason Evans 	case DLL_THREAD_DETACH:
453e722f8f8SJason Evans 		_malloc_thread_cleanup();
454e722f8f8SJason Evans 		break;
455e722f8f8SJason Evans 	default:
456e722f8f8SJason Evans 		break;
457e722f8f8SJason Evans 	}
458b7eaed25SJason Evans 	return true;
459e722f8f8SJason Evans }
460e722f8f8SJason Evans 
461b7eaed25SJason Evans /*
462b7eaed25SJason Evans  * We need to be able to say "read" here (in the "pragma section"), but have
463b7eaed25SJason Evans  * hooked "read". We won't read for the rest of the file, so we can get away
464b7eaed25SJason Evans  * with unhooking.
465b7eaed25SJason Evans  */
466b7eaed25SJason Evans #ifdef read
467b7eaed25SJason Evans #  undef read
468b7eaed25SJason Evans #endif
469b7eaed25SJason Evans 
470e722f8f8SJason Evans #ifdef _MSC_VER
471e722f8f8SJason Evans #  ifdef _M_IX86
472e722f8f8SJason Evans #    pragma comment(linker, "/INCLUDE:__tls_used")
473df0d881dSJason Evans #    pragma comment(linker, "/INCLUDE:_tls_callback")
474e722f8f8SJason Evans #  else
475e722f8f8SJason Evans #    pragma comment(linker, "/INCLUDE:_tls_used")
476*c5ad8142SEric van Gyzen #    pragma comment(linker, "/INCLUDE:" STRINGIFY(tls_callback) )
477e722f8f8SJason Evans #  endif
478e722f8f8SJason Evans #  pragma section(".CRT$XLY",long,read)
479e722f8f8SJason Evans #endif
480e722f8f8SJason Evans JEMALLOC_SECTION(".CRT$XLY") JEMALLOC_ATTR(used)
481df0d881dSJason Evans BOOL	(WINAPI *const tls_callback)(HINSTANCE hinstDLL,
482e722f8f8SJason Evans     DWORD fdwReason, LPVOID lpvReserved) = _tls_callback;
483e722f8f8SJason Evans #endif
484f921d10fSJason Evans 
485f921d10fSJason Evans #if (!defined(JEMALLOC_MALLOC_THREAD_CLEANUP) && !defined(JEMALLOC_TLS) && \
486f921d10fSJason Evans     !defined(_WIN32))
487f921d10fSJason Evans void *
tsd_init_check_recursion(tsd_init_head_t * head,tsd_init_block_t * block)488b7eaed25SJason Evans tsd_init_check_recursion(tsd_init_head_t *head, tsd_init_block_t *block) {
489f921d10fSJason Evans 	pthread_t self = pthread_self();
490f921d10fSJason Evans 	tsd_init_block_t *iter;
491f921d10fSJason Evans 
492f921d10fSJason Evans 	/* Check whether this thread has already inserted into the list. */
493bde95144SJason Evans 	malloc_mutex_lock(TSDN_NULL, &head->lock);
494f921d10fSJason Evans 	ql_foreach(iter, &head->blocks, link) {
495f921d10fSJason Evans 		if (iter->thread == self) {
496bde95144SJason Evans 			malloc_mutex_unlock(TSDN_NULL, &head->lock);
497b7eaed25SJason Evans 			return iter->data;
498f921d10fSJason Evans 		}
499f921d10fSJason Evans 	}
500f921d10fSJason Evans 	/* Insert block into list. */
501f921d10fSJason Evans 	ql_elm_new(block, link);
502f921d10fSJason Evans 	block->thread = self;
503f921d10fSJason Evans 	ql_tail_insert(&head->blocks, block, link);
504bde95144SJason Evans 	malloc_mutex_unlock(TSDN_NULL, &head->lock);
505b7eaed25SJason Evans 	return NULL;
506f921d10fSJason Evans }
507f921d10fSJason Evans 
508f921d10fSJason Evans void
tsd_init_finish(tsd_init_head_t * head,tsd_init_block_t * block)509b7eaed25SJason Evans tsd_init_finish(tsd_init_head_t *head, tsd_init_block_t *block) {
510bde95144SJason Evans 	malloc_mutex_lock(TSDN_NULL, &head->lock);
511f921d10fSJason Evans 	ql_remove(&head->blocks, block, link);
512bde95144SJason Evans 	malloc_mutex_unlock(TSDN_NULL, &head->lock);
513f921d10fSJason Evans }
514f921d10fSJason Evans #endif
515*c5ad8142SEric van Gyzen 
516*c5ad8142SEric van Gyzen void
tsd_prefork(tsd_t * tsd)517*c5ad8142SEric van Gyzen tsd_prefork(tsd_t *tsd) {
518*c5ad8142SEric van Gyzen 	malloc_mutex_prefork(tsd_tsdn(tsd), &tsd_nominal_tsds_lock);
519*c5ad8142SEric van Gyzen }
520*c5ad8142SEric van Gyzen 
521*c5ad8142SEric van Gyzen void
tsd_postfork_parent(tsd_t * tsd)522*c5ad8142SEric van Gyzen tsd_postfork_parent(tsd_t *tsd) {
523*c5ad8142SEric van Gyzen 	malloc_mutex_postfork_parent(tsd_tsdn(tsd), &tsd_nominal_tsds_lock);
524*c5ad8142SEric van Gyzen }
525*c5ad8142SEric van Gyzen 
526*c5ad8142SEric van Gyzen void
tsd_postfork_child(tsd_t * tsd)527*c5ad8142SEric van Gyzen tsd_postfork_child(tsd_t *tsd) {
528*c5ad8142SEric van Gyzen 	malloc_mutex_postfork_child(tsd_tsdn(tsd), &tsd_nominal_tsds_lock);
529*c5ad8142SEric van Gyzen 	ql_new(&tsd_nominal_tsds);
530*c5ad8142SEric van Gyzen 
531*c5ad8142SEric van Gyzen 	if (tsd_state_get(tsd) <= tsd_state_nominal_max) {
532*c5ad8142SEric van Gyzen 		tsd_add_nominal(tsd);
533*c5ad8142SEric van Gyzen 	}
534*c5ad8142SEric van Gyzen }
535