1*ff6d591cSmrg //===-- tsan_platform_mac.cpp ---------------------------------------------===//
2*ff6d591cSmrg //
3*ff6d591cSmrg // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4*ff6d591cSmrg // See https://llvm.org/LICENSE.txt for license information.
5*ff6d591cSmrg // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6*ff6d591cSmrg //
7*ff6d591cSmrg //===----------------------------------------------------------------------===//
8*ff6d591cSmrg //
9*ff6d591cSmrg // This file is a part of ThreadSanitizer (TSan), a race detector.
10*ff6d591cSmrg //
11*ff6d591cSmrg // Mac-specific code.
12*ff6d591cSmrg //===----------------------------------------------------------------------===//
13*ff6d591cSmrg
14*ff6d591cSmrg #include "sanitizer_common/sanitizer_platform.h"
15*ff6d591cSmrg #if SANITIZER_MAC
16*ff6d591cSmrg
17*ff6d591cSmrg #include "sanitizer_common/sanitizer_atomic.h"
18*ff6d591cSmrg #include "sanitizer_common/sanitizer_common.h"
19*ff6d591cSmrg #include "sanitizer_common/sanitizer_libc.h"
20*ff6d591cSmrg #include "sanitizer_common/sanitizer_posix.h"
21*ff6d591cSmrg #include "sanitizer_common/sanitizer_procmaps.h"
22*ff6d591cSmrg #include "sanitizer_common/sanitizer_ptrauth.h"
23*ff6d591cSmrg #include "sanitizer_common/sanitizer_stackdepot.h"
24*ff6d591cSmrg #include "tsan_platform.h"
25*ff6d591cSmrg #include "tsan_rtl.h"
26*ff6d591cSmrg #include "tsan_flags.h"
27*ff6d591cSmrg
28*ff6d591cSmrg #include <mach/mach.h>
29*ff6d591cSmrg #include <pthread.h>
30*ff6d591cSmrg #include <signal.h>
31*ff6d591cSmrg #include <stdio.h>
32*ff6d591cSmrg #include <stdlib.h>
33*ff6d591cSmrg #include <string.h>
34*ff6d591cSmrg #include <stdarg.h>
35*ff6d591cSmrg #include <sys/mman.h>
36*ff6d591cSmrg #include <sys/syscall.h>
37*ff6d591cSmrg #include <sys/time.h>
38*ff6d591cSmrg #include <sys/types.h>
39*ff6d591cSmrg #include <sys/resource.h>
40*ff6d591cSmrg #include <sys/stat.h>
41*ff6d591cSmrg #include <unistd.h>
42*ff6d591cSmrg #include <errno.h>
43*ff6d591cSmrg #include <sched.h>
44*ff6d591cSmrg
45*ff6d591cSmrg namespace __tsan {
46*ff6d591cSmrg
47*ff6d591cSmrg #if !SANITIZER_GO
SignalSafeGetOrAllocate(uptr * dst,uptr size)48*ff6d591cSmrg static void *SignalSafeGetOrAllocate(uptr *dst, uptr size) {
49*ff6d591cSmrg atomic_uintptr_t *a = (atomic_uintptr_t *)dst;
50*ff6d591cSmrg void *val = (void *)atomic_load_relaxed(a);
51*ff6d591cSmrg atomic_signal_fence(memory_order_acquire); // Turns the previous load into
52*ff6d591cSmrg // acquire wrt signals.
53*ff6d591cSmrg if (UNLIKELY(val == nullptr)) {
54*ff6d591cSmrg val = (void *)internal_mmap(nullptr, size, PROT_READ | PROT_WRITE,
55*ff6d591cSmrg MAP_PRIVATE | MAP_ANON, -1, 0);
56*ff6d591cSmrg CHECK(val);
57*ff6d591cSmrg void *cmp = nullptr;
58*ff6d591cSmrg if (!atomic_compare_exchange_strong(a, (uintptr_t *)&cmp, (uintptr_t)val,
59*ff6d591cSmrg memory_order_acq_rel)) {
60*ff6d591cSmrg internal_munmap(val, size);
61*ff6d591cSmrg val = cmp;
62*ff6d591cSmrg }
63*ff6d591cSmrg }
64*ff6d591cSmrg return val;
65*ff6d591cSmrg }
66*ff6d591cSmrg
67*ff6d591cSmrg // On OS X, accessing TLVs via __thread or manually by using pthread_key_* is
68*ff6d591cSmrg // problematic, because there are several places where interceptors are called
69*ff6d591cSmrg // when TLVs are not accessible (early process startup, thread cleanup, ...).
70*ff6d591cSmrg // The following provides a "poor man's TLV" implementation, where we use the
71*ff6d591cSmrg // shadow memory of the pointer returned by pthread_self() to store a pointer to
72*ff6d591cSmrg // the ThreadState object. The main thread's ThreadState is stored separately
73*ff6d591cSmrg // in a static variable, because we need to access it even before the
74*ff6d591cSmrg // shadow memory is set up.
75*ff6d591cSmrg static uptr main_thread_identity = 0;
76*ff6d591cSmrg ALIGNED(64) static char main_thread_state[sizeof(ThreadState)];
77*ff6d591cSmrg static ThreadState *main_thread_state_loc = (ThreadState *)main_thread_state;
78*ff6d591cSmrg
79*ff6d591cSmrg // We cannot use pthread_self() before libpthread has been initialized. Our
80*ff6d591cSmrg // current heuristic for guarding this is checking `main_thread_identity` which
81*ff6d591cSmrg // is only assigned in `__tsan::InitializePlatform`.
cur_thread_location()82*ff6d591cSmrg static ThreadState **cur_thread_location() {
83*ff6d591cSmrg if (main_thread_identity == 0)
84*ff6d591cSmrg return &main_thread_state_loc;
85*ff6d591cSmrg uptr thread_identity = (uptr)pthread_self();
86*ff6d591cSmrg if (thread_identity == main_thread_identity)
87*ff6d591cSmrg return &main_thread_state_loc;
88*ff6d591cSmrg return (ThreadState **)MemToShadow(thread_identity);
89*ff6d591cSmrg }
90*ff6d591cSmrg
cur_thread()91*ff6d591cSmrg ThreadState *cur_thread() {
92*ff6d591cSmrg return (ThreadState *)SignalSafeGetOrAllocate(
93*ff6d591cSmrg (uptr *)cur_thread_location(), sizeof(ThreadState));
94*ff6d591cSmrg }
95*ff6d591cSmrg
set_cur_thread(ThreadState * thr)96*ff6d591cSmrg void set_cur_thread(ThreadState *thr) {
97*ff6d591cSmrg *cur_thread_location() = thr;
98*ff6d591cSmrg }
99*ff6d591cSmrg
100*ff6d591cSmrg // TODO(kuba.brecka): This is not async-signal-safe. In particular, we call
101*ff6d591cSmrg // munmap first and then clear `fake_tls`; if we receive a signal in between,
102*ff6d591cSmrg // handler will try to access the unmapped ThreadState.
cur_thread_finalize()103*ff6d591cSmrg void cur_thread_finalize() {
104*ff6d591cSmrg ThreadState **thr_state_loc = cur_thread_location();
105*ff6d591cSmrg if (thr_state_loc == &main_thread_state_loc) {
106*ff6d591cSmrg // Calling dispatch_main() or xpc_main() actually invokes pthread_exit to
107*ff6d591cSmrg // exit the main thread. Let's keep the main thread's ThreadState.
108*ff6d591cSmrg return;
109*ff6d591cSmrg }
110*ff6d591cSmrg internal_munmap(*thr_state_loc, sizeof(ThreadState));
111*ff6d591cSmrg *thr_state_loc = nullptr;
112*ff6d591cSmrg }
113*ff6d591cSmrg #endif
114*ff6d591cSmrg
FlushShadowMemory()115*ff6d591cSmrg void FlushShadowMemory() {
116*ff6d591cSmrg }
117*ff6d591cSmrg
RegionMemUsage(uptr start,uptr end,uptr * res,uptr * dirty)118*ff6d591cSmrg static void RegionMemUsage(uptr start, uptr end, uptr *res, uptr *dirty) {
119*ff6d591cSmrg vm_address_t address = start;
120*ff6d591cSmrg vm_address_t end_address = end;
121*ff6d591cSmrg uptr resident_pages = 0;
122*ff6d591cSmrg uptr dirty_pages = 0;
123*ff6d591cSmrg while (address < end_address) {
124*ff6d591cSmrg vm_size_t vm_region_size;
125*ff6d591cSmrg mach_msg_type_number_t count = VM_REGION_EXTENDED_INFO_COUNT;
126*ff6d591cSmrg vm_region_extended_info_data_t vm_region_info;
127*ff6d591cSmrg mach_port_t object_name;
128*ff6d591cSmrg kern_return_t ret = vm_region_64(
129*ff6d591cSmrg mach_task_self(), &address, &vm_region_size, VM_REGION_EXTENDED_INFO,
130*ff6d591cSmrg (vm_region_info_t)&vm_region_info, &count, &object_name);
131*ff6d591cSmrg if (ret != KERN_SUCCESS) break;
132*ff6d591cSmrg
133*ff6d591cSmrg resident_pages += vm_region_info.pages_resident;
134*ff6d591cSmrg dirty_pages += vm_region_info.pages_dirtied;
135*ff6d591cSmrg
136*ff6d591cSmrg address += vm_region_size;
137*ff6d591cSmrg }
138*ff6d591cSmrg *res = resident_pages * GetPageSizeCached();
139*ff6d591cSmrg *dirty = dirty_pages * GetPageSizeCached();
140*ff6d591cSmrg }
141*ff6d591cSmrg
WriteMemoryProfile(char * buf,uptr buf_size,u64 uptime_ns)142*ff6d591cSmrg void WriteMemoryProfile(char *buf, uptr buf_size, u64 uptime_ns) {
143*ff6d591cSmrg uptr shadow_res, shadow_dirty;
144*ff6d591cSmrg uptr meta_res, meta_dirty;
145*ff6d591cSmrg uptr trace_res, trace_dirty;
146*ff6d591cSmrg RegionMemUsage(ShadowBeg(), ShadowEnd(), &shadow_res, &shadow_dirty);
147*ff6d591cSmrg RegionMemUsage(MetaShadowBeg(), MetaShadowEnd(), &meta_res, &meta_dirty);
148*ff6d591cSmrg RegionMemUsage(TraceMemBeg(), TraceMemEnd(), &trace_res, &trace_dirty);
149*ff6d591cSmrg
150*ff6d591cSmrg #if !SANITIZER_GO
151*ff6d591cSmrg uptr low_res, low_dirty;
152*ff6d591cSmrg uptr high_res, high_dirty;
153*ff6d591cSmrg uptr heap_res, heap_dirty;
154*ff6d591cSmrg RegionMemUsage(LoAppMemBeg(), LoAppMemEnd(), &low_res, &low_dirty);
155*ff6d591cSmrg RegionMemUsage(HiAppMemBeg(), HiAppMemEnd(), &high_res, &high_dirty);
156*ff6d591cSmrg RegionMemUsage(HeapMemBeg(), HeapMemEnd(), &heap_res, &heap_dirty);
157*ff6d591cSmrg #else // !SANITIZER_GO
158*ff6d591cSmrg uptr app_res, app_dirty;
159*ff6d591cSmrg RegionMemUsage(LoAppMemBeg(), LoAppMemEnd(), &app_res, &app_dirty);
160*ff6d591cSmrg #endif
161*ff6d591cSmrg
162*ff6d591cSmrg StackDepotStats stacks = StackDepotGetStats();
163*ff6d591cSmrg uptr nthread, nlive;
164*ff6d591cSmrg ctx->thread_registry.GetNumberOfThreads(&nthread, &nlive);
165*ff6d591cSmrg internal_snprintf(
166*ff6d591cSmrg buf, buf_size,
167*ff6d591cSmrg "shadow (0x%016zx-0x%016zx): resident %zd kB, dirty %zd kB\n"
168*ff6d591cSmrg "meta (0x%016zx-0x%016zx): resident %zd kB, dirty %zd kB\n"
169*ff6d591cSmrg "traces (0x%016zx-0x%016zx): resident %zd kB, dirty %zd kB\n"
170*ff6d591cSmrg # if !SANITIZER_GO
171*ff6d591cSmrg "low app (0x%016zx-0x%016zx): resident %zd kB, dirty %zd kB\n"
172*ff6d591cSmrg "high app (0x%016zx-0x%016zx): resident %zd kB, dirty %zd kB\n"
173*ff6d591cSmrg "heap (0x%016zx-0x%016zx): resident %zd kB, dirty %zd kB\n"
174*ff6d591cSmrg # else // !SANITIZER_GO
175*ff6d591cSmrg "app (0x%016zx-0x%016zx): resident %zd kB, dirty %zd kB\n"
176*ff6d591cSmrg # endif
177*ff6d591cSmrg "stacks: %zd unique IDs, %zd kB allocated\n"
178*ff6d591cSmrg "threads: %zd total, %zd live\n"
179*ff6d591cSmrg "------------------------------\n",
180*ff6d591cSmrg ShadowBeg(), ShadowEnd(), shadow_res / 1024, shadow_dirty / 1024,
181*ff6d591cSmrg MetaShadowBeg(), MetaShadowEnd(), meta_res / 1024, meta_dirty / 1024,
182*ff6d591cSmrg TraceMemBeg(), TraceMemEnd(), trace_res / 1024, trace_dirty / 1024,
183*ff6d591cSmrg # if !SANITIZER_GO
184*ff6d591cSmrg LoAppMemBeg(), LoAppMemEnd(), low_res / 1024, low_dirty / 1024,
185*ff6d591cSmrg HiAppMemBeg(), HiAppMemEnd(), high_res / 1024, high_dirty / 1024,
186*ff6d591cSmrg HeapMemBeg(), HeapMemEnd(), heap_res / 1024, heap_dirty / 1024,
187*ff6d591cSmrg # else // !SANITIZER_GO
188*ff6d591cSmrg LoAppMemBeg(), LoAppMemEnd(), app_res / 1024, app_dirty / 1024,
189*ff6d591cSmrg # endif
190*ff6d591cSmrg stacks.n_uniq_ids, stacks.allocated / 1024, nthread, nlive);
191*ff6d591cSmrg }
192*ff6d591cSmrg
193*ff6d591cSmrg # if !SANITIZER_GO
InitializeShadowMemoryPlatform()194*ff6d591cSmrg void InitializeShadowMemoryPlatform() { }
195*ff6d591cSmrg
196*ff6d591cSmrg // On OS X, GCD worker threads are created without a call to pthread_create. We
197*ff6d591cSmrg // need to properly register these threads with ThreadCreate and ThreadStart.
198*ff6d591cSmrg // These threads don't have a parent thread, as they are created "spuriously".
199*ff6d591cSmrg // We're using a libpthread API that notifies us about a newly created thread.
200*ff6d591cSmrg // The `thread == pthread_self()` check indicates this is actually a worker
201*ff6d591cSmrg // thread. If it's just a regular thread, this hook is called on the parent
202*ff6d591cSmrg // thread.
203*ff6d591cSmrg typedef void (*pthread_introspection_hook_t)(unsigned int event,
204*ff6d591cSmrg pthread_t thread, void *addr,
205*ff6d591cSmrg size_t size);
206*ff6d591cSmrg extern "C" pthread_introspection_hook_t pthread_introspection_hook_install(
207*ff6d591cSmrg pthread_introspection_hook_t hook);
208*ff6d591cSmrg static const uptr PTHREAD_INTROSPECTION_THREAD_CREATE = 1;
209*ff6d591cSmrg static const uptr PTHREAD_INTROSPECTION_THREAD_TERMINATE = 3;
210*ff6d591cSmrg static pthread_introspection_hook_t prev_pthread_introspection_hook;
my_pthread_introspection_hook(unsigned int event,pthread_t thread,void * addr,size_t size)211*ff6d591cSmrg static void my_pthread_introspection_hook(unsigned int event, pthread_t thread,
212*ff6d591cSmrg void *addr, size_t size) {
213*ff6d591cSmrg if (event == PTHREAD_INTROSPECTION_THREAD_CREATE) {
214*ff6d591cSmrg if (thread == pthread_self()) {
215*ff6d591cSmrg // The current thread is a newly created GCD worker thread.
216*ff6d591cSmrg ThreadState *thr = cur_thread();
217*ff6d591cSmrg Processor *proc = ProcCreate();
218*ff6d591cSmrg ProcWire(proc, thr);
219*ff6d591cSmrg ThreadState *parent_thread_state = nullptr; // No parent.
220*ff6d591cSmrg Tid tid = ThreadCreate(parent_thread_state, 0, (uptr)thread, true);
221*ff6d591cSmrg CHECK_NE(tid, kMainTid);
222*ff6d591cSmrg ThreadStart(thr, tid, GetTid(), ThreadType::Worker);
223*ff6d591cSmrg }
224*ff6d591cSmrg } else if (event == PTHREAD_INTROSPECTION_THREAD_TERMINATE) {
225*ff6d591cSmrg if (thread == pthread_self()) {
226*ff6d591cSmrg ThreadState *thr = cur_thread();
227*ff6d591cSmrg if (thr->tctx) {
228*ff6d591cSmrg DestroyThreadState();
229*ff6d591cSmrg }
230*ff6d591cSmrg }
231*ff6d591cSmrg }
232*ff6d591cSmrg
233*ff6d591cSmrg if (prev_pthread_introspection_hook != nullptr)
234*ff6d591cSmrg prev_pthread_introspection_hook(event, thread, addr, size);
235*ff6d591cSmrg }
236*ff6d591cSmrg #endif
237*ff6d591cSmrg
InitializePlatformEarly()238*ff6d591cSmrg void InitializePlatformEarly() {
239*ff6d591cSmrg # if !SANITIZER_GO && SANITIZER_IOS
240*ff6d591cSmrg uptr max_vm = GetMaxUserVirtualAddress() + 1;
241*ff6d591cSmrg if (max_vm != HiAppMemEnd()) {
242*ff6d591cSmrg Printf("ThreadSanitizer: unsupported vm address limit %p, expected %p.\n",
243*ff6d591cSmrg (void *)max_vm, (void *)HiAppMemEnd());
244*ff6d591cSmrg Die();
245*ff6d591cSmrg }
246*ff6d591cSmrg #endif
247*ff6d591cSmrg }
248*ff6d591cSmrg
249*ff6d591cSmrg static uptr longjmp_xor_key = 0;
250*ff6d591cSmrg
InitializePlatform()251*ff6d591cSmrg void InitializePlatform() {
252*ff6d591cSmrg DisableCoreDumperIfNecessary();
253*ff6d591cSmrg #if !SANITIZER_GO
254*ff6d591cSmrg CheckAndProtect();
255*ff6d591cSmrg
256*ff6d591cSmrg CHECK_EQ(main_thread_identity, 0);
257*ff6d591cSmrg main_thread_identity = (uptr)pthread_self();
258*ff6d591cSmrg
259*ff6d591cSmrg prev_pthread_introspection_hook =
260*ff6d591cSmrg pthread_introspection_hook_install(&my_pthread_introspection_hook);
261*ff6d591cSmrg #endif
262*ff6d591cSmrg
263*ff6d591cSmrg if (GetMacosAlignedVersion() >= MacosVersion(10, 14)) {
264*ff6d591cSmrg // Libsystem currently uses a process-global key; this might change.
265*ff6d591cSmrg const unsigned kTLSLongjmpXorKeySlot = 0x7;
266*ff6d591cSmrg longjmp_xor_key = (uptr)pthread_getspecific(kTLSLongjmpXorKeySlot);
267*ff6d591cSmrg }
268*ff6d591cSmrg }
269*ff6d591cSmrg
270*ff6d591cSmrg #ifdef __aarch64__
271*ff6d591cSmrg # define LONG_JMP_SP_ENV_SLOT \
272*ff6d591cSmrg ((GetMacosAlignedVersion() >= MacosVersion(10, 14)) ? 12 : 13)
273*ff6d591cSmrg #else
274*ff6d591cSmrg # define LONG_JMP_SP_ENV_SLOT 2
275*ff6d591cSmrg #endif
276*ff6d591cSmrg
ExtractLongJmpSp(uptr * env)277*ff6d591cSmrg uptr ExtractLongJmpSp(uptr *env) {
278*ff6d591cSmrg uptr mangled_sp = env[LONG_JMP_SP_ENV_SLOT];
279*ff6d591cSmrg uptr sp = mangled_sp ^ longjmp_xor_key;
280*ff6d591cSmrg sp = (uptr)ptrauth_auth_data((void *)sp, ptrauth_key_asdb,
281*ff6d591cSmrg ptrauth_string_discriminator("sp"));
282*ff6d591cSmrg return sp;
283*ff6d591cSmrg }
284*ff6d591cSmrg
285*ff6d591cSmrg #if !SANITIZER_GO
__tsan_tls_initialization()286*ff6d591cSmrg extern "C" void __tsan_tls_initialization() {}
287*ff6d591cSmrg
ImitateTlsWrite(ThreadState * thr,uptr tls_addr,uptr tls_size)288*ff6d591cSmrg void ImitateTlsWrite(ThreadState *thr, uptr tls_addr, uptr tls_size) {
289*ff6d591cSmrg // The pointer to the ThreadState object is stored in the shadow memory
290*ff6d591cSmrg // of the tls.
291*ff6d591cSmrg uptr tls_end = tls_addr + tls_size;
292*ff6d591cSmrg uptr thread_identity = (uptr)pthread_self();
293*ff6d591cSmrg const uptr pc = StackTrace::GetNextInstructionPc(
294*ff6d591cSmrg reinterpret_cast<uptr>(__tsan_tls_initialization));
295*ff6d591cSmrg if (thread_identity == main_thread_identity) {
296*ff6d591cSmrg MemoryRangeImitateWrite(thr, pc, tls_addr, tls_size);
297*ff6d591cSmrg } else {
298*ff6d591cSmrg uptr thr_state_start = thread_identity;
299*ff6d591cSmrg uptr thr_state_end = thr_state_start + sizeof(uptr);
300*ff6d591cSmrg CHECK_GE(thr_state_start, tls_addr);
301*ff6d591cSmrg CHECK_LE(thr_state_start, tls_addr + tls_size);
302*ff6d591cSmrg CHECK_GE(thr_state_end, tls_addr);
303*ff6d591cSmrg CHECK_LE(thr_state_end, tls_addr + tls_size);
304*ff6d591cSmrg MemoryRangeImitateWrite(thr, pc, tls_addr, thr_state_start - tls_addr);
305*ff6d591cSmrg MemoryRangeImitateWrite(thr, pc, thr_state_end, tls_end - thr_state_end);
306*ff6d591cSmrg }
307*ff6d591cSmrg }
308*ff6d591cSmrg #endif
309*ff6d591cSmrg
310*ff6d591cSmrg #if !SANITIZER_GO
311*ff6d591cSmrg // Note: this function runs with async signals enabled,
312*ff6d591cSmrg // so it must not touch any tsan state.
call_pthread_cancel_with_cleanup(int (* fn)(void * arg),void (* cleanup)(void * arg),void * arg)313*ff6d591cSmrg int call_pthread_cancel_with_cleanup(int (*fn)(void *arg),
314*ff6d591cSmrg void (*cleanup)(void *arg), void *arg) {
315*ff6d591cSmrg // pthread_cleanup_push/pop are hardcore macros mess.
316*ff6d591cSmrg // We can't intercept nor call them w/o including pthread.h.
317*ff6d591cSmrg int res;
318*ff6d591cSmrg pthread_cleanup_push(cleanup, arg);
319*ff6d591cSmrg res = fn(arg);
320*ff6d591cSmrg pthread_cleanup_pop(0);
321*ff6d591cSmrg return res;
322*ff6d591cSmrg }
323*ff6d591cSmrg #endif
324*ff6d591cSmrg
325*ff6d591cSmrg } // namespace __tsan
326*ff6d591cSmrg
327*ff6d591cSmrg #endif // SANITIZER_MAC
328