xref: /llvm-project/compiler-rt/lib/tsan/benchmarks/start_many_threads.cpp (revision d11b16e1fef5886c73a7a6701b6e0264ae6b44d4)
// Mini-benchmark for creating a lot of threads.
//
// Some facts:
// a) clang -O1 takes <15ms to start N=500 threads,
//    consuming ~4MB more RAM than N=1.
// b) clang -O1 -ftsan takes ~26s to start N=500 threads,
//    eats 5GB more RAM than N=1 (which is somewhat expected but still a lot)
//    but then it consumes ~4GB of extra memory when the threads shut down!
//        (definitely not in the barrier_wait interceptor)
//    Also, it takes 26s to run with N=500 vs just 1.1s to run with N=1.
#include <assert.h>
#include <limits.h>
#include <pthread.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <unistd.h>
16*d11b16e1SNico Weber 
// Barrier shared by main() and every worker thread; main() initializes it
// before any worker is created.
pthread_barrier_t all_threads_ready;

// Worker entry point: blocks on all_threads_ready and finishes as soon as the
// barrier releases. The argument is ignored and the result is always null.
void *Thread(void *unused) {
  (void)unused;  // Nothing is read from the argument.
  pthread_barrier_wait(&all_threads_ready);
  return NULL;
}
23*d11b16e1SNico Weber 
main(int argc,char ** argv)24*d11b16e1SNico Weber int main(int argc, char **argv) {
25*d11b16e1SNico Weber   int n_threads;
26*d11b16e1SNico Weber   if (argc == 1) {
27*d11b16e1SNico Weber     n_threads = 100;
28*d11b16e1SNico Weber   } else if (argc == 2) {
29*d11b16e1SNico Weber     n_threads = atoi(argv[1]);
30*d11b16e1SNico Weber   } else {
31*d11b16e1SNico Weber     printf("Usage: %s n_threads\n", argv[0]);
32*d11b16e1SNico Weber     return 1;
33*d11b16e1SNico Weber   }
34*d11b16e1SNico Weber   printf("%s: n_threads=%d\n", __FILE__, n_threads);
35*d11b16e1SNico Weber 
36*d11b16e1SNico Weber   pthread_barrier_init(&all_threads_ready, NULL, n_threads + 1);
37*d11b16e1SNico Weber 
38*d11b16e1SNico Weber   pthread_t *t = new pthread_t[n_threads];
39*d11b16e1SNico Weber   for (int i = 0; i < n_threads; i++) {
40*d11b16e1SNico Weber     int status = pthread_create(&t[i], 0, Thread, (void*)i);
41*d11b16e1SNico Weber     assert(status == 0);
42*d11b16e1SNico Weber   }
43*d11b16e1SNico Weber   // sleep(5);  // FIXME: simplify measuring the memory usage.
44*d11b16e1SNico Weber   pthread_barrier_wait(&all_threads_ready);
45*d11b16e1SNico Weber   for (int i = 0; i < n_threads; i++) {
46*d11b16e1SNico Weber     pthread_join(t[i], 0);
47*d11b16e1SNico Weber   }
48*d11b16e1SNico Weber   // sleep(5);  // FIXME: simplify measuring the memory usage.
49*d11b16e1SNico Weber   delete [] t;
50*d11b16e1SNico Weber 
51*d11b16e1SNico Weber   return 0;
52*d11b16e1SNico Weber }
53