// Mini-benchmark for creating a lot of threads.
//
// Some facts:
// a) clang -O1 takes <15ms to start N=500 threads,
//    consuming ~4MB more RAM than N=1.
// b) clang -O1 -ftsan takes ~26s to start N=500 threads,
//    eats 5GB more RAM than N=1 (which is somewhat expected but still a lot)
//    but then it consumes ~4GB of extra memory when the threads shut down!
//    (definitely not in the barrier_wait interceptor)
//    Also, it takes 26s to run with N=500 vs just 1.1s to run with N=1.
#include <assert.h>
#include <errno.h>
#include <limits.h>
#include <pthread.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <unistd.h>
16*d11b16e1SNico Weber
17*d11b16e1SNico Weber pthread_barrier_t all_threads_ready;
18*d11b16e1SNico Weber
Thread(void * unused)19*d11b16e1SNico Weber void* Thread(void *unused) {
20*d11b16e1SNico Weber pthread_barrier_wait(&all_threads_ready);
21*d11b16e1SNico Weber return 0;
22*d11b16e1SNico Weber }
23*d11b16e1SNico Weber
main(int argc,char ** argv)24*d11b16e1SNico Weber int main(int argc, char **argv) {
25*d11b16e1SNico Weber int n_threads;
26*d11b16e1SNico Weber if (argc == 1) {
27*d11b16e1SNico Weber n_threads = 100;
28*d11b16e1SNico Weber } else if (argc == 2) {
29*d11b16e1SNico Weber n_threads = atoi(argv[1]);
30*d11b16e1SNico Weber } else {
31*d11b16e1SNico Weber printf("Usage: %s n_threads\n", argv[0]);
32*d11b16e1SNico Weber return 1;
33*d11b16e1SNico Weber }
34*d11b16e1SNico Weber printf("%s: n_threads=%d\n", __FILE__, n_threads);
35*d11b16e1SNico Weber
36*d11b16e1SNico Weber pthread_barrier_init(&all_threads_ready, NULL, n_threads + 1);
37*d11b16e1SNico Weber
38*d11b16e1SNico Weber pthread_t *t = new pthread_t[n_threads];
39*d11b16e1SNico Weber for (int i = 0; i < n_threads; i++) {
40*d11b16e1SNico Weber int status = pthread_create(&t[i], 0, Thread, (void*)i);
41*d11b16e1SNico Weber assert(status == 0);
42*d11b16e1SNico Weber }
43*d11b16e1SNico Weber // sleep(5); // FIXME: simplify measuring the memory usage.
44*d11b16e1SNico Weber pthread_barrier_wait(&all_threads_ready);
45*d11b16e1SNico Weber for (int i = 0; i < n_threads; i++) {
46*d11b16e1SNico Weber pthread_join(t[i], 0);
47*d11b16e1SNico Weber }
48*d11b16e1SNico Weber // sleep(5); // FIXME: simplify measuring the memory usage.
49*d11b16e1SNico Weber delete [] t;
50*d11b16e1SNico Weber
51*d11b16e1SNico Weber return 0;
52*d11b16e1SNico Weber }
53