1 // Mini-benchmark for creating a lot of threads.
4 // a) clang -O1 takes <15ms to start N=500 threads,
5 // consuming ~4MB more RAM than N=1.
6 // b) clang -O1 -ftsan takes ~26s to start N=500 threads,
7 // eats 5GB more RAM than N=1 (which is somewhat expected but still a lot)
8 // but then it consumes ~4GB of extra memory when the threads shut down!
9 // (definitely not in the barrier_wait interceptor)
10 // Also, it takes 26s to run with N=500 vs just 1.1s to run with N=1.
17 pthread_barrier_t all_threads_ready
;
19 void* Thread(void *unused
) {
20 pthread_barrier_wait(&all_threads_ready
);
24 int main(int argc
, char **argv
) {
28 } else if (argc
== 2) {
29 n_threads
= atoi(argv
[1]);
31 printf("Usage: %s n_threads\n", argv
[0]);
34 printf("%s: n_threads=%d\n", __FILE__
, n_threads
);
36 pthread_barrier_init(&all_threads_ready
, NULL
, n_threads
+ 1);
38 pthread_t
*t
= new pthread_t
[n_threads
];
39 for (int i
= 0; i
< n_threads
; i
++) {
40 int status
= pthread_create(&t
[i
], 0, Thread
, (void*)i
);
43 // sleep(5); // FIXME: simplify measuring the memory usage.
44 pthread_barrier_wait(&all_threads_ready
);
45 for (int i
= 0; i
< n_threads
; i
++) {
46 pthread_join(t
[i
], 0);
48 // sleep(5); // FIXME: simplify measuring the memory usage.