File: start_many_threads.cpp

package info (click to toggle)
llvm-toolchain-13 1%3A13.0.1-11
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 1,418,840 kB
  • sloc: cpp: 5,290,826; ansic: 996,570; asm: 544,593; python: 188,212; objc: 72,027; lisp: 30,291; f90: 25,395; sh: 24,898; javascript: 9,780; pascal: 9,398; perl: 7,484; ml: 5,432; awk: 3,523; makefile: 2,913; xml: 953; cs: 573; fortran: 539
file content (52 lines) | stat: -rw-r--r-- 1,517 bytes parent folder | download | duplicates (47)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
// Mini-benchmark for creating a lot of threads.
//
// Some facts:
// a) clang -O1 takes <15ms to start N=500 threads,
//    consuming ~4MB more RAM than N=1.
// b) clang -O1 -ftsan takes ~26s to start N=500 threads,
//    eats 5GB more RAM than N=1 (which is somewhat expected but still a lot)
//    but then it consumes ~4GB of extra memory when the threads shut down!
//        (definitely not in the barrier_wait interceptor)
//    Also, it takes 26s to run with N=500 vs just 1.1s to run with N=1.
#include <assert.h>
#include <errno.h>
#include <limits.h>
#include <pthread.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <unistd.h>

// Barrier shared by main() and every worker thread. main() initializes it
// with a count of n_threads + 1 and both main() and Thread() wait on it.
pthread_barrier_t all_threads_ready;

// Worker thread body: waits on the all_threads_ready barrier and then
// finishes.
//
// unused: start argument handed over by pthread_create; never read.
// Returns a null pointer as the thread's exit value.
void *Thread(void *unused) {
  (void)unused;  // Only present to match the pthread start-routine signature.
  pthread_barrier_wait(&all_threads_ready);
  return NULL;
}

// Parses `text` as a decimal thread count in the range [0, INT_MAX - 1].
// On success stores the value in *count and returns true. Returns false and
// leaves *count untouched for empty, non-numeric, negative or out-of-range
// input.
static bool ParseThreadCount(const char *text, int *count) {
  errno = 0;
  char *end = NULL;
  const long value = strtol(text, &end, 10);
  if (end == text || *end != '\0' || errno == ERANGE) {
    return false;
  }
  // The barrier is created with count + 1, so INT_MAX itself is rejected to
  // keep that addition from overflowing.
  if (value < 0 || value >= INT_MAX) {
    return false;
  }
  *count = (int)value;
  return true;
}

// Entry point of the thread-creation mini-benchmark.
//
// Usage: <program> [n_threads]
//   n_threads  number of worker threads to start; defaults to 100 when no
//              argument is given. Must be a non-negative decimal integer.
//
// Starts n_threads threads running Thread(), meets them at the
// all_threads_ready barrier, joins them and then releases the thread array
// and the barrier.
//
// Returns 0 on success, 1 on a usage error or when the barrier cannot be
// initialized. Aborts when a thread cannot be created: the threads started
// so far are already blocked on the barrier, which would never open.
int main(int argc, char **argv) {
  int n_threads = 100;
  const bool args_ok =
      argc == 1 || (argc == 2 && ParseThreadCount(argv[1], &n_threads));
  if (!args_ok) {
    printf("Usage: %s n_threads\n", argv[0]);
    return 1;
  }
  printf("%s: n_threads=%d\n", __FILE__, n_threads);

  // The barrier is sized for every worker plus the main thread.
  if (pthread_barrier_init(&all_threads_ready, NULL, n_threads + 1) != 0) {
    fprintf(stderr, "pthread_barrier_init failed\n");
    return 1;
  }

  pthread_t *t = new pthread_t[n_threads];
  for (int i = 0; i < n_threads; i++) {
    // Convert through intptr_t so the int -> pointer cast has matching width.
    int status = pthread_create(&t[i], NULL, Thread, (void *)(intptr_t)i);
    if (status != 0) {
      // Checked explicitly (not via assert) so the failure is also caught
      // when NDEBUG is defined.
      fprintf(stderr, "pthread_create failed for thread %d (error %d)\n", i,
              status);
      abort();
    }
  }
  // sleep(5);  // FIXME: simplify measuring the memory usage.
  pthread_barrier_wait(&all_threads_ready);
  for (int i = 0; i < n_threads; i++) {
    pthread_join(t[i], NULL);
  }
  // sleep(5);  // FIXME: simplify measuring the memory usage.
  delete [] t;
  pthread_barrier_destroy(&all_threads_ready);

  return 0;
}