// bench.h 1.59 KB
#include <pthread.h>
#include <stdlib.h>
#include <stddef.h>
#include <unistd.h>
#include <stdio.h>
#include <time.h>

// Thread count for the benchmark; main() sets it from argv[1] (default 2).
int bench_nthread;
// Iteration count; main() sets it from argv[2] (default 100) and divides the
// measured wall time by it when reporting.
int bench_niter;
// Stored with release ordering by one grow_clock_worker thread and loaded with
// acquire ordering by main() once the warm-up thread group has been joined.
int grow_clock_var;
// Barrier the grow_clock_worker threads wait on during warm-up.
// NOTE(review): spelled "glow" while every related name says "grow" — looks
// like a typo, but renaming would touch every user of the symbol.
pthread_barrier_t glow_clock_barrier;

// Benchmark body; main() calls it exactly once between two clock readings.
void bench();  // defined by user
// Starts nth threads, passing each its index as tid to f, and joins them all.
void start_thread_group(int nth, void(*f)(int tid));
// Thread body for the warm-up group started by main().
void grow_clock_worker(int tid);

// Benchmark driver entry point.
//
// Usage: <prog> [nthread [niter]]
//   nthread  stored in bench_nthread (default 2)
//   niter    stored in bench_niter (default 100); must be positive because
//            the elapsed time is divided by it for the report.
//
// Runs a warm-up thread group, then times a single call to the user-supplied
// bench() with CLOCK_MONOTONIC and prints the elapsed nanoseconds divided by
// bench_niter to stderr, followed by "DONE".
//
// Returns 0 on success, 1 if the iteration count is not positive or the
// warm-up barrier cannot be initialized.
int main(int argc, char **argv) {
  bench_nthread = 2;
  if (argc > 1)
    bench_nthread = atoi(argv[1]);
  bench_niter = 100;
  if (argc > 2)
    bench_niter = atoi(argv[2]);
  // atoi yields 0 for non-numeric input; zero or negative counts would make
  // the per-iteration division below undefined or meaningless.
  if (bench_niter <= 0) {
    fprintf(stderr, "iteration count must be positive, got %d\n", bench_niter);
    return 1;
  }

  // Grow thread's clock: clock_size short-lived threads meet at a barrier,
  // one of them does a release store, and this thread acquires it after the
  // join. NOTE(review): presumably this pre-sizes per-thread clock state
  // under a race detector so that cost is excluded from the timing — confirm.
  int clock_size = 10;
  if (argc > 1)
    clock_size = 1000;
  if (pthread_barrier_init(&glow_clock_barrier, 0, clock_size) != 0) {
    // Workers must not wait on a barrier that failed to initialize.
    fprintf(stderr, "pthread_barrier_init failed\n");
    return 1;
  }
  start_thread_group(clock_size, grow_clock_worker);
  pthread_barrier_destroy(&glow_clock_barrier);
  // Only the acquire ordering matters here; the loaded value is unused.
  (void)__atomic_load_n(&grow_clock_var, __ATOMIC_ACQUIRE);

  struct timespec tp0;
  clock_gettime(CLOCK_MONOTONIC, &tp0);
  bench();
  struct timespec tp1;
  clock_gettime(CLOCK_MONOTONIC, &tp1);
  unsigned long long t =
      (tp1.tv_sec * 1000000000ULL + tp1.tv_nsec) -
      (tp0.tv_sec * 1000000000ULL + tp0.tv_nsec);
  fprintf(stderr, "%llu ns/iter\n", t / (unsigned long long)bench_niter);
  fprintf(stderr, "DONE\n");
  return 0;
}

// Per-thread argument record used by start_thread_group.
struct bench_thread_arg {
  void (*fn)(int tid);
  int tid;
};

// Thread entry point with the signature pthread_create requires; forwards to
// the user callback with its thread index.
static void *bench_thread_trampoline(void *p) {
  struct bench_thread_arg *arg = (struct bench_thread_arg *)p;
  arg->fn(arg->tid);
  return NULL;
}

// Runs f(0), f(1), ..., f(nth - 1), each on its own newly created thread, and
// returns once every thread has been joined.
//
//   nth  number of threads to start; values <= 0 start nothing.
//   f    callback executed by each thread with its index as tid.
//
// Aborts the process if memory for the bookkeeping arrays cannot be obtained
// or a thread cannot be created: callers may rely on all nth threads running
// (e.g. to release a barrier), so continuing with fewer could hang.
void start_thread_group(int nth, void(*f)(int tid)) {
  if (nth <= 0)
    return;

  // Casts on malloc keep this header usable from C++ translation units.
  pthread_t *th = (pthread_t *)malloc((size_t)nth * sizeof(*th));
  struct bench_thread_arg *args =
      (struct bench_thread_arg *)malloc((size_t)nth * sizeof(*args));
  if (th == NULL || args == NULL) {
    fprintf(stderr, "start_thread_group: out of memory for %d threads\n", nth);
    abort();
  }

  for (int i = 0; i < nth; i++) {
    // args[i] stays alive until after the joins below, so the thread may
    // read it at any point during its lifetime.
    args[i].fn = f;
    args[i].tid = i;
    if (pthread_create(&th[i], NULL, bench_thread_trampoline, &args[i]) != 0) {
      fprintf(stderr, "start_thread_group: pthread_create failed for thread %d\n", i);
      abort();
    }
  }
  for (int i = 0; i < nth; i++)
    pthread_join(th[i], NULL);

  free(args);
  free(th);
}

// Warm-up thread body: blocks on glow_clock_barrier until all participants
// have arrived. The one thread for which pthread_barrier_wait reports
// PTHREAD_BARRIER_SERIAL_THREAD then stores 0 to grow_clock_var with release
// ordering; every other thread returns immediately. tid is not used.
void grow_clock_worker(int tid) {
  const int is_serial =
      pthread_barrier_wait(&glow_clock_barrier) == PTHREAD_BARRIER_SERIAL_THREAD;
  if (!is_serial)
    return;
  __atomic_store_n(&grow_clock_var, 0, __ATOMIC_RELEASE);
}