// Source: fork of OSchip/llvm-project (60 lines, 1.6 KiB, C).
#include <pthread.h>
|
|
#include <stdlib.h>
|
|
#include <stddef.h>
|
|
#include <unistd.h>
|
|
#include <stdio.h>
|
|
#include <time.h>
|
|
|
|
// Shared state and forward declarations for the benchmark harness.

// Thread count for the benchmark; main() sets it from argv[1] (default 2).
int bench_nthread;
// Iteration count; main() sets it from argv[2] (default 100) and divides the
// measured time by it when printing the result.
int bench_niter;
// Written with a release store by one grow_clock_worker() thread and read
// with an acquire load by main() once the warm-up thread group has finished.
int grow_clock_var;
// Barrier on which all grow_clock_worker() threads rendezvous.
// NOTE(review): "glow" looks like a typo for "grow"; the spelling is kept
// because main() and grow_clock_worker() refer to this exact name.
pthread_barrier_t glow_clock_barrier;

// Benchmark body, defined by the user of this file. main() calls it exactly
// once, between the two clock readings. Declared with (void) so that it is a
// real prototype in C as well as in C++.
void bench(void);
// Starts nth threads, each running f(tid) with tid in [0, nth), and joins
// all of them before returning.
void start_thread_group(int nth, void(*f)(int tid));
// Thread body that main() passes to start_thread_group() for the warm-up
// thread group.
void grow_clock_worker(int tid);
|
|
|
|
int main(int argc, char **argv) {
|
|
bench_nthread = 2;
|
|
if (argc > 1)
|
|
bench_nthread = atoi(argv[1]);
|
|
bench_niter = 100;
|
|
if (argc > 2)
|
|
bench_niter = atoi(argv[2]);
|
|
|
|
// Grow thread's clock.
|
|
int clock_size = 10;
|
|
if (argc > 1)
|
|
clock_size = 1000;
|
|
pthread_barrier_init(&glow_clock_barrier, 0, clock_size);
|
|
start_thread_group(clock_size, grow_clock_worker);
|
|
pthread_barrier_destroy(&glow_clock_barrier);
|
|
__atomic_load_n(&grow_clock_var, __ATOMIC_ACQUIRE);
|
|
|
|
timespec tp0;
|
|
clock_gettime(CLOCK_MONOTONIC, &tp0);
|
|
bench();
|
|
timespec tp1;
|
|
clock_gettime(CLOCK_MONOTONIC, &tp1);
|
|
unsigned long long t =
|
|
(tp1.tv_sec * 1000000000ULL + tp1.tv_nsec) -
|
|
(tp0.tv_sec * 1000000000ULL + tp0.tv_nsec);
|
|
fprintf(stderr, "%llu ns/iter\n", t / bench_niter);
|
|
fprintf(stderr, "DONE\n");
|
|
}
|
|
|
|
// Per-thread argument record: the user callback and the id to pass to it.
struct bench_thread_arg {
  void (*fn)(int tid);
  int tid;
};

// pthread entry point with the signature pthread_create() requires; it
// unpacks the record and calls the user callback with its own type, so the
// callback is never invoked through an incompatible function-pointer type.
static void *bench_thread_trampoline(void *p) {
  struct bench_thread_arg *arg = (struct bench_thread_arg *)p;
  arg->fn(arg->tid);
  return NULL;
}

// Runs f(tid) on nth concurrently started threads, with tid = 0 .. nth-1,
// and returns once every thread has been joined.
//
// nth  number of threads to start; values <= 0 start nothing.
// f    callback executed by each thread.
//
// Allocation or thread-creation failure is fatal: a message is printed to
// stderr and the process exits with status 1. Continuing with a partial
// group is not attempted because callbacks may wait for all nth peers.
void start_thread_group(int nth, void(*f)(int tid)) {
  if (nth <= 0)
    return;

  // The casts on malloc() keep this compilable as C++ as well as C.
  pthread_t *th = (pthread_t *)malloc((size_t)nth * sizeof(*th));
  struct bench_thread_arg *args =
      (struct bench_thread_arg *)malloc((size_t)nth * sizeof(*args));
  if (th == NULL || args == NULL) {
    fprintf(stderr, "start_thread_group: out of memory\n");
    free(th);
    free(args);
    exit(1);
  }

  for (int i = 0; i < nth; i++) {
    args[i].fn = f;
    args[i].tid = i;
    if (pthread_create(&th[i], NULL, bench_thread_trampoline, &args[i]) != 0) {
      fprintf(stderr, "start_thread_group: pthread_create failed\n");
      exit(1);
    }
  }
  for (int i = 0; i < nth; i++)
    pthread_join(th[i], NULL);

  // All threads have finished, so nothing references these arrays any more.
  free(args);
  free(th);
}
|
|
|
|
void grow_clock_worker(int tid) {
|
|
int res = pthread_barrier_wait(&glow_clock_barrier);
|
|
if (res == PTHREAD_BARRIER_SERIAL_THREAD)
|
|
__atomic_store_n(&grow_clock_var, 0, __ATOMIC_RELEASE);
|
|
}
|
|
|