blob: e7f568d1c9f08af8b5559a41be2b6d4f6ddc9862 [file] [log] [blame]
/* Copyright (c) 2010-14 The Regents of the University of California
* Barret Rhoden <brho@cs.berkeley.edu>
* See LICENSE for details.
*
* Basic test for pthreading. Spawns a bunch of threads that yield.
*
* To build on linux, cd into tests and run:
* $ gcc -O2 -std=gnu99 -fno-stack-protector -g pthread_test.c -lpthread
*
* Make sure you run it with taskset to fix the number of vcores/cpus. */
#define _GNU_SOURCE /* for pth_yield on linux */
#include <stdio.h>
#include <pthread.h>
#include <stdlib.h>
#include <unistd.h>
#include <sys/time.h>
#include "misc-compat.h" /* OS dependent #incs */
/* These are here just to have the compiler test the _INITIALIZERS */
pthread_cond_t dummy_cond = PTHREAD_COND_INITIALIZER;
pthread_mutex_t dummy_mutex = PTHREAD_MUTEX_INITIALIZER;
pthread_mutex_t lock = PTHREAD_MUTEX_INITIALIZER;
#define printf_safe(...) {}
//#define printf_safe(...) \
pthread_mutex_lock(&lock); \
printf(__VA_ARGS__); \
pthread_mutex_unlock(&lock);
#define MAX_NR_TEST_THREADS 100000
int nr_yield_threads = 100;
int nr_yield_loops = 100;
int nr_vcores = 0;
int amt_fake_work = 0;
pthread_t my_threads[MAX_NR_TEST_THREADS];
void *my_retvals[MAX_NR_TEST_THREADS];
pthread_barrier_t barrier;
void *yield_thread(void* arg)
{
/* Wait til all threads are created */
pthread_barrier_wait(&barrier);
for (int i = 0; i < nr_yield_loops; i++) {
printf_safe("[A] pthread %d %p on vcore %d, itr: %d\n",
pthread_id(), pthread_self(), vcore_id(), i);
/* Fakes some work by spinning a bit. Amount varies per
* uth/vcore, scaled by fake_work */
if (amt_fake_work)
udelay(amt_fake_work * (pthread_id() * (vcore_id() +
2)));
pthread_yield();
printf_safe("[A] pthread %p returned from yield on vcore %d, itr: %d\n",
pthread_self(), vcore_id(), i);
}
return (void*)(pthread_self());
}
int main(int argc, char** argv)
{
struct timeval start_tv = {0};
struct timeval end_tv = {0};
long usec_diff;
long nr_ctx_switches;
if (argc > 1)
nr_yield_threads = strtol(argv[1], 0, 10);
if (argc > 2)
nr_yield_loops = strtol(argv[2], 0, 10);
if (argc > 3)
nr_vcores = strtol(argv[3], 0, 10);
if (argc > 4)
amt_fake_work = strtol(argv[4], 0, 10);
nr_yield_threads = MIN(nr_yield_threads, MAX_NR_TEST_THREADS);
printf("Making %d threads of %d loops each, on %d vcore(s), %d work\n",
nr_yield_threads, nr_yield_loops, nr_vcores, amt_fake_work);
/* OS dependent prep work */
#ifdef __ros__
if (nr_vcores) {
/* Only do the vcore trickery if requested */
parlib_never_yield = TRUE;
pthread_need_tls(FALSE);
pthread_mcp_init(); /* gives us one vcore */
vcore_request_total(nr_vcores);
parlib_never_vc_request = TRUE;
for (int i = 0; i < nr_vcores; i++) {
printf_safe("Vcore %d mapped to pcore %d\n", i,
__procinfo.vcoremap[i].pcoreid);
}
}
struct uth_join_request *join_reqs;
join_reqs = malloc(nr_yield_threads * sizeof(struct uth_join_request));
for (int i = 0; i < nr_yield_threads; i++)
join_reqs[i].retval_loc = &my_retvals[i];
assert(join_reqs);
#endif /* __ros__ */
pthread_barrier_init(&barrier, NULL, nr_yield_threads);
/* create and join on yield */
for (int i = 0; i < nr_yield_threads; i++) {
printf_safe("[A] About to create thread %d\n", i);
if (pthread_create(&my_threads[i], NULL, &yield_thread, NULL))
perror("pth_create failed");
}
if (gettimeofday(&start_tv, 0))
perror("Start time error...");
/* Akaros supports parallel join */
#ifdef __ros__
for (int i = 0; i < nr_yield_threads; i++)
join_reqs[i].uth = (struct uthread*)my_threads[i];
uthread_join_arr(join_reqs, nr_yield_threads);
#else
for (int i = 0; i < nr_yield_threads; i++) {
printf_safe("[A] About to join on thread %d(%p)\n",
i, my_threads[i]);
pthread_join(my_threads[i], &my_retvals[i]);
printf_safe("[A] Successful join on thread %d (retval: %p)\n",
i, my_retvals[i]);
}
#endif
if (gettimeofday(&end_tv, 0))
perror("End time error...");
nr_ctx_switches = nr_yield_threads * nr_yield_loops;
usec_diff = (end_tv.tv_sec - start_tv.tv_sec) * 1000000 +
(end_tv.tv_usec - start_tv.tv_usec);
printf("Done: %d uthreads, %d loops, %d vcores, %d work\n",
nr_yield_threads, nr_yield_loops, nr_vcores, amt_fake_work);
printf("Nr context switches: %ld\n", nr_ctx_switches);
printf("Time to run: %ld usec\n", usec_diff);
if (nr_vcores == 1)
printf("Context switch latency: %d nsec\n",
(int)(1000LL*usec_diff / nr_ctx_switches));
printf("Context switches / sec: %d\n\n",
(int)(1000000LL*nr_ctx_switches / usec_diff));
}