X-Git-Url: http://git.liburcu.org/?p=urcu.git;a=blobdiff_plain;f=test_perthreadlock.c;h=5bbe72b1637af9adbaa099cb4c4631a74a3fc50e;hp=a2abb8df714c2e825aa31657032d46523135f6bf;hb=2a7ac59da1436b86d7cb59fb8b5712c7d98c1519;hpb=8b632babd61dd1708c4cf95f1f417469f8f6a528 diff --git a/test_perthreadlock.c b/test_perthreadlock.c index a2abb8d..5bbe72b 100644 --- a/test_perthreadlock.c +++ b/test_perthreadlock.c @@ -35,6 +35,12 @@ #include "arch.h" +/* Make this big enough to include the POWER5+ L3 cacheline size of 256B */ +#define CACHE_LINE_SIZE 4096 + +/* hardcoded number of CPUs */ +#define NR_CPUS 16384 + #if defined(_syscall0) _syscall0(pid_t, gettid) #elif defined(__NR_gettid) @@ -63,21 +69,55 @@ struct test_array { struct per_thread_lock { pthread_mutex_t lock; -} __attribute__((aligned(128))); /* cache-line aligned */ +} __attribute__((aligned(CACHE_LINE_SIZE))); /* cache-line aligned */ static struct per_thread_lock *per_thread_lock; static volatile int test_go, test_stop; -static int wdelay; +static unsigned long wdelay; static volatile struct test_array test_array = { 8 }; static unsigned long duration; -/* read-side C.S. duration, in us */ +/* read-side C.S. duration, in loops */ static unsigned long rduration; +static inline void loop_sleep(unsigned long l) +{ + while(l-- != 0) + cpu_relax(); +} + +static int verbose_mode; + +#define printf_verbose(fmt, args...) \ + do { \ + if (verbose_mode) \ + printf(fmt, args); \ + } while (0) + +static unsigned int cpu_affinities[NR_CPUS]; +static unsigned int next_aff = 0; +static int use_affinity = 0; + +static void set_affinity(void) +{ + cpu_set_t mask; + int cpu; + + if (!use_affinity) + return; + + cpu = cpu_affinities[next_aff++]; + CPU_ZERO(&mask); + CPU_SET(cpu, &mask); + sched_setaffinity(0, sizeof(mask), &mask); +} + + + /* * returns 0 if test should end. */ @@ -94,8 +134,10 @@ static int test_duration_read(void) static unsigned long long __thread nr_writes; static unsigned long long __thread nr_reads; -static unsigned long long __attribute__((aligned(128))) *tot_nr_writes; -static unsigned long long __attribute__((aligned(128))) *tot_nr_reads; +static +unsigned long long __attribute__((aligned(CACHE_LINE_SIZE))) *tot_nr_writes; +static +unsigned long long __attribute__((aligned(CACHE_LINE_SIZE))) *tot_nr_reads; static unsigned int nr_readers; static unsigned int nr_writers; @@ -127,9 +169,11 @@ void *thr_reader(void *data) { unsigned long tidx = (unsigned long)data; - printf("thread_begin %s, thread id : %lx, tid %lu\n", + printf_verbose("thread_begin %s, thread id : %lx, tid %lu\n", "reader", pthread_self(), (unsigned long)gettid()); + set_affinity(); + while (!test_go) { } @@ -138,7 +182,7 @@ void *thr_reader(void *data) pthread_mutex_lock(&per_thread_lock[tidx].lock); assert(test_array.a == 8); if (unlikely(rduration)) - usleep(rduration); + loop_sleep(rduration); pthread_mutex_unlock(&per_thread_lock[tidx].lock); nr_reads++; if (unlikely(!test_duration_read())) @@ -146,7 +190,7 @@ void *thr_reader(void *data) } tot_nr_reads[tidx] = nr_reads; - printf("thread_end %s, thread id : %lx, tid %lu\n", + printf_verbose("thread_end %s, thread id : %lx, tid %lu\n", "reader", pthread_self(), (unsigned long)gettid()); return ((void*)1); @@ -157,9 +201,11 @@ void *thr_writer(void *data) unsigned long wtidx = (unsigned long)data; long tidx; - printf("thread_begin %s, thread id : %lx, tid %lu\n", + printf_verbose("thread_begin %s, thread id : %lx, tid %lu\n", "writer", pthread_self(), (unsigned long)gettid()); + set_affinity(); + while (!test_go) { } @@ -171,17 +217,17 @@ void *thr_writer(void *data) } test_array.a = 0; test_array.a = 8; - for (tidx = nr_readers - 1; tidx >= 0; tidx--) { + for (tidx = (long)nr_readers - 1; tidx >= 0; tidx--) { pthread_mutex_unlock(&per_thread_lock[tidx].lock); } nr_writes++; if (unlikely(!test_duration_write())) break; if (unlikely(wdelay)) - usleep(wdelay); + loop_sleep(wdelay); } - printf("thread_end %s, thread id : %lx, tid %lu\n", + printf_verbose("thread_end %s, thread id : %lx, tid %lu\n", "writer", pthread_self(), (unsigned long)gettid()); tot_nr_writes[wtidx] = nr_writes; return ((void*)2); @@ -194,13 +240,12 @@ void show_usage(int argc, char **argv) printf(" [-r] [-w] (yield reader and/or writer)"); #endif printf(" [-d delay] (writer period (us))"); - printf(" [-c duration] (reader C.S. duration (us))"); + printf(" [-c duration] (reader C.S. duration (in loops))"); + printf(" [-v] (verbose output)"); printf(" [-a cpu#] [-a cpu#]... (affinity)"); printf("\n"); } -cpu_set_t affinity; - int main(int argc, char **argv) { int err; @@ -209,7 +254,6 @@ int main(int argc, char **argv) unsigned long long *count_reader, *count_writer; unsigned long long tot_reads = 0, tot_writes = 0; int i, a; - int use_affinity = 0; if (argc < 4) { show_usage(argc, argv); @@ -235,8 +279,6 @@ int main(int argc, char **argv) return -1; } - CPU_ZERO(&affinity); - for (i = 4; i < argc; i++) { if (argv[i][0] != '-') continue; @@ -255,39 +297,37 @@ int main(int argc, char **argv) return -1; } a = atoi(argv[++i]); - CPU_SET(a, &affinity); + cpu_affinities[next_aff++] = a; use_affinity = 1; - printf("Adding CPU %d affinity\n", a); + printf_verbose("Adding CPU %d affinity\n", a); break; case 'c': if (argc < i + 2) { show_usage(argc, argv); return -1; } - rduration = atoi(argv[++i]); + rduration = atol(argv[++i]); break; case 'd': if (argc < i + 2) { show_usage(argc, argv); return -1; } - wdelay = atoi(argv[++i]); + wdelay = atol(argv[++i]); + break; + case 'v': + verbose_mode = 1; break; } } - printf("running test for %lu seconds, %u readers, %u writers.\n", + printf_verbose("running test for %lu seconds, %u readers, %u writers.\n", duration, nr_readers, nr_writers); - printf("Writer delay : %u us.\n", wdelay); - printf("thread %-6s, thread id : %lx, tid %lu\n", + printf_verbose("Writer delay : %lu loops.\n", wdelay); + printf_verbose("Reader duration : %lu loops.\n", rduration); + printf_verbose("thread %-6s, thread id : %lx, tid %lu\n", "main", pthread_self(), (unsigned long)gettid()); - if (use_affinity - && sched_setaffinity(0, sizeof(affinity), &affinity) < 0) { - perror("sched_setaffinity"); - exit(-1); - } - tid_reader = malloc(sizeof(*tid_reader) * nr_readers); tid_writer = malloc(sizeof(*tid_writer) * nr_writers); count_reader = malloc(sizeof(*count_reader) * nr_readers); @@ -296,6 +336,8 @@ int main(int argc, char **argv) tot_nr_writes = malloc(sizeof(*tot_nr_writes) * nr_writers); per_thread_lock = malloc(sizeof(*per_thread_lock) * nr_readers); + next_aff = 0; + for (i = 0; i < nr_readers; i++) { err = pthread_create(&tid_reader[i], NULL, thr_reader, (void *)(long)i); @@ -329,9 +371,16 @@ int main(int argc, char **argv) exit(1); tot_writes += tot_nr_writes[i]; } - - printf("total number of reads : %llu, writes %llu\n", tot_reads, + + printf_verbose("total number of reads : %llu, writes %llu\n", tot_reads, tot_writes); + printf("SUMMARY %-25s testdur %4lu nr_readers %3u rdur %6lu " + "nr_writers %3u " + "wdelay %6lu nr_reads %12llu nr_writes %12llu nr_ops %12llu\n", + argv[0], duration, nr_readers, rduration, + nr_writers, wdelay, tot_reads, tot_writes, + tot_reads + tot_writes); + free(tid_reader); free(tid_writer); free(count_reader);