diff options
author | Mark Salyzyn <salyzyn@google.com> | 2015-02-10 08:34:35 -0800 |
---|---|---|
committer | Mark Salyzyn <salyzyn@google.com> | 2015-02-12 09:43:58 -0800 |
commit | 5d064464f139cc0b5fed57e3c439d441ad946fe9 (patch) | |
tree | 829ce81f18288c5ee0c85df128e727073bdbae75 /benchmarks | |
parent | 0046c39f9ed6d7335f06e4d866df5ae0e7b4d485 (diff) | |
download | bionic-5d064464f139cc0b5fed57e3c439d441ad946fe9.zip bionic-5d064464f139cc0b5fed57e3c439d441ad946fe9.tar.gz bionic-5d064464f139cc0b5fed57e3c439d441ad946fe9.tar.bz2 |
bionic: benchmarks: Add BM_semaphore_sem_post_sem_wait
This test reports the overhead of sem_post to sem_wake for a low thread count
and a high thread count.
Change-Id: Ic30dcc8a78d754979117446bf3a28b7575cabac7
Diffstat (limited to 'benchmarks')
-rw-r--r-- | benchmarks/semaphore_benchmark.cpp | 98 |
1 files changed, 98 insertions, 0 deletions
diff --git a/benchmarks/semaphore_benchmark.cpp b/benchmarks/semaphore_benchmark.cpp index f383da4..974b046 100644 --- a/benchmarks/semaphore_benchmark.cpp +++ b/benchmarks/semaphore_benchmark.cpp @@ -100,6 +100,9 @@ static void BM_semaphore_sem_post(int iters) { pthread_attr_setschedparam(&attr, &param); pthread_attr_setschedpolicy(&attr, SCHED_OTHER); pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_DETACHED); +#ifdef PTHREAD_SET_INHERIT_SCHED + pthread_attr_setinheritsched(&attr, PTHREAD_EXPLICIT_SCHED); +#endif pthread_t pthread; pthread_create(&pthread, &attr, BM_semaphore_sem_post_start_thread, &semaphore); pthread_attr_destroy(&attr); @@ -141,3 +144,98 @@ static void BM_semaphore_sem_post(int iters) { } while (!BM_semaphore_sem_post_running); } BENCHMARK(BM_semaphore_sem_post); + +/* + * This test reports the overhead of sem_post to sem_wake. A circle of + * num_semaphore - 1 threads are run on a set of semaphores to measure the + * activity. One can calculate the sem_wake overhead alone by: + * + * BM_semaphore_sem_post_sem_wait - BM_semaphore_sem_post - BM_time_clock_gettime + * + * Differences will result if there are more threads than active processors, + * there will be delay induced when scheduling the processes. This cost is + * measured by trying different values of num_semaphore. The governor selected + * will have a major impact on the results for a large number of threads. + * + * To reduce the chances for threads racing ahead and not triggering the + * futex, for example the background threads finish their job before the + * sem_wait is hit in the main thread, the background threads will run at + * batch priority and the main thread at fifo priority. This should generally + * guarantee the main thread completes its task of priming itself with the + * sem_wait before the other threads can start. In practice without the + * sched mechanics here, this works on Android configured kernels, this is + * insurance for wacky(tm) sched configurations. 
+ */ +static void *BM_semaphore_sem_post_sem_wait_start_thread(void *obj) { + sem_t *semaphore = reinterpret_cast<sem_t *>(obj); + + while ((BM_semaphore_sem_post_running > 0) && !sem_wait(semaphore)) { + sem_post(semaphore + 1); + } + --BM_semaphore_sem_post_running; + return NULL; +} + +static void BM_semaphore_sem_post_sem_wait_num(int iters, int num_semaphore) { + StopBenchmarkTiming(); + + sem_t semaphore[num_semaphore]; + + for (int i = 0; i < num_semaphore; ++i) { + sem_init(semaphore + i, 0, 0); + } + + pthread_attr_t attr; + pthread_attr_init(&attr); + BM_semaphore_sem_post_running = 1; + struct sched_param param = { 0, }; + pthread_attr_setschedparam(&attr, &param); + pthread_attr_setschedpolicy(&attr, SCHED_BATCH); + pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_DETACHED); +#ifdef PTHREAD_SET_INHERIT_SCHED + pthread_attr_setinheritsched(&attr, PTHREAD_EXPLICIT_SCHED); +#endif + for (int i = 0; i < (num_semaphore - 1); ++i) { + pthread_t pthread; + pthread_create(&pthread, &attr, BM_semaphore_sem_post_sem_wait_start_thread, semaphore + i); + } + pthread_attr_destroy(&attr); + sched_yield(); + + param.sched_priority = 1; + sched_setscheduler((pid_t)0, SCHED_FIFO, &param); + + StartBenchmarkTiming(); + + for (int i = 0; i < iters; i += num_semaphore) { + sem_post(semaphore); + sem_wait(semaphore + num_semaphore - 1); + } + + StopBenchmarkTiming(); + + param.sched_priority = 0; + sched_setscheduler((pid_t)0, SCHED_OTHER, &param); + + if (BM_semaphore_sem_post_running > 0) { + BM_semaphore_sem_post_running = 0; + } + for (int i = 0; + (i < (10 * num_semaphore)) && (BM_semaphore_sem_post_running > (1 - num_semaphore)); + ++i) { + for (int j = 0; j < (num_semaphore - 1); ++j) { + sem_post(semaphore + j); + } + sched_yield(); + } +} + +static void BM_semaphore_sem_post_sem_wait_low(int iters) { + BM_semaphore_sem_post_sem_wait_num(iters, 2); +} +BENCHMARK(BM_semaphore_sem_post_sem_wait_low); + +static void BM_semaphore_sem_post_sem_wait_high(int iters) { + 
BM_semaphore_sem_post_sem_wait_num(iters, 100); +} +BENCHMARK(BM_semaphore_sem_post_sem_wait_high); |