summaryrefslogtreecommitdiffstats
path: root/benchmarks
diff options
context:
space:
mode:
authorMark Salyzyn <salyzyn@google.com>2015-02-10 08:34:35 -0800
committerMark Salyzyn <salyzyn@google.com>2015-02-12 09:43:58 -0800
commit5d064464f139cc0b5fed57e3c439d441ad946fe9 (patch)
tree829ce81f18288c5ee0c85df128e727073bdbae75 /benchmarks
parent0046c39f9ed6d7335f06e4d866df5ae0e7b4d485 (diff)
downloadbionic-5d064464f139cc0b5fed57e3c439d441ad946fe9.zip
bionic-5d064464f139cc0b5fed57e3c439d441ad946fe9.tar.gz
bionic-5d064464f139cc0b5fed57e3c439d441ad946fe9.tar.bz2
bionic: benchmarks: Add BM_semaphore_sem_post_sem_wait
This test reports the overhead of sem_post to sem_wake for a low thread count and a high thread count. Change-Id: Ic30dcc8a78d754979117446bf3a28b7575cabac7
Diffstat (limited to 'benchmarks')
-rw-r--r--benchmarks/semaphore_benchmark.cpp98
1 files changed, 98 insertions, 0 deletions
diff --git a/benchmarks/semaphore_benchmark.cpp b/benchmarks/semaphore_benchmark.cpp
index f383da4..974b046 100644
--- a/benchmarks/semaphore_benchmark.cpp
+++ b/benchmarks/semaphore_benchmark.cpp
@@ -100,6 +100,9 @@ static void BM_semaphore_sem_post(int iters) {
pthread_attr_setschedparam(&attr, &param);
pthread_attr_setschedpolicy(&attr, SCHED_OTHER);
pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_DETACHED);
+#ifdef PTHREAD_SET_INHERIT_SCHED
+ pthread_attr_setinheritsched(&attr, PTHREAD_EXPLICIT_SCHED);
+#endif
pthread_t pthread;
pthread_create(&pthread, &attr, BM_semaphore_sem_post_start_thread, &semaphore);
pthread_attr_destroy(&attr);
@@ -141,3 +144,98 @@ static void BM_semaphore_sem_post(int iters) {
} while (!BM_semaphore_sem_post_running);
}
BENCHMARK(BM_semaphore_sem_post);
+
+/*
+ * This test reports the overhead of sem_post to sem_wake. A circle of
+ * num_semaphore - 1 threads are run on a set of semaphores to measure the
+ * activity. One can calculate the sem_wake overhead alone by:
+ *
+ * BM_semaphore_sem_post_sem_wait - BM_semaphore_sem_post - BM_time_clock_gettime
+ *
+ * Differences will result if there are more threads than active processors,
+ * there will be delay induced when scheduling the processes. This cost is
+ * measured by trying different values of num_semaphore. The governor selected
+ * will have a major impact on the results for a large number of threads.
+ *
+ * To reduce the chances for threads racing ahead and not triggering the
+ * futex, for example the background threads finish their job before the
+ * sem_wait is hit in the main thread, the background threads will run at
+ * batch priority and the main thread at fifo priority. This should generally
+ * guarantee the main thread completes its task of priming itself with the
+ * sem_wait before the other threads can start. In practice without the
+ * sched mechanics here, this works on Android configured kernels, this is
+ * insurance for wacky(tm) sched configurations.
+ */
+static void *BM_semaphore_sem_post_sem_wait_start_thread(void *obj) {
+ sem_t *semaphore = reinterpret_cast<sem_t *>(obj);
+
+ while ((BM_semaphore_sem_post_running > 0) && !sem_wait(semaphore)) {
+ sem_post(semaphore + 1);
+ }
+ --BM_semaphore_sem_post_running;
+ return NULL;
+}
+
+static void BM_semaphore_sem_post_sem_wait_num(int iters, int num_semaphore) {
+ StopBenchmarkTiming();
+
+ sem_t semaphore[num_semaphore];
+
+ for (int i = 0; i < num_semaphore; ++i) {
+ sem_init(semaphore + i, 0, 0);
+ }
+
+ pthread_attr_t attr;
+ pthread_attr_init(&attr);
+ BM_semaphore_sem_post_running = 1;
+ struct sched_param param = { 0, };
+ pthread_attr_setschedparam(&attr, &param);
+ pthread_attr_setschedpolicy(&attr, SCHED_BATCH);
+ pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_DETACHED);
+#ifdef PTHREAD_SET_INHERIT_SCHED
+ pthread_attr_setinheritsched(&attr, PTHREAD_EXPLICIT_SCHED);
+#endif
+ for (int i = 0; i < (num_semaphore - 1); ++i) {
+ pthread_t pthread;
+ pthread_create(&pthread, &attr, BM_semaphore_sem_post_sem_wait_start_thread, semaphore + i);
+ }
+ pthread_attr_destroy(&attr);
+ sched_yield();
+
+ param.sched_priority = 1;
+ sched_setscheduler((pid_t)0, SCHED_FIFO, &param);
+
+ StartBenchmarkTiming();
+
+ for (int i = 0; i < iters; i += num_semaphore) {
+ sem_post(semaphore);
+ sem_wait(semaphore + num_semaphore - 1);
+ }
+
+ StopBenchmarkTiming();
+
+ param.sched_priority = 0;
+ sched_setscheduler((pid_t)0, SCHED_OTHER, &param);
+
+ if (BM_semaphore_sem_post_running > 0) {
+ BM_semaphore_sem_post_running = 0;
+ }
+ for (int i = 0;
+ (i < (10 * num_semaphore)) && (BM_semaphore_sem_post_running > (1 - num_semaphore));
+ ++i) {
+ for (int j = 0; j < (num_semaphore - 1); ++j) {
+ sem_post(semaphore + j);
+ }
+ sched_yield();
+ }
+}
+
+static void BM_semaphore_sem_post_sem_wait_low(int iters) {
+ BM_semaphore_sem_post_sem_wait_num(iters, 2);
+}
+BENCHMARK(BM_semaphore_sem_post_sem_wait_low);
+
+static void BM_semaphore_sem_post_sem_wait_high(int iters) {
+ BM_semaphore_sem_post_sem_wait_num(iters, 100);
+}
+BENCHMARK(BM_semaphore_sem_post_sem_wait_high);