xref: /aosp_15_r20/external/abseil-cpp/absl/synchronization/mutex_benchmark.cc (revision 9356374a3709195abf420251b3e825997ff56c0f)
1*9356374aSAndroid Build Coastguard Worker // Copyright 2017 The Abseil Authors.
2*9356374aSAndroid Build Coastguard Worker //
3*9356374aSAndroid Build Coastguard Worker // Licensed under the Apache License, Version 2.0 (the "License");
4*9356374aSAndroid Build Coastguard Worker // you may not use this file except in compliance with the License.
5*9356374aSAndroid Build Coastguard Worker // You may obtain a copy of the License at
6*9356374aSAndroid Build Coastguard Worker //
7*9356374aSAndroid Build Coastguard Worker //      https://www.apache.org/licenses/LICENSE-2.0
8*9356374aSAndroid Build Coastguard Worker //
9*9356374aSAndroid Build Coastguard Worker // Unless required by applicable law or agreed to in writing, software
10*9356374aSAndroid Build Coastguard Worker // distributed under the License is distributed on an "AS IS" BASIS,
11*9356374aSAndroid Build Coastguard Worker // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12*9356374aSAndroid Build Coastguard Worker // See the License for the specific language governing permissions and
13*9356374aSAndroid Build Coastguard Worker // limitations under the License.
14*9356374aSAndroid Build Coastguard Worker 
#include <atomic>
#include <cstdint>
#include <limits>
#include <mutex>  // NOLINT(build/c++11)
#include <vector>

#include "absl/base/config.h"
#include "absl/base/internal/cycleclock.h"
#include "absl/base/internal/spinlock.h"
#include "absl/base/no_destructor.h"
#include "absl/synchronization/blocking_counter.h"
#include "absl/synchronization/internal/thread_pool.h"
#include "absl/synchronization/mutex.h"
#include "benchmark/benchmark.h"
27*9356374aSAndroid Build Coastguard Worker 
28*9356374aSAndroid Build Coastguard Worker namespace {
29*9356374aSAndroid Build Coastguard Worker 
BM_Mutex(benchmark::State & state)30*9356374aSAndroid Build Coastguard Worker void BM_Mutex(benchmark::State& state) {
31*9356374aSAndroid Build Coastguard Worker   static absl::NoDestructor<absl::Mutex> mu;
32*9356374aSAndroid Build Coastguard Worker   for (auto _ : state) {
33*9356374aSAndroid Build Coastguard Worker     absl::MutexLock lock(mu.get());
34*9356374aSAndroid Build Coastguard Worker   }
35*9356374aSAndroid Build Coastguard Worker }
36*9356374aSAndroid Build Coastguard Worker BENCHMARK(BM_Mutex)->UseRealTime()->Threads(1)->ThreadPerCpu();
37*9356374aSAndroid Build Coastguard Worker 
BM_ReaderLock(benchmark::State & state)38*9356374aSAndroid Build Coastguard Worker void BM_ReaderLock(benchmark::State& state) {
39*9356374aSAndroid Build Coastguard Worker   static absl::NoDestructor<absl::Mutex> mu;
40*9356374aSAndroid Build Coastguard Worker   for (auto _ : state) {
41*9356374aSAndroid Build Coastguard Worker     absl::ReaderMutexLock lock(mu.get());
42*9356374aSAndroid Build Coastguard Worker   }
43*9356374aSAndroid Build Coastguard Worker }
44*9356374aSAndroid Build Coastguard Worker BENCHMARK(BM_ReaderLock)->UseRealTime()->Threads(1)->ThreadPerCpu();
45*9356374aSAndroid Build Coastguard Worker 
BM_TryLock(benchmark::State & state)46*9356374aSAndroid Build Coastguard Worker void BM_TryLock(benchmark::State& state) {
47*9356374aSAndroid Build Coastguard Worker   absl::Mutex mu;
48*9356374aSAndroid Build Coastguard Worker   for (auto _ : state) {
49*9356374aSAndroid Build Coastguard Worker     if (mu.TryLock()) {
50*9356374aSAndroid Build Coastguard Worker       mu.Unlock();
51*9356374aSAndroid Build Coastguard Worker     }
52*9356374aSAndroid Build Coastguard Worker   }
53*9356374aSAndroid Build Coastguard Worker }
54*9356374aSAndroid Build Coastguard Worker BENCHMARK(BM_TryLock);
55*9356374aSAndroid Build Coastguard Worker 
BM_ReaderTryLock(benchmark::State & state)56*9356374aSAndroid Build Coastguard Worker void BM_ReaderTryLock(benchmark::State& state) {
57*9356374aSAndroid Build Coastguard Worker   static absl::NoDestructor<absl::Mutex> mu;
58*9356374aSAndroid Build Coastguard Worker   for (auto _ : state) {
59*9356374aSAndroid Build Coastguard Worker     if (mu->ReaderTryLock()) {
60*9356374aSAndroid Build Coastguard Worker       mu->ReaderUnlock();
61*9356374aSAndroid Build Coastguard Worker     }
62*9356374aSAndroid Build Coastguard Worker   }
63*9356374aSAndroid Build Coastguard Worker }
64*9356374aSAndroid Build Coastguard Worker BENCHMARK(BM_ReaderTryLock)->UseRealTime()->Threads(1)->ThreadPerCpu();
65*9356374aSAndroid Build Coastguard Worker 
DelayNs(int64_t ns,int * data)66*9356374aSAndroid Build Coastguard Worker static void DelayNs(int64_t ns, int* data) {
67*9356374aSAndroid Build Coastguard Worker   int64_t end = absl::base_internal::CycleClock::Now() +
68*9356374aSAndroid Build Coastguard Worker                 ns * absl::base_internal::CycleClock::Frequency() / 1e9;
69*9356374aSAndroid Build Coastguard Worker   while (absl::base_internal::CycleClock::Now() < end) {
70*9356374aSAndroid Build Coastguard Worker     ++(*data);
71*9356374aSAndroid Build Coastguard Worker     benchmark::DoNotOptimize(*data);
72*9356374aSAndroid Build Coastguard Worker   }
73*9356374aSAndroid Build Coastguard Worker }
74*9356374aSAndroid Build Coastguard Worker 
// Scoped lock guard used by the contended benchmarks so that the same
// benchmark body works with any mutex type.
//
// The primary template expects `MutexType` to provide `Lock()` and `Unlock()`.
// The mutex is locked in the constructor and unlocked in the destructor; the
// guard only stores the pointer and never owns the mutex.
//
// The guard is non-copyable: a copy would hold the same pointer and unlock the
// mutex a second time when it is destroyed.
template <typename MutexType>
class RaiiLocker {
 public:
  explicit RaiiLocker(MutexType* mu) : mu_(mu) { mu_->Lock(); }
  ~RaiiLocker() { mu_->Unlock(); }

  RaiiLocker(const RaiiLocker&) = delete;
  RaiiLocker& operator=(const RaiiLocker&) = delete;

 private:
  MutexType* mu_;
};

// Specialization for std::mutex, whose member functions are spelled
// `lock()` / `unlock()` rather than `Lock()` / `Unlock()`.
template <>
class RaiiLocker<std::mutex> {
 public:
  explicit RaiiLocker(std::mutex* mu) : mu_(mu) { mu_->lock(); }
  ~RaiiLocker() { mu_->unlock(); }

  RaiiLocker(const RaiiLocker&) = delete;
  RaiiLocker& operator=(const RaiiLocker&) = delete;

 private:
  std::mutex* mu_;
};
92*9356374aSAndroid Build Coastguard Worker 
93*9356374aSAndroid Build Coastguard Worker // RAII object to change the Mutex priority of the running thread.
94*9356374aSAndroid Build Coastguard Worker class ScopedThreadMutexPriority {
95*9356374aSAndroid Build Coastguard Worker  public:
ScopedThreadMutexPriority(int priority)96*9356374aSAndroid Build Coastguard Worker   explicit ScopedThreadMutexPriority(int priority) {
97*9356374aSAndroid Build Coastguard Worker     absl::base_internal::ThreadIdentity* identity =
98*9356374aSAndroid Build Coastguard Worker         absl::synchronization_internal::GetOrCreateCurrentThreadIdentity();
99*9356374aSAndroid Build Coastguard Worker     identity->per_thread_synch.priority = priority;
100*9356374aSAndroid Build Coastguard Worker     // Bump next_priority_read_cycles to the infinite future so that the
101*9356374aSAndroid Build Coastguard Worker     // implementation doesn't re-read the thread's actual scheduler priority
102*9356374aSAndroid Build Coastguard Worker     // and replace our temporary scoped priority.
103*9356374aSAndroid Build Coastguard Worker     identity->per_thread_synch.next_priority_read_cycles =
104*9356374aSAndroid Build Coastguard Worker         std::numeric_limits<int64_t>::max();
105*9356374aSAndroid Build Coastguard Worker   }
~ScopedThreadMutexPriority()106*9356374aSAndroid Build Coastguard Worker   ~ScopedThreadMutexPriority() {
107*9356374aSAndroid Build Coastguard Worker     // Reset the "next priority read time" back to the infinite past so that
108*9356374aSAndroid Build Coastguard Worker     // the next time the Mutex implementation wants to know this thread's
109*9356374aSAndroid Build Coastguard Worker     // priority, it re-reads it from the OS instead of using our overridden
110*9356374aSAndroid Build Coastguard Worker     // priority.
111*9356374aSAndroid Build Coastguard Worker     absl::synchronization_internal::GetOrCreateCurrentThreadIdentity()
112*9356374aSAndroid Build Coastguard Worker         ->per_thread_synch.next_priority_read_cycles =
113*9356374aSAndroid Build Coastguard Worker         std::numeric_limits<int64_t>::min();
114*9356374aSAndroid Build Coastguard Worker   }
115*9356374aSAndroid Build Coastguard Worker };
116*9356374aSAndroid Build Coastguard Worker 
BM_MutexEnqueue(benchmark::State & state)117*9356374aSAndroid Build Coastguard Worker void BM_MutexEnqueue(benchmark::State& state) {
118*9356374aSAndroid Build Coastguard Worker   // In the "multiple priorities" variant of the benchmark, one of the
119*9356374aSAndroid Build Coastguard Worker   // threads runs with Mutex priority 0 while the rest run at elevated priority.
120*9356374aSAndroid Build Coastguard Worker   // This benchmarks the performance impact of the presence of a low priority
121*9356374aSAndroid Build Coastguard Worker   // waiter when a higher priority waiter adds itself of the queue
122*9356374aSAndroid Build Coastguard Worker   // (b/175224064).
123*9356374aSAndroid Build Coastguard Worker   //
124*9356374aSAndroid Build Coastguard Worker   // NOTE: The actual scheduler priority is not modified in this benchmark:
125*9356374aSAndroid Build Coastguard Worker   // all of the threads get CPU slices with the same priority. Only the
126*9356374aSAndroid Build Coastguard Worker   // Mutex queueing behavior is modified.
127*9356374aSAndroid Build Coastguard Worker   const bool multiple_priorities = state.range(0);
128*9356374aSAndroid Build Coastguard Worker   ScopedThreadMutexPriority priority_setter(
129*9356374aSAndroid Build Coastguard Worker       (multiple_priorities && state.thread_index() != 0) ? 1 : 0);
130*9356374aSAndroid Build Coastguard Worker 
131*9356374aSAndroid Build Coastguard Worker   struct Shared {
132*9356374aSAndroid Build Coastguard Worker     absl::Mutex mu;
133*9356374aSAndroid Build Coastguard Worker     std::atomic<int> looping_threads{0};
134*9356374aSAndroid Build Coastguard Worker     std::atomic<int> blocked_threads{0};
135*9356374aSAndroid Build Coastguard Worker     std::atomic<bool> thread_has_mutex{false};
136*9356374aSAndroid Build Coastguard Worker   };
137*9356374aSAndroid Build Coastguard Worker   static absl::NoDestructor<Shared> shared;
138*9356374aSAndroid Build Coastguard Worker 
139*9356374aSAndroid Build Coastguard Worker   // Set up 'blocked_threads' to count how many threads are currently blocked
140*9356374aSAndroid Build Coastguard Worker   // in Abseil synchronization code.
141*9356374aSAndroid Build Coastguard Worker   //
142*9356374aSAndroid Build Coastguard Worker   // NOTE: Blocking done within the Google Benchmark library itself (e.g.
143*9356374aSAndroid Build Coastguard Worker   // the barrier which synchronizes threads entering and exiting the benchmark
144*9356374aSAndroid Build Coastguard Worker   // loop) does _not_ get registered in this counter. This is because Google
145*9356374aSAndroid Build Coastguard Worker   // Benchmark uses its own synchronization primitives based on std::mutex, not
146*9356374aSAndroid Build Coastguard Worker   // Abseil synchronization primitives. If at some point the benchmark library
147*9356374aSAndroid Build Coastguard Worker   // merges into Abseil, this code may break.
148*9356374aSAndroid Build Coastguard Worker   absl::synchronization_internal::PerThreadSem::SetThreadBlockedCounter(
149*9356374aSAndroid Build Coastguard Worker       &shared->blocked_threads);
150*9356374aSAndroid Build Coastguard Worker 
151*9356374aSAndroid Build Coastguard Worker   // The benchmark framework may run several iterations in the same process,
152*9356374aSAndroid Build Coastguard Worker   // reusing the same static-initialized 'shared' object. Given the semantics
153*9356374aSAndroid Build Coastguard Worker   // of the members, here, we expect everything to be reset to zero by the
154*9356374aSAndroid Build Coastguard Worker   // end of any iteration. Assert that's the case, just to be sure.
155*9356374aSAndroid Build Coastguard Worker   ABSL_RAW_CHECK(
156*9356374aSAndroid Build Coastguard Worker       shared->looping_threads.load(std::memory_order_relaxed) == 0 &&
157*9356374aSAndroid Build Coastguard Worker           shared->blocked_threads.load(std::memory_order_relaxed) == 0 &&
158*9356374aSAndroid Build Coastguard Worker           !shared->thread_has_mutex.load(std::memory_order_relaxed),
159*9356374aSAndroid Build Coastguard Worker       "Shared state isn't zeroed at start of benchmark iteration");
160*9356374aSAndroid Build Coastguard Worker 
161*9356374aSAndroid Build Coastguard Worker   static constexpr int kBatchSize = 1000;
162*9356374aSAndroid Build Coastguard Worker   while (state.KeepRunningBatch(kBatchSize)) {
163*9356374aSAndroid Build Coastguard Worker     shared->looping_threads.fetch_add(1);
164*9356374aSAndroid Build Coastguard Worker     for (int i = 0; i < kBatchSize; i++) {
165*9356374aSAndroid Build Coastguard Worker       {
166*9356374aSAndroid Build Coastguard Worker         absl::MutexLock l(&shared->mu);
167*9356374aSAndroid Build Coastguard Worker         shared->thread_has_mutex.store(true, std::memory_order_relaxed);
168*9356374aSAndroid Build Coastguard Worker         // Spin until all other threads are either out of the benchmark loop
169*9356374aSAndroid Build Coastguard Worker         // or blocked on the mutex. This ensures that the mutex queue is kept
170*9356374aSAndroid Build Coastguard Worker         // at its maximal length to benchmark the performance of queueing on
171*9356374aSAndroid Build Coastguard Worker         // a highly contended mutex.
172*9356374aSAndroid Build Coastguard Worker         while (shared->looping_threads.load(std::memory_order_relaxed) -
173*9356374aSAndroid Build Coastguard Worker                    shared->blocked_threads.load(std::memory_order_relaxed) !=
174*9356374aSAndroid Build Coastguard Worker                1) {
175*9356374aSAndroid Build Coastguard Worker         }
176*9356374aSAndroid Build Coastguard Worker         shared->thread_has_mutex.store(false);
177*9356374aSAndroid Build Coastguard Worker       }
178*9356374aSAndroid Build Coastguard Worker       // Spin until some other thread has acquired the mutex before we block
179*9356374aSAndroid Build Coastguard Worker       // again. This ensures that we always go through the slow (queueing)
180*9356374aSAndroid Build Coastguard Worker       // acquisition path rather than reacquiring the mutex we just released.
181*9356374aSAndroid Build Coastguard Worker       while (!shared->thread_has_mutex.load(std::memory_order_relaxed) &&
182*9356374aSAndroid Build Coastguard Worker              shared->looping_threads.load(std::memory_order_relaxed) > 1) {
183*9356374aSAndroid Build Coastguard Worker       }
184*9356374aSAndroid Build Coastguard Worker     }
185*9356374aSAndroid Build Coastguard Worker     // The benchmark framework uses a barrier to ensure that all of the threads
186*9356374aSAndroid Build Coastguard Worker     // complete their benchmark loop together before any of the threads exit
187*9356374aSAndroid Build Coastguard Worker     // the loop. So, we need to remove ourselves from the "looping threads"
188*9356374aSAndroid Build Coastguard Worker     // counter here before potentially blocking on that barrier. Otherwise,
189*9356374aSAndroid Build Coastguard Worker     // another thread spinning above might wait forever for this thread to
190*9356374aSAndroid Build Coastguard Worker     // block on the mutex while we in fact are waiting to exit.
191*9356374aSAndroid Build Coastguard Worker     shared->looping_threads.fetch_add(-1);
192*9356374aSAndroid Build Coastguard Worker   }
193*9356374aSAndroid Build Coastguard Worker   absl::synchronization_internal::PerThreadSem::SetThreadBlockedCounter(
194*9356374aSAndroid Build Coastguard Worker       nullptr);
195*9356374aSAndroid Build Coastguard Worker }
196*9356374aSAndroid Build Coastguard Worker 
197*9356374aSAndroid Build Coastguard Worker BENCHMARK(BM_MutexEnqueue)
198*9356374aSAndroid Build Coastguard Worker     ->Threads(4)
199*9356374aSAndroid Build Coastguard Worker     ->Threads(64)
200*9356374aSAndroid Build Coastguard Worker     ->Threads(128)
201*9356374aSAndroid Build Coastguard Worker     ->Threads(512)
202*9356374aSAndroid Build Coastguard Worker     ->ArgName("multiple_priorities")
203*9356374aSAndroid Build Coastguard Worker     ->Arg(false)
204*9356374aSAndroid Build Coastguard Worker     ->Arg(true);
205*9356374aSAndroid Build Coastguard Worker 
206*9356374aSAndroid Build Coastguard Worker template <typename MutexType>
BM_Contended(benchmark::State & state)207*9356374aSAndroid Build Coastguard Worker void BM_Contended(benchmark::State& state) {
208*9356374aSAndroid Build Coastguard Worker   int priority = state.thread_index() % state.range(1);
209*9356374aSAndroid Build Coastguard Worker   ScopedThreadMutexPriority priority_setter(priority);
210*9356374aSAndroid Build Coastguard Worker 
211*9356374aSAndroid Build Coastguard Worker   struct Shared {
212*9356374aSAndroid Build Coastguard Worker     MutexType mu;
213*9356374aSAndroid Build Coastguard Worker     int data = 0;
214*9356374aSAndroid Build Coastguard Worker   };
215*9356374aSAndroid Build Coastguard Worker   static absl::NoDestructor<Shared> shared;
216*9356374aSAndroid Build Coastguard Worker   int local = 0;
217*9356374aSAndroid Build Coastguard Worker   for (auto _ : state) {
218*9356374aSAndroid Build Coastguard Worker     // Here we model both local work outside of the critical section as well as
219*9356374aSAndroid Build Coastguard Worker     // some work inside of the critical section. The idea is to capture some
220*9356374aSAndroid Build Coastguard Worker     // more or less realisitic contention levels.
221*9356374aSAndroid Build Coastguard Worker     // If contention is too low, the benchmark won't measure anything useful.
222*9356374aSAndroid Build Coastguard Worker     // If contention is unrealistically high, the benchmark will favor
223*9356374aSAndroid Build Coastguard Worker     // bad mutex implementations that block and otherwise distract threads
224*9356374aSAndroid Build Coastguard Worker     // from the mutex and shared state for as much as possible.
225*9356374aSAndroid Build Coastguard Worker     // To achieve this amount of local work is multiplied by number of threads
226*9356374aSAndroid Build Coastguard Worker     // to keep ratio between local work and critical section approximately
227*9356374aSAndroid Build Coastguard Worker     // equal regardless of number of threads.
228*9356374aSAndroid Build Coastguard Worker     DelayNs(100 * state.threads(), &local);
229*9356374aSAndroid Build Coastguard Worker     RaiiLocker<MutexType> locker(&shared->mu);
230*9356374aSAndroid Build Coastguard Worker     DelayNs(state.range(0), &shared->data);
231*9356374aSAndroid Build Coastguard Worker   }
232*9356374aSAndroid Build Coastguard Worker }
SetupBenchmarkArgs(benchmark::internal::Benchmark * bm,bool do_test_priorities)233*9356374aSAndroid Build Coastguard Worker void SetupBenchmarkArgs(benchmark::internal::Benchmark* bm,
234*9356374aSAndroid Build Coastguard Worker                         bool do_test_priorities) {
235*9356374aSAndroid Build Coastguard Worker   const int max_num_priorities = do_test_priorities ? 2 : 1;
236*9356374aSAndroid Build Coastguard Worker   bm->UseRealTime()
237*9356374aSAndroid Build Coastguard Worker       // ThreadPerCpu poorly handles non-power-of-two CPU counts.
238*9356374aSAndroid Build Coastguard Worker       ->Threads(1)
239*9356374aSAndroid Build Coastguard Worker       ->Threads(2)
240*9356374aSAndroid Build Coastguard Worker       ->Threads(4)
241*9356374aSAndroid Build Coastguard Worker       ->Threads(6)
242*9356374aSAndroid Build Coastguard Worker       ->Threads(8)
243*9356374aSAndroid Build Coastguard Worker       ->Threads(12)
244*9356374aSAndroid Build Coastguard Worker       ->Threads(16)
245*9356374aSAndroid Build Coastguard Worker       ->Threads(24)
246*9356374aSAndroid Build Coastguard Worker       ->Threads(32)
247*9356374aSAndroid Build Coastguard Worker       ->Threads(48)
248*9356374aSAndroid Build Coastguard Worker       ->Threads(64)
249*9356374aSAndroid Build Coastguard Worker       ->Threads(96)
250*9356374aSAndroid Build Coastguard Worker       ->Threads(128)
251*9356374aSAndroid Build Coastguard Worker       ->Threads(192)
252*9356374aSAndroid Build Coastguard Worker       ->Threads(256)
253*9356374aSAndroid Build Coastguard Worker       ->ArgNames({"cs_ns", "num_prios"});
254*9356374aSAndroid Build Coastguard Worker   // Some empirically chosen amounts of work in critical section.
255*9356374aSAndroid Build Coastguard Worker   // 1 is low contention, 2000 is high contention and few values in between.
256*9356374aSAndroid Build Coastguard Worker   for (int critical_section_ns : {1, 20, 50, 200, 2000}) {
257*9356374aSAndroid Build Coastguard Worker     for (int num_priorities = 1; num_priorities <= max_num_priorities;
258*9356374aSAndroid Build Coastguard Worker          num_priorities++) {
259*9356374aSAndroid Build Coastguard Worker       bm->ArgPair(critical_section_ns, num_priorities);
260*9356374aSAndroid Build Coastguard Worker     }
261*9356374aSAndroid Build Coastguard Worker   }
262*9356374aSAndroid Build Coastguard Worker }
263*9356374aSAndroid Build Coastguard Worker 
264*9356374aSAndroid Build Coastguard Worker BENCHMARK_TEMPLATE(BM_Contended, absl::Mutex)
__anon24d683790202(benchmark::internal::Benchmark* bm) 265*9356374aSAndroid Build Coastguard Worker     ->Apply([](benchmark::internal::Benchmark* bm) {
266*9356374aSAndroid Build Coastguard Worker       SetupBenchmarkArgs(bm, /*do_test_priorities=*/true);
267*9356374aSAndroid Build Coastguard Worker     });
268*9356374aSAndroid Build Coastguard Worker 
269*9356374aSAndroid Build Coastguard Worker BENCHMARK_TEMPLATE(BM_Contended, absl::base_internal::SpinLock)
__anon24d683790302(benchmark::internal::Benchmark* bm) 270*9356374aSAndroid Build Coastguard Worker     ->Apply([](benchmark::internal::Benchmark* bm) {
271*9356374aSAndroid Build Coastguard Worker       SetupBenchmarkArgs(bm, /*do_test_priorities=*/false);
272*9356374aSAndroid Build Coastguard Worker     });
273*9356374aSAndroid Build Coastguard Worker 
274*9356374aSAndroid Build Coastguard Worker BENCHMARK_TEMPLATE(BM_Contended, std::mutex)
__anon24d683790402(benchmark::internal::Benchmark* bm) 275*9356374aSAndroid Build Coastguard Worker     ->Apply([](benchmark::internal::Benchmark* bm) {
276*9356374aSAndroid Build Coastguard Worker       SetupBenchmarkArgs(bm, /*do_test_priorities=*/false);
277*9356374aSAndroid Build Coastguard Worker     });
278*9356374aSAndroid Build Coastguard Worker 
279*9356374aSAndroid Build Coastguard Worker // Measure the overhead of conditions on mutex release (when they must be
280*9356374aSAndroid Build Coastguard Worker // evaluated).  Mutex has (some) support for equivalence classes allowing
281*9356374aSAndroid Build Coastguard Worker // Conditions with the same function/argument to potentially not be multiply
282*9356374aSAndroid Build Coastguard Worker // evaluated.
283*9356374aSAndroid Build Coastguard Worker //
284*9356374aSAndroid Build Coastguard Worker // num_classes==0 is used for the special case of every waiter being distinct.
BM_ConditionWaiters(benchmark::State & state)285*9356374aSAndroid Build Coastguard Worker void BM_ConditionWaiters(benchmark::State& state) {
286*9356374aSAndroid Build Coastguard Worker   int num_classes = state.range(0);
287*9356374aSAndroid Build Coastguard Worker   int num_waiters = state.range(1);
288*9356374aSAndroid Build Coastguard Worker 
289*9356374aSAndroid Build Coastguard Worker   struct Helper {
290*9356374aSAndroid Build Coastguard Worker     static void Waiter(absl::BlockingCounter* init, absl::Mutex* m, int* p) {
291*9356374aSAndroid Build Coastguard Worker       init->DecrementCount();
292*9356374aSAndroid Build Coastguard Worker       m->LockWhen(absl::Condition(
293*9356374aSAndroid Build Coastguard Worker           static_cast<bool (*)(int*)>([](int* v) { return *v == 0; }), p));
294*9356374aSAndroid Build Coastguard Worker       m->Unlock();
295*9356374aSAndroid Build Coastguard Worker     }
296*9356374aSAndroid Build Coastguard Worker   };
297*9356374aSAndroid Build Coastguard Worker 
298*9356374aSAndroid Build Coastguard Worker   if (num_classes == 0) {
299*9356374aSAndroid Build Coastguard Worker     // No equivalence classes.
300*9356374aSAndroid Build Coastguard Worker     num_classes = num_waiters;
301*9356374aSAndroid Build Coastguard Worker   }
302*9356374aSAndroid Build Coastguard Worker 
303*9356374aSAndroid Build Coastguard Worker   absl::BlockingCounter init(num_waiters);
304*9356374aSAndroid Build Coastguard Worker   absl::Mutex mu;
305*9356374aSAndroid Build Coastguard Worker   std::vector<int> equivalence_classes(num_classes, 1);
306*9356374aSAndroid Build Coastguard Worker 
307*9356374aSAndroid Build Coastguard Worker   // Must be declared last to be destroyed first.
308*9356374aSAndroid Build Coastguard Worker   absl::synchronization_internal::ThreadPool pool(num_waiters);
309*9356374aSAndroid Build Coastguard Worker 
310*9356374aSAndroid Build Coastguard Worker   for (int i = 0; i < num_waiters; i++) {
311*9356374aSAndroid Build Coastguard Worker     // Mutex considers Conditions with the same function and argument
312*9356374aSAndroid Build Coastguard Worker     // to be equivalent.
313*9356374aSAndroid Build Coastguard Worker     pool.Schedule([&, i] {
314*9356374aSAndroid Build Coastguard Worker       Helper::Waiter(&init, &mu, &equivalence_classes[i % num_classes]);
315*9356374aSAndroid Build Coastguard Worker     });
316*9356374aSAndroid Build Coastguard Worker   }
317*9356374aSAndroid Build Coastguard Worker   init.Wait();
318*9356374aSAndroid Build Coastguard Worker 
319*9356374aSAndroid Build Coastguard Worker   for (auto _ : state) {
320*9356374aSAndroid Build Coastguard Worker     mu.Lock();
321*9356374aSAndroid Build Coastguard Worker     mu.Unlock();  // Each unlock requires Condition evaluation for our waiters.
322*9356374aSAndroid Build Coastguard Worker   }
323*9356374aSAndroid Build Coastguard Worker 
324*9356374aSAndroid Build Coastguard Worker   mu.Lock();
325*9356374aSAndroid Build Coastguard Worker   for (int i = 0; i < num_classes; i++) {
326*9356374aSAndroid Build Coastguard Worker     equivalence_classes[i] = 0;
327*9356374aSAndroid Build Coastguard Worker   }
328*9356374aSAndroid Build Coastguard Worker   mu.Unlock();
329*9356374aSAndroid Build Coastguard Worker }
330*9356374aSAndroid Build Coastguard Worker 
331*9356374aSAndroid Build Coastguard Worker // Some configurations have higher thread limits than others.
332*9356374aSAndroid Build Coastguard Worker #if defined(__linux__) && !defined(ABSL_HAVE_THREAD_SANITIZER)
333*9356374aSAndroid Build Coastguard Worker constexpr int kMaxConditionWaiters = 8192;
334*9356374aSAndroid Build Coastguard Worker #else
335*9356374aSAndroid Build Coastguard Worker constexpr int kMaxConditionWaiters = 1024;
336*9356374aSAndroid Build Coastguard Worker #endif
337*9356374aSAndroid Build Coastguard Worker BENCHMARK(BM_ConditionWaiters)->RangePair(0, 2, 1, kMaxConditionWaiters);
338*9356374aSAndroid Build Coastguard Worker 
339*9356374aSAndroid Build Coastguard Worker }  // namespace
340