xref: /aosp_15_r20/external/XNNPACK/bench/f32-vsqrt.cc (revision 4bdc94577ba0e567308109d787f7fec7b531ce36)
1*4bdc9457SAndroid Build Coastguard Worker // Copyright 2020 Google LLC
2*4bdc9457SAndroid Build Coastguard Worker //
3*4bdc9457SAndroid Build Coastguard Worker // This source code is licensed under the BSD-style license found in the
4*4bdc9457SAndroid Build Coastguard Worker // LICENSE file in the root directory of this source tree.
5*4bdc9457SAndroid Build Coastguard Worker 
6*4bdc9457SAndroid Build Coastguard Worker #include <algorithm>
7*4bdc9457SAndroid Build Coastguard Worker #include <cmath>
8*4bdc9457SAndroid Build Coastguard Worker #include <functional>
9*4bdc9457SAndroid Build Coastguard Worker #include <random>
10*4bdc9457SAndroid Build Coastguard Worker #include <vector>
11*4bdc9457SAndroid Build Coastguard Worker 
12*4bdc9457SAndroid Build Coastguard Worker #include <benchmark/benchmark.h>
13*4bdc9457SAndroid Build Coastguard Worker #include "bench/utils.h"
14*4bdc9457SAndroid Build Coastguard Worker 
15*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack.h>
16*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/aligned-allocator.h>
17*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/common.h>
18*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/microfnptr.h>
19*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/microparams-init.h>
20*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/vunary.h>
21*4bdc9457SAndroid Build Coastguard Worker 
22*4bdc9457SAndroid Build Coastguard Worker 
f32_vsqrt(benchmark::State & state,xnn_f32_vsqrt_ukernel_function vsqrt,xnn_init_f32_sqrt_params_fn init_params=nullptr,benchmark::utils::IsaCheckFunction isa_check=nullptr)23*4bdc9457SAndroid Build Coastguard Worker static void f32_vsqrt(
24*4bdc9457SAndroid Build Coastguard Worker   benchmark::State& state,
25*4bdc9457SAndroid Build Coastguard Worker   xnn_f32_vsqrt_ukernel_function vsqrt,
26*4bdc9457SAndroid Build Coastguard Worker   xnn_init_f32_sqrt_params_fn init_params = nullptr,
27*4bdc9457SAndroid Build Coastguard Worker   benchmark::utils::IsaCheckFunction isa_check = nullptr)
28*4bdc9457SAndroid Build Coastguard Worker {
29*4bdc9457SAndroid Build Coastguard Worker   if (isa_check && !isa_check(state)) {
30*4bdc9457SAndroid Build Coastguard Worker     return;
31*4bdc9457SAndroid Build Coastguard Worker   }
32*4bdc9457SAndroid Build Coastguard Worker 
33*4bdc9457SAndroid Build Coastguard Worker   const size_t num_elements = state.range(0);
34*4bdc9457SAndroid Build Coastguard Worker   std::vector<float, AlignedAllocator<float, 64>> input(num_elements);
35*4bdc9457SAndroid Build Coastguard Worker   std::vector<float, AlignedAllocator<float, 64>> output(num_elements);
36*4bdc9457SAndroid Build Coastguard Worker 
37*4bdc9457SAndroid Build Coastguard Worker   std::random_device random_device;
38*4bdc9457SAndroid Build Coastguard Worker   auto rng = std::mt19937(random_device());
39*4bdc9457SAndroid Build Coastguard Worker   auto f32rng = std::bind(std::uniform_real_distribution<float>(0.0f, 10.0f), std::ref(rng));
40*4bdc9457SAndroid Build Coastguard Worker   std::generate(input.begin(), input.end(), std::ref(f32rng));
41*4bdc9457SAndroid Build Coastguard Worker   std::fill(output.begin(), output.end(), std::nanf(""));
42*4bdc9457SAndroid Build Coastguard Worker 
43*4bdc9457SAndroid Build Coastguard Worker   union xnn_f32_sqrt_params params;
44*4bdc9457SAndroid Build Coastguard Worker   if (init_params != nullptr) {
45*4bdc9457SAndroid Build Coastguard Worker     init_params(&params);
46*4bdc9457SAndroid Build Coastguard Worker   }
47*4bdc9457SAndroid Build Coastguard Worker   for (auto _ : state) {
48*4bdc9457SAndroid Build Coastguard Worker     vsqrt(num_elements * sizeof(float), input.data(), output.data(), &params);
49*4bdc9457SAndroid Build Coastguard Worker   }
50*4bdc9457SAndroid Build Coastguard Worker 
51*4bdc9457SAndroid Build Coastguard Worker   const uint64_t cpu_frequency = benchmark::utils::GetCurrentCpuFrequency();
52*4bdc9457SAndroid Build Coastguard Worker   if (cpu_frequency != 0) {
53*4bdc9457SAndroid Build Coastguard Worker     state.counters["cpufreq"] = cpu_frequency;
54*4bdc9457SAndroid Build Coastguard Worker   }
55*4bdc9457SAndroid Build Coastguard Worker 
56*4bdc9457SAndroid Build Coastguard Worker   const size_t elements_per_iteration = num_elements;
57*4bdc9457SAndroid Build Coastguard Worker   state.counters["elements"] =
58*4bdc9457SAndroid Build Coastguard Worker     benchmark::Counter(uint64_t(state.iterations()) * elements_per_iteration, benchmark::Counter::kIsRate);
59*4bdc9457SAndroid Build Coastguard Worker 
60*4bdc9457SAndroid Build Coastguard Worker   const size_t bytes_per_iteration = 2 * num_elements * sizeof(float);
61*4bdc9457SAndroid Build Coastguard Worker   state.counters["bytes"] =
62*4bdc9457SAndroid Build Coastguard Worker     benchmark::Counter(uint64_t(state.iterations()) * bytes_per_iteration, benchmark::Counter::kIsRate);
63*4bdc9457SAndroid Build Coastguard Worker }
64*4bdc9457SAndroid Build Coastguard Worker 
65*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_ARM64
66*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neon_sqrt_x4,
67*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neon_sqrt_x4)
68*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
69*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
70*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neon_sqrt_x8,
71*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neon_sqrt_x8)
72*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
73*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
74*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_ARM64
75*4bdc9457SAndroid Build Coastguard Worker 
76*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_ARM64 || XNN_ARCH_ARM64
77*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr1rsqrts1fma1adj_x4,
78*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x4,
79*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
80*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
81*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
82*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
83*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr1rsqrts1fma1adj_x8,
84*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x8,
85*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
86*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
87*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
88*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
89*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr1rsqrts1fma1adj_x12,
90*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x12,
91*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
92*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
93*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
94*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
95*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr1rsqrts1fma1adj_x16,
96*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x16,
97*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
98*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
99*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
100*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
101*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr1rsqrts1fma1adj_x20,
102*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x20,
103*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
104*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
105*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
106*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
107*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr1rsqrts1fma1adj_x24,
108*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x24,
109*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
110*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
111*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
112*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
113*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr1rsqrts1fma1adj_x28,
114*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x28,
115*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
116*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
117*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
118*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
119*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr1rsqrts1fma1adj_x32,
120*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x32,
121*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
122*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
123*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
124*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
125*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr1rsqrts1fma1adj_x36,
126*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x36,
127*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
128*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
129*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
130*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
131*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr1rsqrts1fma1adj_x40,
132*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x40,
133*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
134*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
135*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
136*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
137*4bdc9457SAndroid Build Coastguard Worker 
138*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr2fma1adj_x4,
139*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x4,
140*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
141*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
142*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
143*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
144*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr2fma1adj_x8,
145*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x8,
146*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
147*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
148*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
149*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
150*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr2fma1adj_x12,
151*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x12,
152*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
153*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
154*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
155*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
156*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr2fma1adj_x16,
157*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x16,
158*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
159*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
160*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
161*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
162*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr2fma1adj_x20,
163*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x20,
164*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
165*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
166*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
167*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
168*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr2fma1adj_x24,
169*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x24,
170*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
171*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
172*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
173*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
174*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr2fma1adj_x28,
175*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x28,
176*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
177*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
178*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
179*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
180*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr2fma1adj_x32,
181*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x32,
182*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
183*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
184*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
185*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
186*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr2fma1adj_x36,
187*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x36,
188*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
189*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
190*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
191*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
192*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, neonfma_nr2fma1adj_x40,
193*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x40,
194*4bdc9457SAndroid Build Coastguard Worker                     nullptr /* init params */,
195*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckNEONFMA)
196*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
197*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
198*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_ARM64 || XNN_ARCH_ARM64
199*4bdc9457SAndroid Build Coastguard Worker 
200*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_X86 || XNN_ARCH_X86_64
201*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, avx512f_nr1fma1adj_x16,
202*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x16,
203*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_avx512_params,
204*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckAVX512F)
205*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
206*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
207*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, avx512f_nr1fma1adj_x32,
208*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x32,
209*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_avx512_params,
210*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckAVX512F)
211*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
212*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
213*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, avx512f_nr1fma1adj_x48,
214*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x48,
215*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_avx512_params,
216*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckAVX512F)
217*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
218*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
219*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, avx512f_nr1fma1adj_x64,
220*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x64,
221*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_avx512_params,
222*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckAVX512F)
223*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
224*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
225*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, avx512f_nr1fma1adj_x80,
226*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x80,
227*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_avx512_params,
228*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckAVX512F)
229*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
230*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
231*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, avx512f_nr1fma1adj_x96,
232*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x96,
233*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_avx512_params,
234*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckAVX512F)
235*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
236*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
237*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, avx512f_nr1fma1adj_x112,
238*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x112,
239*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_avx512_params,
240*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckAVX512F)
241*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
242*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
243*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, avx512f_nr1fma1adj_x128,
244*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x128,
245*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_avx512_params,
246*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckAVX512F)
247*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
248*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
249*4bdc9457SAndroid Build Coastguard Worker 
250*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, fma3_nr1fma1adj_x8,
251*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x8,
252*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_fma_params,
253*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckFMA3)
254*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
255*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
256*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, fma3_nr1fma1adj_x16,
257*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x16,
258*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_fma_params,
259*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckFMA3)
260*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
261*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
262*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, fma3_nr1fma1adj_x24,
263*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x24,
264*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_fma_params,
265*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckFMA3)
266*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
267*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
268*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, fma3_nr1fma1adj_x32,
269*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x32,
270*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_fma_params,
271*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckFMA3)
272*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
273*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
274*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, fma3_nr1fma1adj_x40,
275*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x40,
276*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_fma_params,
277*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckFMA3)
278*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
279*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
280*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, fma3_nr1fma1adj_x48,
281*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x48,
282*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_fma_params,
283*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckFMA3)
284*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
285*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
286*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, fma3_nr1fma1adj_x56,
287*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x56,
288*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_fma_params,
289*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckFMA3)
290*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
291*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
292*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, fma3_nr1fma1adj_x64,
293*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x64,
294*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_fma_params,
295*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckFMA3)
296*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
297*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
298*4bdc9457SAndroid Build Coastguard Worker 
299*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, avx_sqrt_x8,
300*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__avx_sqrt_x8,
301*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_avx_params,
302*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckAVX)
303*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
304*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
305*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, avx_sqrt_x16,
306*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__avx_sqrt_x16,
307*4bdc9457SAndroid Build Coastguard Worker                     xnn_init_f32_sqrt_avx_params,
308*4bdc9457SAndroid Build Coastguard Worker                     benchmark::utils::CheckAVX)
309*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
310*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
311*4bdc9457SAndroid Build Coastguard Worker 
312*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, sse_sqrt_x4,
313*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__sse_sqrt_x4)
314*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
315*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
316*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, sse_sqrt_x8,
317*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__sse_sqrt_x8)
318*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
319*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
320*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_X86 || XNN_ARCH_X86_64
321*4bdc9457SAndroid Build Coastguard Worker 
322*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
323*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, wasmsimd_sqrt_x4,
324*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__wasmsimd_sqrt_x4)
325*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
326*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
327*4bdc9457SAndroid Build Coastguard Worker   BENCHMARK_CAPTURE(f32_vsqrt, wasmsimd_sqrt_x8,
328*4bdc9457SAndroid Build Coastguard Worker                     xnn_f32_vsqrt_ukernel__wasmsimd_sqrt_x8)
329*4bdc9457SAndroid Build Coastguard Worker     ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
330*4bdc9457SAndroid Build Coastguard Worker     ->UseRealTime();
331*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
332*4bdc9457SAndroid Build Coastguard Worker 
333*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_CAPTURE(f32_vsqrt, scalar_sqrt_x1,
334*4bdc9457SAndroid Build Coastguard Worker                   xnn_f32_vsqrt_ukernel__scalar_sqrt_x1)
335*4bdc9457SAndroid Build Coastguard Worker   ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
336*4bdc9457SAndroid Build Coastguard Worker   ->UseRealTime();
337*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_CAPTURE(f32_vsqrt, scalar_sqrt_x2,
338*4bdc9457SAndroid Build Coastguard Worker                   xnn_f32_vsqrt_ukernel__scalar_sqrt_x2)
339*4bdc9457SAndroid Build Coastguard Worker   ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
340*4bdc9457SAndroid Build Coastguard Worker   ->UseRealTime();
341*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_CAPTURE(f32_vsqrt, scalar_sqrt_x4,
342*4bdc9457SAndroid Build Coastguard Worker                   xnn_f32_vsqrt_ukernel__scalar_sqrt_x4)
343*4bdc9457SAndroid Build Coastguard Worker   ->Apply(benchmark::utils::UnaryElementwiseParameters<float, float>)
344*4bdc9457SAndroid Build Coastguard Worker   ->UseRealTime();
345*4bdc9457SAndroid Build Coastguard Worker 
346*4bdc9457SAndroid Build Coastguard Worker #ifndef XNNPACK_BENCHMARK_NO_MAIN
347*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_MAIN();
348*4bdc9457SAndroid Build Coastguard Worker #endif
349