xref: /aosp_15_r20/external/XNNPACK/bench/f32-qs8-vcvt.cc (revision 4bdc94577ba0e567308109d787f7fec7b531ce36)
// Copyright 2021 Google LLC
//
// This source code is licensed under the BSD-style license found in the
// LICENSE file in the root directory of this source tree.
5*4bdc9457SAndroid Build Coastguard Worker 
#include <algorithm>
#include <cmath>
#include <cstddef>
#include <cstdint>
#include <functional>
#include <limits>
#include <random>
#include <vector>

#include <benchmark/benchmark.h>
#include <fp16/fp16.h>
#include "bench/utils.h"

#include <xnnpack.h>
#include <xnnpack/aligned-allocator.h>
#include <xnnpack/common.h>
#include <xnnpack/microfnptr.h>
#include <xnnpack/microparams-init.h>
#include <xnnpack/vcvt.h>
22*4bdc9457SAndroid Build Coastguard Worker 
23*4bdc9457SAndroid Build Coastguard Worker 
f32_qs8_vcvt(benchmark::State & state,xnn_f32_qs8_vcvt_ukernel_function cvt,xnn_init_f32_qs8_cvt_params_fn init_params,benchmark::utils::IsaCheckFunction isa_check=nullptr)24*4bdc9457SAndroid Build Coastguard Worker static void f32_qs8_vcvt(
25*4bdc9457SAndroid Build Coastguard Worker   benchmark::State& state,
26*4bdc9457SAndroid Build Coastguard Worker   xnn_f32_qs8_vcvt_ukernel_function cvt,
27*4bdc9457SAndroid Build Coastguard Worker   xnn_init_f32_qs8_cvt_params_fn init_params,
28*4bdc9457SAndroid Build Coastguard Worker   benchmark::utils::IsaCheckFunction isa_check = nullptr)
29*4bdc9457SAndroid Build Coastguard Worker {
30*4bdc9457SAndroid Build Coastguard Worker   if (isa_check && !isa_check(state)) {
31*4bdc9457SAndroid Build Coastguard Worker     return;
32*4bdc9457SAndroid Build Coastguard Worker   }
33*4bdc9457SAndroid Build Coastguard Worker 
34*4bdc9457SAndroid Build Coastguard Worker   const size_t num_elements = state.range(0);
35*4bdc9457SAndroid Build Coastguard Worker 
36*4bdc9457SAndroid Build Coastguard Worker   std::random_device random_device;
37*4bdc9457SAndroid Build Coastguard Worker   auto rng = std::mt19937(random_device());
38*4bdc9457SAndroid Build Coastguard Worker   auto f32rng = std::bind(std::uniform_real_distribution<float>(-10.0f, 10.0f), std::ref(rng));
39*4bdc9457SAndroid Build Coastguard Worker 
40*4bdc9457SAndroid Build Coastguard Worker   std::vector<float, AlignedAllocator<float, 64>> x(num_elements + XNN_EXTRA_BYTES / sizeof(float));
41*4bdc9457SAndroid Build Coastguard Worker   std::vector<int8_t, AlignedAllocator<int8_t, 64>> y(num_elements);
42*4bdc9457SAndroid Build Coastguard Worker   std::generate(x.begin(), x.end(), std::ref(f32rng));
43*4bdc9457SAndroid Build Coastguard Worker   std::fill(y.begin(), y.end(), INT8_C(0xA5));
44*4bdc9457SAndroid Build Coastguard Worker 
45*4bdc9457SAndroid Build Coastguard Worker   xnn_f32_qs8_cvt_params params;
46*4bdc9457SAndroid Build Coastguard Worker   init_params(&params,
47*4bdc9457SAndroid Build Coastguard Worker     25.0f /* scale */,
48*4bdc9457SAndroid Build Coastguard Worker     1 /* output zero point */,
49*4bdc9457SAndroid Build Coastguard Worker     std::numeric_limits<int8_t>::min() + 1 /* output min */,
50*4bdc9457SAndroid Build Coastguard Worker     std::numeric_limits<int8_t>::max() - 1 /* output max */);
51*4bdc9457SAndroid Build Coastguard Worker   for (auto _ : state) {
52*4bdc9457SAndroid Build Coastguard Worker     cvt(num_elements * sizeof(int8_t), x.data(), y.data(), &params);
53*4bdc9457SAndroid Build Coastguard Worker   }
54*4bdc9457SAndroid Build Coastguard Worker 
55*4bdc9457SAndroid Build Coastguard Worker   const uint64_t cpu_frequency = benchmark::utils::GetCurrentCpuFrequency();
56*4bdc9457SAndroid Build Coastguard Worker   if (cpu_frequency != 0) {
57*4bdc9457SAndroid Build Coastguard Worker     state.counters["cpufreq"] = cpu_frequency;
58*4bdc9457SAndroid Build Coastguard Worker   }
59*4bdc9457SAndroid Build Coastguard Worker 
60*4bdc9457SAndroid Build Coastguard Worker   const size_t elements_per_iteration = num_elements;
61*4bdc9457SAndroid Build Coastguard Worker   state.counters["elements"] =
62*4bdc9457SAndroid Build Coastguard Worker     benchmark::Counter(uint64_t(state.iterations()) * elements_per_iteration, benchmark::Counter::kIsRate);
63*4bdc9457SAndroid Build Coastguard Worker 
64*4bdc9457SAndroid Build Coastguard Worker   const size_t bytes_per_iteration = num_elements * (sizeof(int8_t) + sizeof(float));
65*4bdc9457SAndroid Build Coastguard Worker   state.counters["bytes"] =
66*4bdc9457SAndroid Build Coastguard Worker     benchmark::Counter(uint64_t(state.iterations()) * bytes_per_iteration, benchmark::Counter::kIsRate);
67*4bdc9457SAndroid Build Coastguard Worker }
68*4bdc9457SAndroid Build Coastguard Worker 
#if XNN_ARCH_ARM || XNN_ARCH_ARM64
  // NEONv8 microkernels; benchmark::utils::CheckNEONV8 is passed as the ISA check.
  BENCHMARK_CAPTURE(f32_qs8_vcvt, neonv8_x8,
      xnn_f32_qs8_vcvt_ukernel__neonv8_x8, xnn_init_f32_qs8_cvt_neonv8_params,
      benchmark::utils::CheckNEONV8)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, neonv8_x16,
      xnn_f32_qs8_vcvt_ukernel__neonv8_x16, xnn_init_f32_qs8_cvt_neonv8_params,
      benchmark::utils::CheckNEONV8)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, neonv8_x24,
      xnn_f32_qs8_vcvt_ukernel__neonv8_x24, xnn_init_f32_qs8_cvt_neonv8_params,
      benchmark::utils::CheckNEONV8)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, neonv8_x32,
      xnn_f32_qs8_vcvt_ukernel__neonv8_x32, xnn_init_f32_qs8_cvt_neonv8_params,
      benchmark::utils::CheckNEONV8)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();

  // NEON microkernels; benchmark::utils::CheckNEON is passed as the ISA check.
  BENCHMARK_CAPTURE(f32_qs8_vcvt, neon_x8,
      xnn_f32_qs8_vcvt_ukernel__neon_x8, xnn_init_f32_qs8_cvt_neon_params,
      benchmark::utils::CheckNEON)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, neon_x16,
      xnn_f32_qs8_vcvt_ukernel__neon_x16, xnn_init_f32_qs8_cvt_neon_params,
      benchmark::utils::CheckNEON)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, neon_x24,
      xnn_f32_qs8_vcvt_ukernel__neon_x24, xnn_init_f32_qs8_cvt_neon_params,
      benchmark::utils::CheckNEON)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, neon_x32,
      xnn_f32_qs8_vcvt_ukernel__neon_x32, xnn_init_f32_qs8_cvt_neon_params,
      benchmark::utils::CheckNEON)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
#endif  // XNN_ARCH_ARM || XNN_ARCH_ARM64
120*4bdc9457SAndroid Build Coastguard Worker 
#if XNN_ARCH_X86 || XNN_ARCH_X86_64
  // AVX512SKX microkernels; benchmark::utils::CheckAVX512SKX is passed as the ISA check.
  BENCHMARK_CAPTURE(f32_qs8_vcvt, avx512skx_x32,
      xnn_f32_qs8_vcvt_ukernel__avx512skx_x32, xnn_init_f32_qs8_cvt_avx512_params,
      benchmark::utils::CheckAVX512SKX)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, avx512skx_x64,
      xnn_f32_qs8_vcvt_ukernel__avx512skx_x64, xnn_init_f32_qs8_cvt_avx512_params,
      benchmark::utils::CheckAVX512SKX)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, avx512skx_x96,
      xnn_f32_qs8_vcvt_ukernel__avx512skx_x96, xnn_init_f32_qs8_cvt_avx512_params,
      benchmark::utils::CheckAVX512SKX)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, avx512skx_x128,
      xnn_f32_qs8_vcvt_ukernel__avx512skx_x128, xnn_init_f32_qs8_cvt_avx512_params,
      benchmark::utils::CheckAVX512SKX)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();

  // AVX2 microkernels; benchmark::utils::CheckAVX2 is passed as the ISA check.
  BENCHMARK_CAPTURE(f32_qs8_vcvt, avx2_x16,
      xnn_f32_qs8_vcvt_ukernel__avx2_x16, xnn_init_f32_qs8_cvt_avx2_params,
      benchmark::utils::CheckAVX2)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, avx2_x32,
      xnn_f32_qs8_vcvt_ukernel__avx2_x32, xnn_init_f32_qs8_cvt_avx2_params,
      benchmark::utils::CheckAVX2)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, avx2_x48,
      xnn_f32_qs8_vcvt_ukernel__avx2_x48, xnn_init_f32_qs8_cvt_avx2_params,
      benchmark::utils::CheckAVX2)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, avx2_x64,
      xnn_f32_qs8_vcvt_ukernel__avx2_x64, xnn_init_f32_qs8_cvt_avx2_params,
      benchmark::utils::CheckAVX2)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();

  // AVX microkernels; benchmark::utils::CheckAVX is passed as the ISA check.
  BENCHMARK_CAPTURE(f32_qs8_vcvt, avx_x8,
      xnn_f32_qs8_vcvt_ukernel__avx_x8, xnn_init_f32_qs8_cvt_avx_params,
      benchmark::utils::CheckAVX)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, avx_x16,
      xnn_f32_qs8_vcvt_ukernel__avx_x16, xnn_init_f32_qs8_cvt_avx_params,
      benchmark::utils::CheckAVX)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, avx_x24,
      xnn_f32_qs8_vcvt_ukernel__avx_x24, xnn_init_f32_qs8_cvt_avx_params,
      benchmark::utils::CheckAVX)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, avx_x32,
      xnn_f32_qs8_vcvt_ukernel__avx_x32, xnn_init_f32_qs8_cvt_avx_params,
      benchmark::utils::CheckAVX)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();

  // SSE4.1 microkernels; benchmark::utils::CheckSSE41 is passed as the ISA check.
  BENCHMARK_CAPTURE(f32_qs8_vcvt, sse41_x8,
      xnn_f32_qs8_vcvt_ukernel__sse41_x8, xnn_init_f32_qs8_cvt_sse4_params,
      benchmark::utils::CheckSSE41)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, sse41_x16,
      xnn_f32_qs8_vcvt_ukernel__sse41_x16, xnn_init_f32_qs8_cvt_sse4_params,
      benchmark::utils::CheckSSE41)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, sse41_x24,
      xnn_f32_qs8_vcvt_ukernel__sse41_x24, xnn_init_f32_qs8_cvt_sse4_params,
      benchmark::utils::CheckSSE41)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, sse41_x32,
      xnn_f32_qs8_vcvt_ukernel__sse41_x32, xnn_init_f32_qs8_cvt_sse4_params,
      benchmark::utils::CheckSSE41)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();

  // SSE2 microkernels; registered without an ISA check argument.
  BENCHMARK_CAPTURE(f32_qs8_vcvt, sse2_x8,
      xnn_f32_qs8_vcvt_ukernel__sse2_x8, xnn_init_f32_qs8_cvt_sse2_params)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, sse2_x16,
      xnn_f32_qs8_vcvt_ukernel__sse2_x16, xnn_init_f32_qs8_cvt_sse2_params)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, sse2_x24,
      xnn_f32_qs8_vcvt_ukernel__sse2_x24, xnn_init_f32_qs8_cvt_sse2_params)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, sse2_x32,
      xnn_f32_qs8_vcvt_ukernel__sse2_x32, xnn_init_f32_qs8_cvt_sse2_params)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
#endif  // XNN_ARCH_X86 || XNN_ARCH_X86_64
243*4bdc9457SAndroid Build Coastguard Worker 
#if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
  // WAsm SIMD "cvt" microkernels; registered without an ISA check argument.
  BENCHMARK_CAPTURE(f32_qs8_vcvt, wasmsimd_cvt_x8,
      xnn_f32_qs8_vcvt_ukernel__wasmsimd_cvt_x8, xnn_init_f32_qs8_cvt_wasmsimd_cvt_params)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, wasmsimd_cvt_x16,
      xnn_f32_qs8_vcvt_ukernel__wasmsimd_cvt_x16, xnn_init_f32_qs8_cvt_wasmsimd_cvt_params)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, wasmsimd_cvt_x24,
      xnn_f32_qs8_vcvt_ukernel__wasmsimd_cvt_x24, xnn_init_f32_qs8_cvt_wasmsimd_cvt_params)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, wasmsimd_cvt_x32,
      xnn_f32_qs8_vcvt_ukernel__wasmsimd_cvt_x32, xnn_init_f32_qs8_cvt_wasmsimd_cvt_params)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();

  // WAsm SIMD "magic" microkernels; registered without an ISA check argument.
  BENCHMARK_CAPTURE(f32_qs8_vcvt, wasmsimd_magic_x8,
      xnn_f32_qs8_vcvt_ukernel__wasmsimd_magic_x8, xnn_init_f32_qs8_cvt_wasmsimd_magic_params)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, wasmsimd_magic_x16,
      xnn_f32_qs8_vcvt_ukernel__wasmsimd_magic_x16, xnn_init_f32_qs8_cvt_wasmsimd_magic_params)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, wasmsimd_magic_x24,
      xnn_f32_qs8_vcvt_ukernel__wasmsimd_magic_x24, xnn_init_f32_qs8_cvt_wasmsimd_magic_params)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, wasmsimd_magic_x32,
      xnn_f32_qs8_vcvt_ukernel__wasmsimd_magic_x32, xnn_init_f32_qs8_cvt_wasmsimd_magic_params)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
#endif  // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
287*4bdc9457SAndroid Build Coastguard Worker 
#if XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
  // WAsm "fmagic" microkernels; they are initialized with the scalar fmagic
  // parameter initializer and registered without an ISA check argument.
  BENCHMARK_CAPTURE(f32_qs8_vcvt, wasm_fmagic_x1,
      xnn_f32_qs8_vcvt_ukernel__wasm_fmagic_x1, xnn_init_f32_qs8_cvt_scalar_fmagic_params)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, wasm_fmagic_x2,
      xnn_f32_qs8_vcvt_ukernel__wasm_fmagic_x2, xnn_init_f32_qs8_cvt_scalar_fmagic_params)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, wasm_fmagic_x3,
      xnn_f32_qs8_vcvt_ukernel__wasm_fmagic_x3, xnn_init_f32_qs8_cvt_scalar_fmagic_params)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
  BENCHMARK_CAPTURE(f32_qs8_vcvt, wasm_fmagic_x4,
      xnn_f32_qs8_vcvt_ukernel__wasm_fmagic_x4, xnn_init_f32_qs8_cvt_scalar_fmagic_params)
    ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)->UseRealTime();
#endif  // XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
310*4bdc9457SAndroid Build Coastguard Worker 
311*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_CAPTURE(f32_qs8_vcvt, scalar_fmagic_x1,
312*4bdc9457SAndroid Build Coastguard Worker                   xnn_f32_qs8_vcvt_ukernel__scalar_fmagic_x1,
313*4bdc9457SAndroid Build Coastguard Worker                   xnn_init_f32_qs8_cvt_scalar_fmagic_params)
314*4bdc9457SAndroid Build Coastguard Worker   ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)
315*4bdc9457SAndroid Build Coastguard Worker   ->UseRealTime();
316*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_CAPTURE(f32_qs8_vcvt, scalar_fmagic_x2,
317*4bdc9457SAndroid Build Coastguard Worker                   xnn_f32_qs8_vcvt_ukernel__scalar_fmagic_x2,
318*4bdc9457SAndroid Build Coastguard Worker                   xnn_init_f32_qs8_cvt_scalar_fmagic_params)
319*4bdc9457SAndroid Build Coastguard Worker   ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)
320*4bdc9457SAndroid Build Coastguard Worker   ->UseRealTime();
321*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_CAPTURE(f32_qs8_vcvt, scalar_fmagic_x3,
322*4bdc9457SAndroid Build Coastguard Worker                   xnn_f32_qs8_vcvt_ukernel__scalar_fmagic_x3,
323*4bdc9457SAndroid Build Coastguard Worker                   xnn_init_f32_qs8_cvt_scalar_fmagic_params)
324*4bdc9457SAndroid Build Coastguard Worker   ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)
325*4bdc9457SAndroid Build Coastguard Worker   ->UseRealTime();
326*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_CAPTURE(f32_qs8_vcvt, scalar_fmagic_x4,
327*4bdc9457SAndroid Build Coastguard Worker                   xnn_f32_qs8_vcvt_ukernel__scalar_fmagic_x4,
328*4bdc9457SAndroid Build Coastguard Worker                   xnn_init_f32_qs8_cvt_scalar_fmagic_params)
329*4bdc9457SAndroid Build Coastguard Worker   ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)
330*4bdc9457SAndroid Build Coastguard Worker   ->UseRealTime();
331*4bdc9457SAndroid Build Coastguard Worker 
332*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_CAPTURE(f32_qs8_vcvt, scalar_imagic_x1,
333*4bdc9457SAndroid Build Coastguard Worker                   xnn_f32_qs8_vcvt_ukernel__scalar_imagic_x1,
334*4bdc9457SAndroid Build Coastguard Worker                   xnn_init_f32_qs8_cvt_scalar_imagic_params)
335*4bdc9457SAndroid Build Coastguard Worker   ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)
336*4bdc9457SAndroid Build Coastguard Worker   ->UseRealTime();
337*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_CAPTURE(f32_qs8_vcvt, scalar_imagic_x2,
338*4bdc9457SAndroid Build Coastguard Worker                   xnn_f32_qs8_vcvt_ukernel__scalar_imagic_x2,
339*4bdc9457SAndroid Build Coastguard Worker                   xnn_init_f32_qs8_cvt_scalar_imagic_params)
340*4bdc9457SAndroid Build Coastguard Worker   ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)
341*4bdc9457SAndroid Build Coastguard Worker   ->UseRealTime();
342*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_CAPTURE(f32_qs8_vcvt, scalar_imagic_x3,
343*4bdc9457SAndroid Build Coastguard Worker                   xnn_f32_qs8_vcvt_ukernel__scalar_imagic_x3,
344*4bdc9457SAndroid Build Coastguard Worker                   xnn_init_f32_qs8_cvt_scalar_imagic_params)
345*4bdc9457SAndroid Build Coastguard Worker   ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)
346*4bdc9457SAndroid Build Coastguard Worker   ->UseRealTime();
347*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_CAPTURE(f32_qs8_vcvt, scalar_imagic_x4,
348*4bdc9457SAndroid Build Coastguard Worker                   xnn_f32_qs8_vcvt_ukernel__scalar_imagic_x4,
349*4bdc9457SAndroid Build Coastguard Worker                   xnn_init_f32_qs8_cvt_scalar_imagic_params)
350*4bdc9457SAndroid Build Coastguard Worker   ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)
351*4bdc9457SAndroid Build Coastguard Worker   ->UseRealTime();
352*4bdc9457SAndroid Build Coastguard Worker 
353*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_CAPTURE(f32_qs8_vcvt, scalar_lrintf_x1,
354*4bdc9457SAndroid Build Coastguard Worker                   xnn_f32_qs8_vcvt_ukernel__scalar_lrintf_x1,
355*4bdc9457SAndroid Build Coastguard Worker                   xnn_init_f32_qs8_cvt_scalar_lrintf_params)
356*4bdc9457SAndroid Build Coastguard Worker   ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)
357*4bdc9457SAndroid Build Coastguard Worker   ->UseRealTime();
358*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_CAPTURE(f32_qs8_vcvt, scalar_lrintf_x2,
359*4bdc9457SAndroid Build Coastguard Worker                   xnn_f32_qs8_vcvt_ukernel__scalar_lrintf_x2,
360*4bdc9457SAndroid Build Coastguard Worker                   xnn_init_f32_qs8_cvt_scalar_lrintf_params)
361*4bdc9457SAndroid Build Coastguard Worker   ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)
362*4bdc9457SAndroid Build Coastguard Worker   ->UseRealTime();
363*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_CAPTURE(f32_qs8_vcvt, scalar_lrintf_x3,
364*4bdc9457SAndroid Build Coastguard Worker                   xnn_f32_qs8_vcvt_ukernel__scalar_lrintf_x3,
365*4bdc9457SAndroid Build Coastguard Worker                   xnn_init_f32_qs8_cvt_scalar_lrintf_params)
366*4bdc9457SAndroid Build Coastguard Worker   ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)
367*4bdc9457SAndroid Build Coastguard Worker   ->UseRealTime();
368*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_CAPTURE(f32_qs8_vcvt, scalar_lrintf_x4,
369*4bdc9457SAndroid Build Coastguard Worker                   xnn_f32_qs8_vcvt_ukernel__scalar_lrintf_x4,
370*4bdc9457SAndroid Build Coastguard Worker                   xnn_init_f32_qs8_cvt_scalar_lrintf_params)
371*4bdc9457SAndroid Build Coastguard Worker   ->Apply(benchmark::utils::UnaryElementwiseParameters<float, int8_t>)
372*4bdc9457SAndroid Build Coastguard Worker   ->UseRealTime();
373*4bdc9457SAndroid Build Coastguard Worker 
374*4bdc9457SAndroid Build Coastguard Worker #ifndef XNNPACK_BENCHMARK_NO_MAIN
375*4bdc9457SAndroid Build Coastguard Worker BENCHMARK_MAIN();
376*4bdc9457SAndroid Build Coastguard Worker #endif
377