1*4bdc9457SAndroid Build Coastguard Worker // Copyright 2022 Google LLC
2*4bdc9457SAndroid Build Coastguard Worker //
3*4bdc9457SAndroid Build Coastguard Worker // This source code is licensed under the BSD-style license found in the
4*4bdc9457SAndroid Build Coastguard Worker // LICENSE file in the root directory of this source tree.
5*4bdc9457SAndroid Build Coastguard Worker
6*4bdc9457SAndroid Build Coastguard Worker #include <algorithm>
7*4bdc9457SAndroid Build Coastguard Worker #include <cmath>
8*4bdc9457SAndroid Build Coastguard Worker #include <cstddef>
9*4bdc9457SAndroid Build Coastguard Worker #include <cstdint>
10*4bdc9457SAndroid Build Coastguard Worker #include <cstdlib>
11*4bdc9457SAndroid Build Coastguard Worker #include <vector>
12*4bdc9457SAndroid Build Coastguard Worker
13*4bdc9457SAndroid Build Coastguard Worker #include <gtest/gtest.h>
14*4bdc9457SAndroid Build Coastguard Worker
15*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/aligned-allocator.h>
16*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/common.h>
17*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/math-stubs.h>
18*4bdc9457SAndroid Build Coastguard Worker
19*4bdc9457SAndroid Build Coastguard Worker
20*4bdc9457SAndroid Build Coastguard Worker constexpr int kBlockSize = 1024;
21*4bdc9457SAndroid Build Coastguard Worker
22*4bdc9457SAndroid Build Coastguard Worker
TEST(SQRT__SCALAR_BITMANIP,uint16_output)23*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_BITMANIP, uint16_output) {
24*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
25*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
26*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 0; n <= UINT32_C(4294901760); n += kBlockSize) {
27*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
28*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::min<uint32_t>(n + i, UINT32_C(4294901760));
29*4bdc9457SAndroid Build Coastguard Worker }
30*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_bitmanip(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
31*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
32*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
33*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
34*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_output = int64_t(uint64_t(output) * uint64_t(output));
35*4bdc9457SAndroid Build Coastguard Worker
36*4bdc9457SAndroid Build Coastguard Worker const uint32_t prev_output = output - 1;
37*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_prev_output = int64_t(uint64_t(prev_output) * uint64_t(prev_output));
38*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_prev_output - int64_t(input)))
39*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
40*4bdc9457SAndroid Build Coastguard Worker
41*4bdc9457SAndroid Build Coastguard Worker const uint32_t next_output = output + 1;
42*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_next_output = int64_t(uint64_t(next_output) * uint64_t(next_output));
43*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_next_output - int64_t(input)))
44*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
45*4bdc9457SAndroid Build Coastguard Worker }
46*4bdc9457SAndroid Build Coastguard Worker }
47*4bdc9457SAndroid Build Coastguard Worker }
48*4bdc9457SAndroid Build Coastguard Worker
49*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_BITMANIP, 65536_output) {
50*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
51*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
52*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = UINT32_C(4294901761); n >= UINT32_C(4294901761); n += kBlockSize) {
53*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
54*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::max<uint32_t>(n + i, UINT32_C(4294901761));
55*4bdc9457SAndroid Build Coastguard Worker }
56*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_bitmanip(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
57*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
58*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
59*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
60*4bdc9457SAndroid Build Coastguard Worker ASSERT_EQ(output, UINT32_C(0x00010000))
61*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
62*4bdc9457SAndroid Build Coastguard Worker }
63*4bdc9457SAndroid Build Coastguard Worker }
64*4bdc9457SAndroid Build Coastguard Worker }
65*4bdc9457SAndroid Build Coastguard Worker
66*4bdc9457SAndroid Build Coastguard Worker
TEST(SQRT__SCALAR_CLZ_BINSEARCH,uint16_output)67*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_CLZ_BINSEARCH, uint16_output) {
68*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
69*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
70*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 0; n <= UINT32_C(4294901760); n += kBlockSize) {
71*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
72*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::min<uint32_t>(n + i, UINT32_C(4294901760));
73*4bdc9457SAndroid Build Coastguard Worker }
74*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_clz_binsearch(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
75*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
76*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
77*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
78*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_output = int64_t(uint64_t(output) * uint64_t(output));
79*4bdc9457SAndroid Build Coastguard Worker
80*4bdc9457SAndroid Build Coastguard Worker const uint32_t prev_output = output - 1;
81*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_prev_output = int64_t(uint64_t(prev_output) * uint64_t(prev_output));
82*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_prev_output - int64_t(input)))
83*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
84*4bdc9457SAndroid Build Coastguard Worker
85*4bdc9457SAndroid Build Coastguard Worker const uint32_t next_output = output + 1;
86*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_next_output = int64_t(uint64_t(next_output) * uint64_t(next_output));
87*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_next_output - int64_t(input)))
88*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
89*4bdc9457SAndroid Build Coastguard Worker }
90*4bdc9457SAndroid Build Coastguard Worker }
91*4bdc9457SAndroid Build Coastguard Worker }
92*4bdc9457SAndroid Build Coastguard Worker
93*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_CLZ_BINSEARCH, 65536_output) {
94*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
95*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
96*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = UINT32_C(4294901761); n >= UINT32_C(4294901761); n += kBlockSize) {
97*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
98*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::max<uint32_t>(n + i, UINT32_C(4294901761));
99*4bdc9457SAndroid Build Coastguard Worker }
100*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_clz_binsearch(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
101*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
102*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
103*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
104*4bdc9457SAndroid Build Coastguard Worker ASSERT_EQ(output, UINT32_C(0x00010000))
105*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
106*4bdc9457SAndroid Build Coastguard Worker }
107*4bdc9457SAndroid Build Coastguard Worker }
108*4bdc9457SAndroid Build Coastguard Worker }
109*4bdc9457SAndroid Build Coastguard Worker
110*4bdc9457SAndroid Build Coastguard Worker
TEST(SQRT__SCALAR_CLZ_NEWTON,uint16_output)111*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_CLZ_NEWTON, uint16_output) {
112*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
113*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
114*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 0; n <= UINT32_C(4294901760); n += kBlockSize) {
115*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
116*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::min<uint32_t>(n + i, UINT32_C(4294901760));
117*4bdc9457SAndroid Build Coastguard Worker }
118*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_clz_newton(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
119*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
120*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
121*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
122*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_output = int64_t(uint64_t(output) * uint64_t(output));
123*4bdc9457SAndroid Build Coastguard Worker
124*4bdc9457SAndroid Build Coastguard Worker const uint32_t prev_output = output - 1;
125*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_prev_output = int64_t(uint64_t(prev_output) * uint64_t(prev_output));
126*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_prev_output - int64_t(input)))
127*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
128*4bdc9457SAndroid Build Coastguard Worker
129*4bdc9457SAndroid Build Coastguard Worker const uint32_t next_output = output + 1;
130*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_next_output = int64_t(uint64_t(next_output) * uint64_t(next_output));
131*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_next_output - int64_t(input)))
132*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
133*4bdc9457SAndroid Build Coastguard Worker }
134*4bdc9457SAndroid Build Coastguard Worker }
135*4bdc9457SAndroid Build Coastguard Worker }
136*4bdc9457SAndroid Build Coastguard Worker
137*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_CLZ_NEWTON, 65536_output) {
138*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
139*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
140*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = UINT32_C(4294901761); n >= UINT32_C(4294901761); n += kBlockSize) {
141*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
142*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::max<uint32_t>(n + i, UINT32_C(4294901761));
143*4bdc9457SAndroid Build Coastguard Worker }
144*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_clz_newton(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
145*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
146*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
147*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
148*4bdc9457SAndroid Build Coastguard Worker ASSERT_EQ(output, UINT32_C(0x00010000))
149*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
150*4bdc9457SAndroid Build Coastguard Worker }
151*4bdc9457SAndroid Build Coastguard Worker }
152*4bdc9457SAndroid Build Coastguard Worker }
153*4bdc9457SAndroid Build Coastguard Worker
154*4bdc9457SAndroid Build Coastguard Worker
TEST(SQRT__SCALAR_CVTI32_SQRT_LRINT,uint16_output)155*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_CVTI32_SQRT_LRINT, uint16_output) {
156*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
157*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
158*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 0; n <= UINT32_C(4294901760); n += kBlockSize) {
159*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
160*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::min<uint32_t>(n + i, UINT32_C(4294901760));
161*4bdc9457SAndroid Build Coastguard Worker }
162*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_cvti32_sqrt_lrint(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
163*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
164*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
165*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
166*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_output = int64_t(uint64_t(output) * uint64_t(output));
167*4bdc9457SAndroid Build Coastguard Worker
168*4bdc9457SAndroid Build Coastguard Worker const uint32_t prev_output = output - 1;
169*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_prev_output = int64_t(uint64_t(prev_output) * uint64_t(prev_output));
170*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_prev_output - int64_t(input)))
171*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
172*4bdc9457SAndroid Build Coastguard Worker
173*4bdc9457SAndroid Build Coastguard Worker const uint32_t next_output = output + 1;
174*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_next_output = int64_t(uint64_t(next_output) * uint64_t(next_output));
175*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_next_output - int64_t(input)))
176*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
177*4bdc9457SAndroid Build Coastguard Worker }
178*4bdc9457SAndroid Build Coastguard Worker }
179*4bdc9457SAndroid Build Coastguard Worker }
180*4bdc9457SAndroid Build Coastguard Worker
181*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_CVTI32_SQRT_LRINT, 65536_output) {
182*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
183*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
184*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = UINT32_C(4294901761); n >= UINT32_C(4294901761); n += kBlockSize) {
185*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
186*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::max<uint32_t>(n + i, UINT32_C(4294901761));
187*4bdc9457SAndroid Build Coastguard Worker }
188*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_cvti32_sqrt_lrint(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
189*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
190*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
191*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
192*4bdc9457SAndroid Build Coastguard Worker ASSERT_EQ(output, UINT32_C(0x00010000))
193*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
194*4bdc9457SAndroid Build Coastguard Worker }
195*4bdc9457SAndroid Build Coastguard Worker }
196*4bdc9457SAndroid Build Coastguard Worker }
197*4bdc9457SAndroid Build Coastguard Worker
198*4bdc9457SAndroid Build Coastguard Worker
TEST(SQRT__SCALAR_CVTI64_SQRT_LRINT,uint16_output)199*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_CVTI64_SQRT_LRINT, uint16_output) {
200*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
201*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
202*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 0; n <= UINT32_C(4294901760); n += kBlockSize) {
203*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
204*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::min<uint32_t>(n + i, UINT32_C(4294901760));
205*4bdc9457SAndroid Build Coastguard Worker }
206*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_cvti64_sqrt_lrint(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
207*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
208*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
209*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
210*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_output = int64_t(uint64_t(output) * uint64_t(output));
211*4bdc9457SAndroid Build Coastguard Worker
212*4bdc9457SAndroid Build Coastguard Worker const uint32_t prev_output = output - 1;
213*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_prev_output = int64_t(uint64_t(prev_output) * uint64_t(prev_output));
214*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_prev_output - int64_t(input)))
215*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
216*4bdc9457SAndroid Build Coastguard Worker
217*4bdc9457SAndroid Build Coastguard Worker const uint32_t next_output = output + 1;
218*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_next_output = int64_t(uint64_t(next_output) * uint64_t(next_output));
219*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_next_output - int64_t(input)))
220*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
221*4bdc9457SAndroid Build Coastguard Worker }
222*4bdc9457SAndroid Build Coastguard Worker }
223*4bdc9457SAndroid Build Coastguard Worker }
224*4bdc9457SAndroid Build Coastguard Worker
225*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_CVTI64_SQRT_LRINT, 65536_output) {
226*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
227*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
228*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = UINT32_C(4294901761); n >= UINT32_C(4294901761); n += kBlockSize) {
229*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
230*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::max<uint32_t>(n + i, UINT32_C(4294901761));
231*4bdc9457SAndroid Build Coastguard Worker }
232*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_cvti64_sqrt_lrint(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
233*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
234*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
235*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
236*4bdc9457SAndroid Build Coastguard Worker ASSERT_EQ(output, UINT32_C(0x00010000))
237*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
238*4bdc9457SAndroid Build Coastguard Worker }
239*4bdc9457SAndroid Build Coastguard Worker }
240*4bdc9457SAndroid Build Coastguard Worker }
241*4bdc9457SAndroid Build Coastguard Worker
242*4bdc9457SAndroid Build Coastguard Worker
TEST(SQRT__SCALAR_CVTU32_SQRT_LRINT,uint16_output)243*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_CVTU32_SQRT_LRINT, uint16_output) {
244*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
245*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
246*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 0; n <= UINT32_C(4294901760); n += kBlockSize) {
247*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
248*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::min<uint32_t>(n + i, UINT32_C(4294901760));
249*4bdc9457SAndroid Build Coastguard Worker }
250*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_cvtu32_sqrt_lrint(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
251*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
252*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
253*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
254*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_output = int64_t(uint64_t(output) * uint64_t(output));
255*4bdc9457SAndroid Build Coastguard Worker
256*4bdc9457SAndroid Build Coastguard Worker const uint32_t prev_output = output - 1;
257*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_prev_output = int64_t(uint64_t(prev_output) * uint64_t(prev_output));
258*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_prev_output - int64_t(input)))
259*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
260*4bdc9457SAndroid Build Coastguard Worker
261*4bdc9457SAndroid Build Coastguard Worker const uint32_t next_output = output + 1;
262*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_next_output = int64_t(uint64_t(next_output) * uint64_t(next_output));
263*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_next_output - int64_t(input)))
264*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
265*4bdc9457SAndroid Build Coastguard Worker }
266*4bdc9457SAndroid Build Coastguard Worker }
267*4bdc9457SAndroid Build Coastguard Worker }
268*4bdc9457SAndroid Build Coastguard Worker
269*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_CVTU32_SQRT_LRINT, 65536_output) {
270*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
271*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
272*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = UINT32_C(4294901761); n >= UINT32_C(4294901761); n += kBlockSize) {
273*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
274*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::max<uint32_t>(n + i, UINT32_C(4294901761));
275*4bdc9457SAndroid Build Coastguard Worker }
276*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_cvtu32_sqrt_lrint(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
277*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
278*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
279*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
280*4bdc9457SAndroid Build Coastguard Worker ASSERT_EQ(output, UINT32_C(0x00010000))
281*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
282*4bdc9457SAndroid Build Coastguard Worker }
283*4bdc9457SAndroid Build Coastguard Worker }
284*4bdc9457SAndroid Build Coastguard Worker }
285*4bdc9457SAndroid Build Coastguard Worker
286*4bdc9457SAndroid Build Coastguard Worker
TEST(SQRT__SCALAR_CVTI64_SQRTF_LRINTF,uint16_output)287*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_CVTI64_SQRTF_LRINTF, uint16_output) {
288*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
289*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
290*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 0; n <= UINT32_C(4294901760); n += kBlockSize) {
291*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
292*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::min<uint32_t>(n + i, UINT32_C(4294901760));
293*4bdc9457SAndroid Build Coastguard Worker }
294*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_cvti64_sqrtf_lrintf(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
295*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
296*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
297*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
298*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_output = int64_t(uint64_t(output) * uint64_t(output));
299*4bdc9457SAndroid Build Coastguard Worker
300*4bdc9457SAndroid Build Coastguard Worker const uint32_t prev_output = output - 1;
301*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_prev_output = int64_t(uint64_t(prev_output) * uint64_t(prev_output));
302*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_prev_output - int64_t(input)))
303*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
304*4bdc9457SAndroid Build Coastguard Worker
305*4bdc9457SAndroid Build Coastguard Worker const uint32_t next_output = output + 1;
306*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_next_output = int64_t(uint64_t(next_output) * uint64_t(next_output));
307*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_next_output - int64_t(input)))
308*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
309*4bdc9457SAndroid Build Coastguard Worker }
310*4bdc9457SAndroid Build Coastguard Worker }
311*4bdc9457SAndroid Build Coastguard Worker }
312*4bdc9457SAndroid Build Coastguard Worker
313*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_CVTI64_SQRTF_LRINTF, 65536_output) {
314*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
315*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
316*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = UINT32_C(4294901761); n >= UINT32_C(4294901761); n += kBlockSize) {
317*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
318*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::max<uint32_t>(n + i, UINT32_C(4294901761));
319*4bdc9457SAndroid Build Coastguard Worker }
320*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_cvti64_sqrtf_lrintf(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
321*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
322*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
323*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
324*4bdc9457SAndroid Build Coastguard Worker ASSERT_EQ(output, UINT32_C(0x00010000))
325*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
326*4bdc9457SAndroid Build Coastguard Worker }
327*4bdc9457SAndroid Build Coastguard Worker }
328*4bdc9457SAndroid Build Coastguard Worker }
329*4bdc9457SAndroid Build Coastguard Worker
330*4bdc9457SAndroid Build Coastguard Worker
TEST(SQRT__SCALAR_CVTU32_SQRTF_LRINTF,uint16_output)331*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_CVTU32_SQRTF_LRINTF, uint16_output) {
332*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
333*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
334*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 0; n <= UINT32_C(4294901760); n += kBlockSize) {
335*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
336*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::min<uint32_t>(n + i, UINT32_C(4294901760));
337*4bdc9457SAndroid Build Coastguard Worker }
338*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_cvtu32_sqrtf_lrintf(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
339*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
340*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
341*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
342*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_output = int64_t(uint64_t(output) * uint64_t(output));
343*4bdc9457SAndroid Build Coastguard Worker
344*4bdc9457SAndroid Build Coastguard Worker const uint32_t prev_output = output - 1;
345*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_prev_output = int64_t(uint64_t(prev_output) * uint64_t(prev_output));
346*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_prev_output - int64_t(input)))
347*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
348*4bdc9457SAndroid Build Coastguard Worker
349*4bdc9457SAndroid Build Coastguard Worker const uint32_t next_output = output + 1;
350*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_next_output = int64_t(uint64_t(next_output) * uint64_t(next_output));
351*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_next_output - int64_t(input)))
352*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
353*4bdc9457SAndroid Build Coastguard Worker }
354*4bdc9457SAndroid Build Coastguard Worker }
355*4bdc9457SAndroid Build Coastguard Worker }
356*4bdc9457SAndroid Build Coastguard Worker
357*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_CVTU32_SQRTF_LRINTF, 65536_output) {
358*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
359*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
360*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = UINT32_C(4294901761); n >= UINT32_C(4294901761); n += kBlockSize) {
361*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
362*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::max<uint32_t>(n + i, UINT32_C(4294901761));
363*4bdc9457SAndroid Build Coastguard Worker }
364*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_cvtu32_sqrtf_lrintf(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
365*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
366*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
367*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
368*4bdc9457SAndroid Build Coastguard Worker ASSERT_EQ(output, UINT32_C(0x00010000))
369*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
370*4bdc9457SAndroid Build Coastguard Worker }
371*4bdc9457SAndroid Build Coastguard Worker }
372*4bdc9457SAndroid Build Coastguard Worker }
373*4bdc9457SAndroid Build Coastguard Worker
374*4bdc9457SAndroid Build Coastguard Worker
TEST(SQRT__SCALAR_HASHEMIAN,uint16_output)375*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_HASHEMIAN, uint16_output) {
376*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
377*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
378*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 0; n <= UINT32_C(4294901760); n += kBlockSize) {
379*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
380*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::min<uint32_t>(n + i, UINT32_C(4294901760));
381*4bdc9457SAndroid Build Coastguard Worker }
382*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_hashemian(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
383*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
384*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
385*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
386*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_output = int64_t(uint64_t(output) * uint64_t(output));
387*4bdc9457SAndroid Build Coastguard Worker
388*4bdc9457SAndroid Build Coastguard Worker const uint32_t prev_output = output - 1;
389*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_prev_output = int64_t(uint64_t(prev_output) * uint64_t(prev_output));
390*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_prev_output - int64_t(input)))
391*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
392*4bdc9457SAndroid Build Coastguard Worker
393*4bdc9457SAndroid Build Coastguard Worker const uint32_t next_output = output + 1;
394*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_next_output = int64_t(uint64_t(next_output) * uint64_t(next_output));
395*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_next_output - int64_t(input)))
396*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
397*4bdc9457SAndroid Build Coastguard Worker }
398*4bdc9457SAndroid Build Coastguard Worker }
399*4bdc9457SAndroid Build Coastguard Worker }
400*4bdc9457SAndroid Build Coastguard Worker
401*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_HASHEMIAN, 65536_output) {
402*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
403*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
404*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = UINT32_C(4294901761); n >= UINT32_C(4294901761); n += kBlockSize) {
405*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
406*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::max<uint32_t>(n + i, UINT32_C(4294901761));
407*4bdc9457SAndroid Build Coastguard Worker }
408*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_hashemian(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
409*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
410*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
411*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
412*4bdc9457SAndroid Build Coastguard Worker ASSERT_EQ(output, UINT32_C(0x00010000))
413*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
414*4bdc9457SAndroid Build Coastguard Worker }
415*4bdc9457SAndroid Build Coastguard Worker }
416*4bdc9457SAndroid Build Coastguard Worker }
417*4bdc9457SAndroid Build Coastguard Worker
418*4bdc9457SAndroid Build Coastguard Worker
TEST(SQRT__SCALAR_TFLM,uint16_output)419*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_TFLM, uint16_output) {
420*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
421*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
422*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 0; n <= UINT32_C(4294901760); n += kBlockSize) {
423*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
424*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::min<uint32_t>(n + i, UINT32_C(4294901760));
425*4bdc9457SAndroid Build Coastguard Worker }
426*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_tflm(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
427*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
428*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
429*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
430*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_output = int64_t(uint64_t(output) * uint64_t(output));
431*4bdc9457SAndroid Build Coastguard Worker
432*4bdc9457SAndroid Build Coastguard Worker const uint32_t prev_output = output - 1;
433*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_prev_output = int64_t(uint64_t(prev_output) * uint64_t(prev_output));
434*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_prev_output - int64_t(input)))
435*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
436*4bdc9457SAndroid Build Coastguard Worker
437*4bdc9457SAndroid Build Coastguard Worker const uint32_t next_output = output + 1;
438*4bdc9457SAndroid Build Coastguard Worker const int64_t squared_next_output = int64_t(uint64_t(next_output) * uint64_t(next_output));
439*4bdc9457SAndroid Build Coastguard Worker ASSERT_LT(std::abs(squared_output - int64_t(input)), std::abs(squared_next_output - int64_t(input)))
440*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
441*4bdc9457SAndroid Build Coastguard Worker }
442*4bdc9457SAndroid Build Coastguard Worker }
443*4bdc9457SAndroid Build Coastguard Worker }
444*4bdc9457SAndroid Build Coastguard Worker
TEST(SQRT__SCALAR_TFLM,DISABLED_65536_output)445*4bdc9457SAndroid Build Coastguard Worker TEST(SQRT__SCALAR_TFLM, DISABLED_65536_output) {
446*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> inputs(kBlockSize);
447*4bdc9457SAndroid Build Coastguard Worker std::vector<uint32_t, AlignedAllocator<uint32_t, 64>> outputs(kBlockSize);
448*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = UINT32_C(4294901761); n >= UINT32_C(4294901761); n += kBlockSize) {
449*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
450*4bdc9457SAndroid Build Coastguard Worker inputs[i] = std::max<uint32_t>(n + i, UINT32_C(4294901761));
451*4bdc9457SAndroid Build Coastguard Worker }
452*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_tflm(kBlockSize * sizeof(uint32_t), inputs.data(), outputs.data());
453*4bdc9457SAndroid Build Coastguard Worker for (uint32_t i = 0; i < kBlockSize; i++) {
454*4bdc9457SAndroid Build Coastguard Worker const uint32_t input = inputs[i];
455*4bdc9457SAndroid Build Coastguard Worker const uint32_t output = outputs[i];
456*4bdc9457SAndroid Build Coastguard Worker ASSERT_EQ(output, UINT32_C(0x00010000))
457*4bdc9457SAndroid Build Coastguard Worker << "input = " << input << ", output = " << output;
458*4bdc9457SAndroid Build Coastguard Worker }
459*4bdc9457SAndroid Build Coastguard Worker }
460*4bdc9457SAndroid Build Coastguard Worker }
461