/*
 * Copyright (c) 2016, Alliance for Open Media. All rights reserved.
 *
 * This source code is subject to the terms of the BSD 2 Clause License and
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
 * was not distributed with this source code in the LICENSE file, you can
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
 * Media Patent License 1.0 was not distributed with this source code in the
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
 */
11*77c1e3ccSAndroid Build Coastguard Worker
12*77c1e3ccSAndroid Build Coastguard Worker #include <cmath>
13*77c1e3ccSAndroid Build Coastguard Worker #include <cstdlib>
14*77c1e3ccSAndroid Build Coastguard Worker #include <string>
15*77c1e3ccSAndroid Build Coastguard Worker #include <tuple>
16*77c1e3ccSAndroid Build Coastguard Worker
17*77c1e3ccSAndroid Build Coastguard Worker #include "gtest/gtest.h"
18*77c1e3ccSAndroid Build Coastguard Worker
19*77c1e3ccSAndroid Build Coastguard Worker #include "config/aom_config.h"
20*77c1e3ccSAndroid Build Coastguard Worker #include "config/aom_dsp_rtcd.h"
21*77c1e3ccSAndroid Build Coastguard Worker
22*77c1e3ccSAndroid Build Coastguard Worker #include "aom_ports/mem.h"
23*77c1e3ccSAndroid Build Coastguard Worker #include "av1/common/common_data.h"
24*77c1e3ccSAndroid Build Coastguard Worker #include "test/acm_random.h"
25*77c1e3ccSAndroid Build Coastguard Worker #include "test/register_state_check.h"
26*77c1e3ccSAndroid Build Coastguard Worker #include "test/util.h"
27*77c1e3ccSAndroid Build Coastguard Worker #include "test/function_equivalence_test.h"
28*77c1e3ccSAndroid Build Coastguard Worker
29*77c1e3ccSAndroid Build Coastguard Worker using libaom_test::ACMRandom;
30*77c1e3ccSAndroid Build Coastguard Worker using libaom_test::FunctionEquivalenceTest;
31*77c1e3ccSAndroid Build Coastguard Worker using ::testing::Combine;
32*77c1e3ccSAndroid Build Coastguard Worker using ::testing::Range;
33*77c1e3ccSAndroid Build Coastguard Worker using ::testing::Values;
34*77c1e3ccSAndroid Build Coastguard Worker using ::testing::ValuesIn;
35*77c1e3ccSAndroid Build Coastguard Worker
36*77c1e3ccSAndroid Build Coastguard Worker namespace {
37*77c1e3ccSAndroid Build Coastguard Worker const int kNumIterations = 10000;
38*77c1e3ccSAndroid Build Coastguard Worker
39*77c1e3ccSAndroid Build Coastguard Worker static const int16_t kInt13Max = (1 << 12) - 1;
40*77c1e3ccSAndroid Build Coastguard Worker
41*77c1e3ccSAndroid Build Coastguard Worker typedef uint64_t (*SSI16Func)(const int16_t *src, int stride, int width,
42*77c1e3ccSAndroid Build Coastguard Worker int height);
43*77c1e3ccSAndroid Build Coastguard Worker typedef libaom_test::FuncParam<SSI16Func> TestFuncs;
44*77c1e3ccSAndroid Build Coastguard Worker
45*77c1e3ccSAndroid Build Coastguard Worker class SumSquaresTest : public ::testing::TestWithParam<TestFuncs> {
46*77c1e3ccSAndroid Build Coastguard Worker public:
47*77c1e3ccSAndroid Build Coastguard Worker ~SumSquaresTest() override = default;
SetUp()48*77c1e3ccSAndroid Build Coastguard Worker void SetUp() override {
49*77c1e3ccSAndroid Build Coastguard Worker params_ = this->GetParam();
50*77c1e3ccSAndroid Build Coastguard Worker rnd_.Reset(ACMRandom::DeterministicSeed());
51*77c1e3ccSAndroid Build Coastguard Worker src_ = reinterpret_cast<int16_t *>(aom_memalign(16, 256 * 256 * 2));
52*77c1e3ccSAndroid Build Coastguard Worker ASSERT_NE(src_, nullptr);
53*77c1e3ccSAndroid Build Coastguard Worker }
54*77c1e3ccSAndroid Build Coastguard Worker
TearDown()55*77c1e3ccSAndroid Build Coastguard Worker void TearDown() override { aom_free(src_); }
56*77c1e3ccSAndroid Build Coastguard Worker void RunTest(bool is_random);
57*77c1e3ccSAndroid Build Coastguard Worker void RunSpeedTest();
58*77c1e3ccSAndroid Build Coastguard Worker
GenRandomData(int width,int height,int stride)59*77c1e3ccSAndroid Build Coastguard Worker void GenRandomData(int width, int height, int stride) {
60*77c1e3ccSAndroid Build Coastguard Worker const int msb = 11; // Up to 12 bit input
61*77c1e3ccSAndroid Build Coastguard Worker const int limit = 1 << (msb + 1);
62*77c1e3ccSAndroid Build Coastguard Worker for (int ii = 0; ii < height; ii++) {
63*77c1e3ccSAndroid Build Coastguard Worker for (int jj = 0; jj < width; jj++) {
64*77c1e3ccSAndroid Build Coastguard Worker src_[ii * stride + jj] = rnd_(2) ? rnd_(limit) : -rnd_(limit);
65*77c1e3ccSAndroid Build Coastguard Worker }
66*77c1e3ccSAndroid Build Coastguard Worker }
67*77c1e3ccSAndroid Build Coastguard Worker }
68*77c1e3ccSAndroid Build Coastguard Worker
GenExtremeData(int width,int height,int stride)69*77c1e3ccSAndroid Build Coastguard Worker void GenExtremeData(int width, int height, int stride) {
70*77c1e3ccSAndroid Build Coastguard Worker const int msb = 11; // Up to 12 bit input
71*77c1e3ccSAndroid Build Coastguard Worker const int limit = 1 << (msb + 1);
72*77c1e3ccSAndroid Build Coastguard Worker const int val = rnd_(2) ? limit - 1 : -(limit - 1);
73*77c1e3ccSAndroid Build Coastguard Worker for (int ii = 0; ii < height; ii++) {
74*77c1e3ccSAndroid Build Coastguard Worker for (int jj = 0; jj < width; jj++) {
75*77c1e3ccSAndroid Build Coastguard Worker src_[ii * stride + jj] = val;
76*77c1e3ccSAndroid Build Coastguard Worker }
77*77c1e3ccSAndroid Build Coastguard Worker }
78*77c1e3ccSAndroid Build Coastguard Worker }
79*77c1e3ccSAndroid Build Coastguard Worker
80*77c1e3ccSAndroid Build Coastguard Worker protected:
81*77c1e3ccSAndroid Build Coastguard Worker TestFuncs params_;
82*77c1e3ccSAndroid Build Coastguard Worker int16_t *src_;
83*77c1e3ccSAndroid Build Coastguard Worker ACMRandom rnd_;
84*77c1e3ccSAndroid Build Coastguard Worker };
85*77c1e3ccSAndroid Build Coastguard Worker GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(SumSquaresTest);
86*77c1e3ccSAndroid Build Coastguard Worker
RunTest(bool is_random)87*77c1e3ccSAndroid Build Coastguard Worker void SumSquaresTest::RunTest(bool is_random) {
88*77c1e3ccSAndroid Build Coastguard Worker int failed = 0;
89*77c1e3ccSAndroid Build Coastguard Worker for (int k = 0; k < kNumIterations; k++) {
90*77c1e3ccSAndroid Build Coastguard Worker const int width = 4 * (rnd_(31) + 1); // Up to 128x128
91*77c1e3ccSAndroid Build Coastguard Worker const int height = 4 * (rnd_(31) + 1); // Up to 128x128
92*77c1e3ccSAndroid Build Coastguard Worker int stride = 4 << rnd_(7); // Up to 256 stride
93*77c1e3ccSAndroid Build Coastguard Worker while (stride < width) { // Make sure it's valid
94*77c1e3ccSAndroid Build Coastguard Worker stride = 4 << rnd_(7);
95*77c1e3ccSAndroid Build Coastguard Worker }
96*77c1e3ccSAndroid Build Coastguard Worker if (is_random) {
97*77c1e3ccSAndroid Build Coastguard Worker GenRandomData(width, height, stride);
98*77c1e3ccSAndroid Build Coastguard Worker } else {
99*77c1e3ccSAndroid Build Coastguard Worker GenExtremeData(width, height, stride);
100*77c1e3ccSAndroid Build Coastguard Worker }
101*77c1e3ccSAndroid Build Coastguard Worker const uint64_t res_ref = params_.ref_func(src_, stride, width, height);
102*77c1e3ccSAndroid Build Coastguard Worker uint64_t res_tst;
103*77c1e3ccSAndroid Build Coastguard Worker API_REGISTER_STATE_CHECK(res_tst =
104*77c1e3ccSAndroid Build Coastguard Worker params_.tst_func(src_, stride, width, height));
105*77c1e3ccSAndroid Build Coastguard Worker
106*77c1e3ccSAndroid Build Coastguard Worker if (!failed) {
107*77c1e3ccSAndroid Build Coastguard Worker failed = res_ref != res_tst;
108*77c1e3ccSAndroid Build Coastguard Worker EXPECT_EQ(res_ref, res_tst)
109*77c1e3ccSAndroid Build Coastguard Worker << "Error: Sum Squares Test [" << width << "x" << height
110*77c1e3ccSAndroid Build Coastguard Worker << "] C output does not match optimized output.";
111*77c1e3ccSAndroid Build Coastguard Worker }
112*77c1e3ccSAndroid Build Coastguard Worker }
113*77c1e3ccSAndroid Build Coastguard Worker }
114*77c1e3ccSAndroid Build Coastguard Worker
RunSpeedTest()115*77c1e3ccSAndroid Build Coastguard Worker void SumSquaresTest::RunSpeedTest() {
116*77c1e3ccSAndroid Build Coastguard Worker for (int block = BLOCK_4X4; block < BLOCK_SIZES_ALL; block++) {
117*77c1e3ccSAndroid Build Coastguard Worker const int width = block_size_wide[block]; // Up to 128x128
118*77c1e3ccSAndroid Build Coastguard Worker const int height = block_size_high[block]; // Up to 128x128
119*77c1e3ccSAndroid Build Coastguard Worker int stride = 4 << rnd_(7); // Up to 256 stride
120*77c1e3ccSAndroid Build Coastguard Worker while (stride < width) { // Make sure it's valid
121*77c1e3ccSAndroid Build Coastguard Worker stride = 4 << rnd_(7);
122*77c1e3ccSAndroid Build Coastguard Worker }
123*77c1e3ccSAndroid Build Coastguard Worker GenExtremeData(width, height, stride);
124*77c1e3ccSAndroid Build Coastguard Worker const int num_loops = 1000000000 / (width + height);
125*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer timer;
126*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_start(&timer);
127*77c1e3ccSAndroid Build Coastguard Worker
128*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < num_loops; ++i)
129*77c1e3ccSAndroid Build Coastguard Worker params_.ref_func(src_, stride, width, height);
130*77c1e3ccSAndroid Build Coastguard Worker
131*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_mark(&timer);
132*77c1e3ccSAndroid Build Coastguard Worker const int elapsed_time = static_cast<int>(aom_usec_timer_elapsed(&timer));
133*77c1e3ccSAndroid Build Coastguard Worker printf("SumSquaresTest C %3dx%-3d: %7.2f ns\n", width, height,
134*77c1e3ccSAndroid Build Coastguard Worker 1000.0 * elapsed_time / num_loops);
135*77c1e3ccSAndroid Build Coastguard Worker
136*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer timer1;
137*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_start(&timer1);
138*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < num_loops; ++i)
139*77c1e3ccSAndroid Build Coastguard Worker params_.tst_func(src_, stride, width, height);
140*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_mark(&timer1);
141*77c1e3ccSAndroid Build Coastguard Worker const int elapsed_time1 = static_cast<int>(aom_usec_timer_elapsed(&timer1));
142*77c1e3ccSAndroid Build Coastguard Worker printf("SumSquaresTest Test %3dx%-3d: %7.2f ns\n", width, height,
143*77c1e3ccSAndroid Build Coastguard Worker 1000.0 * elapsed_time1 / num_loops);
144*77c1e3ccSAndroid Build Coastguard Worker }
145*77c1e3ccSAndroid Build Coastguard Worker }
146*77c1e3ccSAndroid Build Coastguard Worker
// Random input data (GenRandomData).
TEST_P(SumSquaresTest, OperationCheck) {
  const bool use_random_data = true;
  RunTest(use_random_data);
}

// Constant extreme input data (GenExtremeData).
TEST_P(SumSquaresTest, ExtremeValues) {
  const bool use_random_data = false;
  RunTest(use_random_data);
}

// Benchmark; disabled by default.
TEST_P(SumSquaresTest, DISABLED_Speed) {
  RunSpeedTest();
}
156*77c1e3ccSAndroid Build Coastguard Worker
// Each enabled instruction set pairs its aom_sum_squares_2d_i16
// implementation with the C version used as reference.
#if HAVE_SSE2
INSTANTIATE_TEST_SUITE_P(SSE2, SumSquaresTest,
                         Values(TestFuncs(&aom_sum_squares_2d_i16_c,
                                          &aom_sum_squares_2d_i16_sse2)));
#endif  // HAVE_SSE2

#if HAVE_NEON
INSTANTIATE_TEST_SUITE_P(NEON, SumSquaresTest,
                         Values(TestFuncs(&aom_sum_squares_2d_i16_c,
                                          &aom_sum_squares_2d_i16_neon)));
#endif  // HAVE_NEON

#if HAVE_SVE
INSTANTIATE_TEST_SUITE_P(SVE, SumSquaresTest,
                         Values(TestFuncs(&aom_sum_squares_2d_i16_c,
                                          &aom_sum_squares_2d_i16_sve)));
#endif  // HAVE_SVE

#if HAVE_AVX2
INSTANTIATE_TEST_SUITE_P(AVX2, SumSquaresTest,
                         Values(TestFuncs(&aom_sum_squares_2d_i16_c,
                                          &aom_sum_squares_2d_i16_avx2)));
#endif  // HAVE_AVX2
189*77c1e3ccSAndroid Build Coastguard Worker
//////////////////////////////////////////////////////////////////////////////
// 1D version
//////////////////////////////////////////////////////////////////////////////
193*77c1e3ccSAndroid Build Coastguard Worker
194*77c1e3ccSAndroid Build Coastguard Worker typedef uint64_t (*F1D)(const int16_t *src, uint32_t n);
195*77c1e3ccSAndroid Build Coastguard Worker typedef libaom_test::FuncParam<F1D> TestFuncs1D;
196*77c1e3ccSAndroid Build Coastguard Worker
197*77c1e3ccSAndroid Build Coastguard Worker class SumSquares1DTest : public FunctionEquivalenceTest<F1D> {
198*77c1e3ccSAndroid Build Coastguard Worker protected:
199*77c1e3ccSAndroid Build Coastguard Worker static const int kIterations = 1000;
200*77c1e3ccSAndroid Build Coastguard Worker static const int kMaxSize = 256;
201*77c1e3ccSAndroid Build Coastguard Worker };
202*77c1e3ccSAndroid Build Coastguard Worker GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(SumSquares1DTest);
203*77c1e3ccSAndroid Build Coastguard Worker
// Random samples in [-kInt13Max, kInt13Max]: the tested function must return
// exactly what the reference returns for a randomly chosen length.
TEST_P(SumSquares1DTest, RandomValues) {
  DECLARE_ALIGNED(16, int16_t, src[kMaxSize * kMaxSize]);
  const int num_samples = kMaxSize * kMaxSize;

  for (int iter = 0; iter < kIterations; ++iter) {
    if (HasFatalFailure()) break;

    // Refill the whole buffer before the length is drawn.
    for (int idx = 0; idx < num_samples; ++idx) {
      src[idx] = rng_(kInt13Max * 2 + 1) - kInt13Max;
    }

    // Length is a multiple of 64 and at least 64. Assuming rng_(255) yields
    // [0, 255), the largest length is 255 * 64.
    const int n = 64 * (rng_(255) + 1);

    const uint64_t expected = params_.ref_func(src, n);
    uint64_t actual;
    API_REGISTER_STATE_CHECK(actual = params_.tst_func(src, n));

    ASSERT_EQ(expected, actual);
  }
}
221*77c1e3ccSAndroid Build Coastguard Worker
// Every sample is +kInt13Max or every sample is -kInt13Max (picked per
// trial): the tested function must return exactly what the reference returns.
TEST_P(SumSquares1DTest, ExtremeValues) {
  DECLARE_ALIGNED(16, int16_t, src[kMaxSize * kMaxSize]);
  const int num_samples = kMaxSize * kMaxSize;

  for (int iter = 0; iter < kIterations; ++iter) {
    if (HasFatalFailure()) break;

    // One draw decides the sign used for the whole buffer.
    const int16_t fill = rng_(2) ? kInt13Max : -kInt13Max;
    for (int idx = 0; idx < num_samples; ++idx) {
      src[idx] = fill;
    }

    // Length is a multiple of 64 and at least 64. Assuming rng_(255) yields
    // [0, 255), the largest length is 255 * 64.
    const int n = 64 * (rng_(255) + 1);

    const uint64_t expected = params_.ref_func(src, n);
    uint64_t actual;
    API_REGISTER_STATE_CHECK(actual = params_.tst_func(src, n));

    ASSERT_EQ(expected, actual);
  }
}
242*77c1e3ccSAndroid Build Coastguard Worker
// Each enabled instruction set pairs its aom_sum_squares_i16 implementation
// with the C version used as reference.
#if HAVE_SSE2
INSTANTIATE_TEST_SUITE_P(SSE2, SumSquares1DTest,
                         Values(TestFuncs1D(aom_sum_squares_i16_c,
                                            aom_sum_squares_i16_sse2)));
#endif  // HAVE_SSE2

#if HAVE_NEON
INSTANTIATE_TEST_SUITE_P(NEON, SumSquares1DTest,
                         Values(TestFuncs1D(aom_sum_squares_i16_c,
                                            aom_sum_squares_i16_neon)));
#endif  // HAVE_NEON

#if HAVE_SVE
INSTANTIATE_TEST_SUITE_P(SVE, SumSquares1DTest,
                         Values(TestFuncs1D(aom_sum_squares_i16_c,
                                            aom_sum_squares_i16_sve)));
#endif  // HAVE_SVE
263*77c1e3ccSAndroid Build Coastguard Worker
264*77c1e3ccSAndroid Build Coastguard Worker typedef int64_t (*SSEFunc)(const uint8_t *a, int a_stride, const uint8_t *b,
265*77c1e3ccSAndroid Build Coastguard Worker int b_stride, int width, int height);
266*77c1e3ccSAndroid Build Coastguard Worker typedef libaom_test::FuncParam<SSEFunc> TestSSEFuncs;
267*77c1e3ccSAndroid Build Coastguard Worker
268*77c1e3ccSAndroid Build Coastguard Worker typedef std::tuple<TestSSEFuncs, int> SSETestParam;
269*77c1e3ccSAndroid Build Coastguard Worker
270*77c1e3ccSAndroid Build Coastguard Worker class SSETest : public ::testing::TestWithParam<SSETestParam> {
271*77c1e3ccSAndroid Build Coastguard Worker public:
272*77c1e3ccSAndroid Build Coastguard Worker ~SSETest() override = default;
SetUp()273*77c1e3ccSAndroid Build Coastguard Worker void SetUp() override {
274*77c1e3ccSAndroid Build Coastguard Worker params_ = GET_PARAM(0);
275*77c1e3ccSAndroid Build Coastguard Worker width_ = GET_PARAM(1);
276*77c1e3ccSAndroid Build Coastguard Worker is_hbd_ =
277*77c1e3ccSAndroid Build Coastguard Worker #if CONFIG_AV1_HIGHBITDEPTH
278*77c1e3ccSAndroid Build Coastguard Worker params_.ref_func == aom_highbd_sse_c;
279*77c1e3ccSAndroid Build Coastguard Worker #else
280*77c1e3ccSAndroid Build Coastguard Worker false;
281*77c1e3ccSAndroid Build Coastguard Worker #endif
282*77c1e3ccSAndroid Build Coastguard Worker rnd_.Reset(ACMRandom::DeterministicSeed());
283*77c1e3ccSAndroid Build Coastguard Worker src_ = reinterpret_cast<uint8_t *>(aom_memalign(32, 256 * 256 * 2));
284*77c1e3ccSAndroid Build Coastguard Worker ref_ = reinterpret_cast<uint8_t *>(aom_memalign(32, 256 * 256 * 2));
285*77c1e3ccSAndroid Build Coastguard Worker ASSERT_NE(src_, nullptr);
286*77c1e3ccSAndroid Build Coastguard Worker ASSERT_NE(ref_, nullptr);
287*77c1e3ccSAndroid Build Coastguard Worker }
288*77c1e3ccSAndroid Build Coastguard Worker
TearDown()289*77c1e3ccSAndroid Build Coastguard Worker void TearDown() override {
290*77c1e3ccSAndroid Build Coastguard Worker aom_free(src_);
291*77c1e3ccSAndroid Build Coastguard Worker aom_free(ref_);
292*77c1e3ccSAndroid Build Coastguard Worker }
293*77c1e3ccSAndroid Build Coastguard Worker void RunTest(bool is_random, int width, int height, int run_times);
294*77c1e3ccSAndroid Build Coastguard Worker
GenRandomData(int width,int height,int stride)295*77c1e3ccSAndroid Build Coastguard Worker void GenRandomData(int width, int height, int stride) {
296*77c1e3ccSAndroid Build Coastguard Worker uint16_t *src16 = reinterpret_cast<uint16_t *>(src_);
297*77c1e3ccSAndroid Build Coastguard Worker uint16_t *ref16 = reinterpret_cast<uint16_t *>(ref_);
298*77c1e3ccSAndroid Build Coastguard Worker const int msb = 11; // Up to 12 bit input
299*77c1e3ccSAndroid Build Coastguard Worker const int limit = 1 << (msb + 1);
300*77c1e3ccSAndroid Build Coastguard Worker for (int ii = 0; ii < height; ii++) {
301*77c1e3ccSAndroid Build Coastguard Worker for (int jj = 0; jj < width; jj++) {
302*77c1e3ccSAndroid Build Coastguard Worker if (!is_hbd_) {
303*77c1e3ccSAndroid Build Coastguard Worker src_[ii * stride + jj] = rnd_.Rand8();
304*77c1e3ccSAndroid Build Coastguard Worker ref_[ii * stride + jj] = rnd_.Rand8();
305*77c1e3ccSAndroid Build Coastguard Worker } else {
306*77c1e3ccSAndroid Build Coastguard Worker src16[ii * stride + jj] = rnd_(limit);
307*77c1e3ccSAndroid Build Coastguard Worker ref16[ii * stride + jj] = rnd_(limit);
308*77c1e3ccSAndroid Build Coastguard Worker }
309*77c1e3ccSAndroid Build Coastguard Worker }
310*77c1e3ccSAndroid Build Coastguard Worker }
311*77c1e3ccSAndroid Build Coastguard Worker }
312*77c1e3ccSAndroid Build Coastguard Worker
GenExtremeData(int width,int height,int stride,uint8_t * data,int16_t val)313*77c1e3ccSAndroid Build Coastguard Worker void GenExtremeData(int width, int height, int stride, uint8_t *data,
314*77c1e3ccSAndroid Build Coastguard Worker int16_t val) {
315*77c1e3ccSAndroid Build Coastguard Worker uint16_t *data16 = reinterpret_cast<uint16_t *>(data);
316*77c1e3ccSAndroid Build Coastguard Worker for (int ii = 0; ii < height; ii++) {
317*77c1e3ccSAndroid Build Coastguard Worker for (int jj = 0; jj < width; jj++) {
318*77c1e3ccSAndroid Build Coastguard Worker if (!is_hbd_) {
319*77c1e3ccSAndroid Build Coastguard Worker data[ii * stride + jj] = static_cast<uint8_t>(val);
320*77c1e3ccSAndroid Build Coastguard Worker } else {
321*77c1e3ccSAndroid Build Coastguard Worker data16[ii * stride + jj] = val;
322*77c1e3ccSAndroid Build Coastguard Worker }
323*77c1e3ccSAndroid Build Coastguard Worker }
324*77c1e3ccSAndroid Build Coastguard Worker }
325*77c1e3ccSAndroid Build Coastguard Worker }
326*77c1e3ccSAndroid Build Coastguard Worker
327*77c1e3ccSAndroid Build Coastguard Worker protected:
328*77c1e3ccSAndroid Build Coastguard Worker bool is_hbd_;
329*77c1e3ccSAndroid Build Coastguard Worker int width_;
330*77c1e3ccSAndroid Build Coastguard Worker TestSSEFuncs params_;
331*77c1e3ccSAndroid Build Coastguard Worker uint8_t *src_;
332*77c1e3ccSAndroid Build Coastguard Worker uint8_t *ref_;
333*77c1e3ccSAndroid Build Coastguard Worker ACMRandom rnd_;
334*77c1e3ccSAndroid Build Coastguard Worker };
335*77c1e3ccSAndroid Build Coastguard Worker GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(SSETest);
336*77c1e3ccSAndroid Build Coastguard Worker
RunTest(bool is_random,int width,int height,int run_times)337*77c1e3ccSAndroid Build Coastguard Worker void SSETest::RunTest(bool is_random, int width, int height, int run_times) {
338*77c1e3ccSAndroid Build Coastguard Worker int failed = 0;
339*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer ref_timer, test_timer;
340*77c1e3ccSAndroid Build Coastguard Worker for (int k = 0; k < 3; k++) {
341*77c1e3ccSAndroid Build Coastguard Worker int stride = 4 << rnd_(7); // Up to 256 stride
342*77c1e3ccSAndroid Build Coastguard Worker while (stride < width) { // Make sure it's valid
343*77c1e3ccSAndroid Build Coastguard Worker stride = 4 << rnd_(7);
344*77c1e3ccSAndroid Build Coastguard Worker }
345*77c1e3ccSAndroid Build Coastguard Worker if (is_random) {
346*77c1e3ccSAndroid Build Coastguard Worker GenRandomData(width, height, stride);
347*77c1e3ccSAndroid Build Coastguard Worker } else {
348*77c1e3ccSAndroid Build Coastguard Worker const int msb = is_hbd_ ? 12 : 8; // Up to 12 bit input
349*77c1e3ccSAndroid Build Coastguard Worker const int limit = (1 << msb) - 1;
350*77c1e3ccSAndroid Build Coastguard Worker if (k == 0) {
351*77c1e3ccSAndroid Build Coastguard Worker GenExtremeData(width, height, stride, src_, 0);
352*77c1e3ccSAndroid Build Coastguard Worker GenExtremeData(width, height, stride, ref_, limit);
353*77c1e3ccSAndroid Build Coastguard Worker } else {
354*77c1e3ccSAndroid Build Coastguard Worker GenExtremeData(width, height, stride, src_, limit);
355*77c1e3ccSAndroid Build Coastguard Worker GenExtremeData(width, height, stride, ref_, 0);
356*77c1e3ccSAndroid Build Coastguard Worker }
357*77c1e3ccSAndroid Build Coastguard Worker }
358*77c1e3ccSAndroid Build Coastguard Worker int64_t res_ref, res_tst;
359*77c1e3ccSAndroid Build Coastguard Worker uint8_t *src = src_;
360*77c1e3ccSAndroid Build Coastguard Worker uint8_t *ref = ref_;
361*77c1e3ccSAndroid Build Coastguard Worker if (is_hbd_) {
362*77c1e3ccSAndroid Build Coastguard Worker src = CONVERT_TO_BYTEPTR(src_);
363*77c1e3ccSAndroid Build Coastguard Worker ref = CONVERT_TO_BYTEPTR(ref_);
364*77c1e3ccSAndroid Build Coastguard Worker }
365*77c1e3ccSAndroid Build Coastguard Worker res_ref = params_.ref_func(src, stride, ref, stride, width, height);
366*77c1e3ccSAndroid Build Coastguard Worker res_tst = params_.tst_func(src, stride, ref, stride, width, height);
367*77c1e3ccSAndroid Build Coastguard Worker if (run_times > 1) {
368*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_start(&ref_timer);
369*77c1e3ccSAndroid Build Coastguard Worker for (int j = 0; j < run_times; j++) {
370*77c1e3ccSAndroid Build Coastguard Worker params_.ref_func(src, stride, ref, stride, width, height);
371*77c1e3ccSAndroid Build Coastguard Worker }
372*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_mark(&ref_timer);
373*77c1e3ccSAndroid Build Coastguard Worker const int elapsed_time_c =
374*77c1e3ccSAndroid Build Coastguard Worker static_cast<int>(aom_usec_timer_elapsed(&ref_timer));
375*77c1e3ccSAndroid Build Coastguard Worker
376*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_start(&test_timer);
377*77c1e3ccSAndroid Build Coastguard Worker for (int j = 0; j < run_times; j++) {
378*77c1e3ccSAndroid Build Coastguard Worker params_.tst_func(src, stride, ref, stride, width, height);
379*77c1e3ccSAndroid Build Coastguard Worker }
380*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_mark(&test_timer);
381*77c1e3ccSAndroid Build Coastguard Worker const int elapsed_time_simd =
382*77c1e3ccSAndroid Build Coastguard Worker static_cast<int>(aom_usec_timer_elapsed(&test_timer));
383*77c1e3ccSAndroid Build Coastguard Worker
384*77c1e3ccSAndroid Build Coastguard Worker printf(
385*77c1e3ccSAndroid Build Coastguard Worker "c_time=%d \t simd_time=%d \t "
386*77c1e3ccSAndroid Build Coastguard Worker "gain=%d\n",
387*77c1e3ccSAndroid Build Coastguard Worker elapsed_time_c, elapsed_time_simd,
388*77c1e3ccSAndroid Build Coastguard Worker (elapsed_time_c / elapsed_time_simd));
389*77c1e3ccSAndroid Build Coastguard Worker } else {
390*77c1e3ccSAndroid Build Coastguard Worker if (!failed) {
391*77c1e3ccSAndroid Build Coastguard Worker failed = res_ref != res_tst;
392*77c1e3ccSAndroid Build Coastguard Worker EXPECT_EQ(res_ref, res_tst)
393*77c1e3ccSAndroid Build Coastguard Worker << "Error:" << (is_hbd_ ? "hbd " : " ") << k << " SSE Test ["
394*77c1e3ccSAndroid Build Coastguard Worker << width << "x" << height
395*77c1e3ccSAndroid Build Coastguard Worker << "] C output does not match optimized output.";
396*77c1e3ccSAndroid Build Coastguard Worker }
397*77c1e3ccSAndroid Build Coastguard Worker }
398*77c1e3ccSAndroid Build Coastguard Worker }
399*77c1e3ccSAndroid Build Coastguard Worker }
400*77c1e3ccSAndroid Build Coastguard Worker
// Random data (GenRandomData) at every height from 4 to 128 in steps of 4.
TEST_P(SSETest, OperationCheck) {
  for (int h = 4; h <= 128; h += 4) {
    RunTest(/*is_random=*/true, width_, h, /*run_times=*/1);
  }
}

// Zero-versus-maximum data at every height from 4 to 128 in steps of 4.
TEST_P(SSETest, ExtremeValues) {
  for (int h = 4; h <= 128; h += 4) {
    RunTest(/*is_random=*/false, width_, h, /*run_times=*/1);
  }
}

// Benchmark over the same heights, 100 calls per measurement; disabled by
// default.
TEST_P(SSETest, DISABLED_Speed) {
  for (int h = 4; h <= 128; h += 4) {
    RunTest(/*is_random=*/true, width_, h, /*run_times=*/100);
  }
}
418*77c1e3ccSAndroid Build Coastguard Worker
// Each enabled instruction set lists its function pairs (the high-bitdepth
// pair only when CONFIG_AV1_HIGHBITDEPTH is set) and combines them with every
// width from 4 to 128 in steps of 4.
#if HAVE_NEON
const TestSSEFuncs sse_neon[] = {
  TestSSEFuncs(&aom_sse_c, &aom_sse_neon),
#if CONFIG_AV1_HIGHBITDEPTH
  TestSSEFuncs(&aom_highbd_sse_c, &aom_highbd_sse_neon),
#endif
};
INSTANTIATE_TEST_SUITE_P(NEON, SSETest,
                         Combine(ValuesIn(sse_neon), Range(4, 129, 4)));
#endif  // HAVE_NEON

#if HAVE_NEON_DOTPROD
const TestSSEFuncs sse_neon_dotprod[] = {
  TestSSEFuncs(&aom_sse_c, &aom_sse_neon_dotprod),
};
INSTANTIATE_TEST_SUITE_P(NEON_DOTPROD, SSETest,
                         Combine(ValuesIn(sse_neon_dotprod), Range(4, 129, 4)));
#endif  // HAVE_NEON_DOTPROD

#if HAVE_SSE4_1
const TestSSEFuncs sse_sse4[] = {
  TestSSEFuncs(&aom_sse_c, &aom_sse_sse4_1),
#if CONFIG_AV1_HIGHBITDEPTH
  TestSSEFuncs(&aom_highbd_sse_c, &aom_highbd_sse_sse4_1),
#endif
};
INSTANTIATE_TEST_SUITE_P(SSE4_1, SSETest,
                         Combine(ValuesIn(sse_sse4), Range(4, 129, 4)));
#endif  // HAVE_SSE4_1

#if HAVE_AVX2
const TestSSEFuncs sse_avx2[] = {
  TestSSEFuncs(&aom_sse_c, &aom_sse_avx2),
#if CONFIG_AV1_HIGHBITDEPTH
  TestSSEFuncs(&aom_highbd_sse_c, &aom_highbd_sse_avx2),
#endif
};
INSTANTIATE_TEST_SUITE_P(AVX2, SSETest,
                         Combine(ValuesIn(sse_avx2), Range(4, 129, 4)));
#endif  // HAVE_AVX2
460*77c1e3ccSAndroid Build Coastguard Worker
461*77c1e3ccSAndroid Build Coastguard Worker #if HAVE_SVE
462*77c1e3ccSAndroid Build Coastguard Worker #if CONFIG_AV1_HIGHBITDEPTH
463*77c1e3ccSAndroid Build Coastguard Worker TestSSEFuncs sse_sve[] = { TestSSEFuncs(&aom_highbd_sse_c,
464*77c1e3ccSAndroid Build Coastguard Worker &aom_highbd_sse_sve) };
465*77c1e3ccSAndroid Build Coastguard Worker INSTANTIATE_TEST_SUITE_P(SVE, SSETest,
466*77c1e3ccSAndroid Build Coastguard Worker Combine(ValuesIn(sse_sve), Range(4, 129, 4)));
467*77c1e3ccSAndroid Build Coastguard Worker #endif
468*77c1e3ccSAndroid Build Coastguard Worker #endif // HAVE_SVE
469*77c1e3ccSAndroid Build Coastguard Worker
470*77c1e3ccSAndroid Build Coastguard Worker //////////////////////////////////////////////////////////////////////////////
471*77c1e3ccSAndroid Build Coastguard Worker // get_blk sum squares test functions
472*77c1e3ccSAndroid Build Coastguard Worker //////////////////////////////////////////////////////////////////////////////
473*77c1e3ccSAndroid Build Coastguard Worker
474*77c1e3ccSAndroid Build Coastguard Worker typedef void (*sse_sum_func)(const int16_t *data, int stride, int bw, int bh,
475*77c1e3ccSAndroid Build Coastguard Worker int *x_sum, int64_t *x2_sum);
476*77c1e3ccSAndroid Build Coastguard Worker typedef libaom_test::FuncParam<sse_sum_func> TestSSE_SumFuncs;
477*77c1e3ccSAndroid Build Coastguard Worker
478*77c1e3ccSAndroid Build Coastguard Worker typedef std::tuple<TestSSE_SumFuncs, TX_SIZE> SSE_SumTestParam;
479*77c1e3ccSAndroid Build Coastguard Worker
480*77c1e3ccSAndroid Build Coastguard Worker class SSE_Sum_Test : public ::testing::TestWithParam<SSE_SumTestParam> {
481*77c1e3ccSAndroid Build Coastguard Worker public:
482*77c1e3ccSAndroid Build Coastguard Worker ~SSE_Sum_Test() override = default;
SetUp()483*77c1e3ccSAndroid Build Coastguard Worker void SetUp() override {
484*77c1e3ccSAndroid Build Coastguard Worker params_ = GET_PARAM(0);
485*77c1e3ccSAndroid Build Coastguard Worker rnd_.Reset(ACMRandom::DeterministicSeed());
486*77c1e3ccSAndroid Build Coastguard Worker src_ = reinterpret_cast<int16_t *>(aom_memalign(32, 256 * 256 * 2));
487*77c1e3ccSAndroid Build Coastguard Worker ASSERT_NE(src_, nullptr);
488*77c1e3ccSAndroid Build Coastguard Worker }
489*77c1e3ccSAndroid Build Coastguard Worker
TearDown()490*77c1e3ccSAndroid Build Coastguard Worker void TearDown() override { aom_free(src_); }
491*77c1e3ccSAndroid Build Coastguard Worker void RunTest(bool is_random, int tx_size, int run_times);
492*77c1e3ccSAndroid Build Coastguard Worker
GenRandomData(int width,int height,int stride)493*77c1e3ccSAndroid Build Coastguard Worker void GenRandomData(int width, int height, int stride) {
494*77c1e3ccSAndroid Build Coastguard Worker const int msb = 11; // Up to 12 bit input
495*77c1e3ccSAndroid Build Coastguard Worker const int limit = 1 << (msb + 1);
496*77c1e3ccSAndroid Build Coastguard Worker for (int ii = 0; ii < height; ii++) {
497*77c1e3ccSAndroid Build Coastguard Worker for (int jj = 0; jj < width; jj++) {
498*77c1e3ccSAndroid Build Coastguard Worker src_[ii * stride + jj] = rnd_(limit);
499*77c1e3ccSAndroid Build Coastguard Worker }
500*77c1e3ccSAndroid Build Coastguard Worker }
501*77c1e3ccSAndroid Build Coastguard Worker }
502*77c1e3ccSAndroid Build Coastguard Worker
GenExtremeData(int width,int height,int stride,int16_t * data,int16_t val)503*77c1e3ccSAndroid Build Coastguard Worker void GenExtremeData(int width, int height, int stride, int16_t *data,
504*77c1e3ccSAndroid Build Coastguard Worker int16_t val) {
505*77c1e3ccSAndroid Build Coastguard Worker for (int ii = 0; ii < height; ii++) {
506*77c1e3ccSAndroid Build Coastguard Worker for (int jj = 0; jj < width; jj++) {
507*77c1e3ccSAndroid Build Coastguard Worker data[ii * stride + jj] = val;
508*77c1e3ccSAndroid Build Coastguard Worker }
509*77c1e3ccSAndroid Build Coastguard Worker }
510*77c1e3ccSAndroid Build Coastguard Worker }
511*77c1e3ccSAndroid Build Coastguard Worker
512*77c1e3ccSAndroid Build Coastguard Worker protected:
513*77c1e3ccSAndroid Build Coastguard Worker TestSSE_SumFuncs params_;
514*77c1e3ccSAndroid Build Coastguard Worker int16_t *src_;
515*77c1e3ccSAndroid Build Coastguard Worker ACMRandom rnd_;
516*77c1e3ccSAndroid Build Coastguard Worker };
517*77c1e3ccSAndroid Build Coastguard Worker GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(SSE_Sum_Test);
518*77c1e3ccSAndroid Build Coastguard Worker
RunTest(bool is_random,int tx_size,int run_times)519*77c1e3ccSAndroid Build Coastguard Worker void SSE_Sum_Test::RunTest(bool is_random, int tx_size, int run_times) {
520*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer ref_timer, test_timer;
521*77c1e3ccSAndroid Build Coastguard Worker int width = tx_size_wide[tx_size];
522*77c1e3ccSAndroid Build Coastguard Worker int height = tx_size_high[tx_size];
523*77c1e3ccSAndroid Build Coastguard Worker for (int k = 0; k < 3; k++) {
524*77c1e3ccSAndroid Build Coastguard Worker int stride = 4 << rnd_(7); // Up to 256 stride
525*77c1e3ccSAndroid Build Coastguard Worker while (stride < width) { // Make sure it's valid
526*77c1e3ccSAndroid Build Coastguard Worker stride = 4 << rnd_(7);
527*77c1e3ccSAndroid Build Coastguard Worker }
528*77c1e3ccSAndroid Build Coastguard Worker if (is_random) {
529*77c1e3ccSAndroid Build Coastguard Worker GenRandomData(width, height, stride);
530*77c1e3ccSAndroid Build Coastguard Worker } else {
531*77c1e3ccSAndroid Build Coastguard Worker const int msb = 12; // Up to 12 bit input
532*77c1e3ccSAndroid Build Coastguard Worker const int limit = (1 << msb) - 1;
533*77c1e3ccSAndroid Build Coastguard Worker if (k == 0) {
534*77c1e3ccSAndroid Build Coastguard Worker GenExtremeData(width, height, stride, src_, limit);
535*77c1e3ccSAndroid Build Coastguard Worker } else {
536*77c1e3ccSAndroid Build Coastguard Worker GenExtremeData(width, height, stride, src_, -limit);
537*77c1e3ccSAndroid Build Coastguard Worker }
538*77c1e3ccSAndroid Build Coastguard Worker }
539*77c1e3ccSAndroid Build Coastguard Worker int sum_c = 0;
540*77c1e3ccSAndroid Build Coastguard Worker int64_t sse_intr = 0;
541*77c1e3ccSAndroid Build Coastguard Worker int sum_intr = 0;
542*77c1e3ccSAndroid Build Coastguard Worker int64_t sse_c = 0;
543*77c1e3ccSAndroid Build Coastguard Worker
544*77c1e3ccSAndroid Build Coastguard Worker params_.ref_func(src_, stride, width, height, &sum_c, &sse_c);
545*77c1e3ccSAndroid Build Coastguard Worker params_.tst_func(src_, stride, width, height, &sum_intr, &sse_intr);
546*77c1e3ccSAndroid Build Coastguard Worker
547*77c1e3ccSAndroid Build Coastguard Worker if (run_times > 1) {
548*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_start(&ref_timer);
549*77c1e3ccSAndroid Build Coastguard Worker for (int j = 0; j < run_times; j++) {
550*77c1e3ccSAndroid Build Coastguard Worker params_.ref_func(src_, stride, width, height, &sum_c, &sse_c);
551*77c1e3ccSAndroid Build Coastguard Worker }
552*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_mark(&ref_timer);
553*77c1e3ccSAndroid Build Coastguard Worker const int elapsed_time_c =
554*77c1e3ccSAndroid Build Coastguard Worker static_cast<int>(aom_usec_timer_elapsed(&ref_timer));
555*77c1e3ccSAndroid Build Coastguard Worker
556*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_start(&test_timer);
557*77c1e3ccSAndroid Build Coastguard Worker for (int j = 0; j < run_times; j++) {
558*77c1e3ccSAndroid Build Coastguard Worker params_.tst_func(src_, stride, width, height, &sum_intr, &sse_intr);
559*77c1e3ccSAndroid Build Coastguard Worker }
560*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_mark(&test_timer);
561*77c1e3ccSAndroid Build Coastguard Worker const int elapsed_time_simd =
562*77c1e3ccSAndroid Build Coastguard Worker static_cast<int>(aom_usec_timer_elapsed(&test_timer));
563*77c1e3ccSAndroid Build Coastguard Worker
564*77c1e3ccSAndroid Build Coastguard Worker printf(
565*77c1e3ccSAndroid Build Coastguard Worker "c_time=%d \t simd_time=%d \t "
566*77c1e3ccSAndroid Build Coastguard Worker "gain=%f\t width=%d\t height=%d \n",
567*77c1e3ccSAndroid Build Coastguard Worker elapsed_time_c, elapsed_time_simd,
568*77c1e3ccSAndroid Build Coastguard Worker (float)((float)elapsed_time_c / (float)elapsed_time_simd), width,
569*77c1e3ccSAndroid Build Coastguard Worker height);
570*77c1e3ccSAndroid Build Coastguard Worker
571*77c1e3ccSAndroid Build Coastguard Worker } else {
572*77c1e3ccSAndroid Build Coastguard Worker EXPECT_EQ(sum_c, sum_intr)
573*77c1e3ccSAndroid Build Coastguard Worker << "Error:" << k << " SSE Sum Test [" << width << "x" << height
574*77c1e3ccSAndroid Build Coastguard Worker << "] C output does not match optimized output.";
575*77c1e3ccSAndroid Build Coastguard Worker EXPECT_EQ(sse_c, sse_intr)
576*77c1e3ccSAndroid Build Coastguard Worker << "Error:" << k << " SSE Sum Test [" << width << "x" << height
577*77c1e3ccSAndroid Build Coastguard Worker << "] C output does not match optimized output.";
578*77c1e3ccSAndroid Build Coastguard Worker }
579*77c1e3ccSAndroid Build Coastguard Worker }
580*77c1e3ccSAndroid Build Coastguard Worker }
581*77c1e3ccSAndroid Build Coastguard Worker
// Single checked pass on data from GenRandomData().
TEST_P(SSE_Sum_Test, OperationCheck) {
  const int tx_size = GET_PARAM(1);
  RunTest(/*is_random=*/true, tx_size, /*run_times=*/1);
}

// Single checked pass on constant extreme-valued blocks.
TEST_P(SSE_Sum_Test, ExtremeValues) {
  const int tx_size = GET_PARAM(1);
  RunTest(/*is_random=*/false, tx_size, /*run_times=*/1);
}

// Disabled by default: times 10000 calls of each function on random data.
TEST_P(SSE_Sum_Test, DISABLED_Speed) {
  const int tx_size = GET_PARAM(1);
  RunTest(/*is_random=*/true, tx_size, /*run_times=*/10000);
}
589*77c1e3ccSAndroid Build Coastguard Worker
// Transform sizes exercised by every SSE_Sum_Test instantiation. The guard
// lists each configuration that instantiates the suite (including SVE) so the
// array is always defined where it is used and never left unused.
#if HAVE_SSE2 || HAVE_AVX2 || HAVE_NEON || HAVE_SVE
const TX_SIZE kValidBlockSize[] = { TX_4X4,   TX_8X8,   TX_16X16, TX_32X32,
                                    TX_64X64, TX_4X8,   TX_8X4,   TX_8X16,
                                    TX_16X8,  TX_16X32, TX_32X16, TX_64X32,
                                    TX_32X64, TX_4X16,  TX_16X4,  TX_8X32,
                                    TX_32X8,  TX_16X64, TX_64X16 };
#endif  // HAVE_SSE2 || HAVE_AVX2 || HAVE_NEON || HAVE_SVE
597*77c1e3ccSAndroid Build Coastguard Worker
// SSE_Sum_Test instantiations: each enabled SIMD kernel is paired with
// aom_get_blk_sse_sum_c and run over every entry of kValidBlockSize.

#if HAVE_SSE2
TestSSE_SumFuncs sse_sum_sse2[] = {
  TestSSE_SumFuncs(&aom_get_blk_sse_sum_c, &aom_get_blk_sse_sum_sse2),
};
INSTANTIATE_TEST_SUITE_P(SSE2, SSE_Sum_Test,
                         Combine(ValuesIn(sse_sum_sse2),
                                 ValuesIn(kValidBlockSize)));
#endif  // HAVE_SSE2

#if HAVE_AVX2
TestSSE_SumFuncs sse_sum_avx2[] = {
  TestSSE_SumFuncs(&aom_get_blk_sse_sum_c, &aom_get_blk_sse_sum_avx2),
};
INSTANTIATE_TEST_SUITE_P(AVX2, SSE_Sum_Test,
                         Combine(ValuesIn(sse_sum_avx2),
                                 ValuesIn(kValidBlockSize)));
#endif  // HAVE_AVX2

#if HAVE_NEON
TestSSE_SumFuncs sse_sum_neon[] = {
  TestSSE_SumFuncs(&aom_get_blk_sse_sum_c, &aom_get_blk_sse_sum_neon),
};
INSTANTIATE_TEST_SUITE_P(NEON, SSE_Sum_Test,
                         Combine(ValuesIn(sse_sum_neon),
                                 ValuesIn(kValidBlockSize)));
#endif  // HAVE_NEON

#if HAVE_SVE
TestSSE_SumFuncs sse_sum_sve[] = {
  TestSSE_SumFuncs(&aom_get_blk_sse_sum_c, &aom_get_blk_sse_sum_sve),
};
INSTANTIATE_TEST_SUITE_P(SVE, SSE_Sum_Test,
                         Combine(ValuesIn(sse_sum_sve),
                                 ValuesIn(kValidBlockSize)));
#endif  // HAVE_SVE
629*77c1e3ccSAndroid Build Coastguard Worker
630*77c1e3ccSAndroid Build Coastguard Worker //////////////////////////////////////////////////////////////////////////////
631*77c1e3ccSAndroid Build Coastguard Worker // 2D Variance test functions
632*77c1e3ccSAndroid Build Coastguard Worker //////////////////////////////////////////////////////////////////////////////
633*77c1e3ccSAndroid Build Coastguard Worker
634*77c1e3ccSAndroid Build Coastguard Worker typedef uint64_t (*Var2DFunc)(uint8_t *src, int stride, int width, int height);
635*77c1e3ccSAndroid Build Coastguard Worker typedef libaom_test::FuncParam<Var2DFunc> TestFuncVar2D;
636*77c1e3ccSAndroid Build Coastguard Worker
637*77c1e3ccSAndroid Build Coastguard Worker const uint16_t test_block_size[2] = { 128, 256 };
638*77c1e3ccSAndroid Build Coastguard Worker
639*77c1e3ccSAndroid Build Coastguard Worker class Lowbd2dVarTest : public ::testing::TestWithParam<TestFuncVar2D> {
640*77c1e3ccSAndroid Build Coastguard Worker public:
641*77c1e3ccSAndroid Build Coastguard Worker ~Lowbd2dVarTest() override = default;
SetUp()642*77c1e3ccSAndroid Build Coastguard Worker void SetUp() override {
643*77c1e3ccSAndroid Build Coastguard Worker params_ = this->GetParam();
644*77c1e3ccSAndroid Build Coastguard Worker rnd_.Reset(ACMRandom::DeterministicSeed());
645*77c1e3ccSAndroid Build Coastguard Worker src_ = reinterpret_cast<uint8_t *>(
646*77c1e3ccSAndroid Build Coastguard Worker aom_memalign(16, 512 * 512 * sizeof(uint8_t)));
647*77c1e3ccSAndroid Build Coastguard Worker ASSERT_NE(src_, nullptr);
648*77c1e3ccSAndroid Build Coastguard Worker }
649*77c1e3ccSAndroid Build Coastguard Worker
TearDown()650*77c1e3ccSAndroid Build Coastguard Worker void TearDown() override { aom_free(src_); }
651*77c1e3ccSAndroid Build Coastguard Worker void RunTest(bool is_random);
652*77c1e3ccSAndroid Build Coastguard Worker void RunSpeedTest();
653*77c1e3ccSAndroid Build Coastguard Worker
GenRandomData(int width,int height,int stride)654*77c1e3ccSAndroid Build Coastguard Worker void GenRandomData(int width, int height, int stride) {
655*77c1e3ccSAndroid Build Coastguard Worker const int msb = 7; // Up to 8 bit input
656*77c1e3ccSAndroid Build Coastguard Worker const int limit = 1 << (msb + 1);
657*77c1e3ccSAndroid Build Coastguard Worker for (int ii = 0; ii < height; ii++) {
658*77c1e3ccSAndroid Build Coastguard Worker for (int jj = 0; jj < width; jj++) {
659*77c1e3ccSAndroid Build Coastguard Worker src_[ii * stride + jj] = rnd_(limit);
660*77c1e3ccSAndroid Build Coastguard Worker }
661*77c1e3ccSAndroid Build Coastguard Worker }
662*77c1e3ccSAndroid Build Coastguard Worker }
663*77c1e3ccSAndroid Build Coastguard Worker
GenExtremeData(int width,int height,int stride)664*77c1e3ccSAndroid Build Coastguard Worker void GenExtremeData(int width, int height, int stride) {
665*77c1e3ccSAndroid Build Coastguard Worker const int msb = 7; // Up to 8 bit input
666*77c1e3ccSAndroid Build Coastguard Worker const int limit = 1 << (msb + 1);
667*77c1e3ccSAndroid Build Coastguard Worker const int val = rnd_(2) ? limit - 1 : 0;
668*77c1e3ccSAndroid Build Coastguard Worker for (int ii = 0; ii < height; ii++) {
669*77c1e3ccSAndroid Build Coastguard Worker for (int jj = 0; jj < width; jj++) {
670*77c1e3ccSAndroid Build Coastguard Worker src_[ii * stride + jj] = val;
671*77c1e3ccSAndroid Build Coastguard Worker }
672*77c1e3ccSAndroid Build Coastguard Worker }
673*77c1e3ccSAndroid Build Coastguard Worker }
674*77c1e3ccSAndroid Build Coastguard Worker
675*77c1e3ccSAndroid Build Coastguard Worker protected:
676*77c1e3ccSAndroid Build Coastguard Worker TestFuncVar2D params_;
677*77c1e3ccSAndroid Build Coastguard Worker uint8_t *src_;
678*77c1e3ccSAndroid Build Coastguard Worker ACMRandom rnd_;
679*77c1e3ccSAndroid Build Coastguard Worker };
680*77c1e3ccSAndroid Build Coastguard Worker GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(Lowbd2dVarTest);
681*77c1e3ccSAndroid Build Coastguard Worker
RunTest(bool is_random)682*77c1e3ccSAndroid Build Coastguard Worker void Lowbd2dVarTest::RunTest(bool is_random) {
683*77c1e3ccSAndroid Build Coastguard Worker int failed = 0;
684*77c1e3ccSAndroid Build Coastguard Worker for (int k = 0; k < kNumIterations; k++) {
685*77c1e3ccSAndroid Build Coastguard Worker const int width = 4 * (rnd_(63) + 1); // Up to 256x256
686*77c1e3ccSAndroid Build Coastguard Worker const int height = 4 * (rnd_(63) + 1); // Up to 256x256
687*77c1e3ccSAndroid Build Coastguard Worker int stride = 4 << rnd_(8); // Up to 512 stride
688*77c1e3ccSAndroid Build Coastguard Worker while (stride < width) { // Make sure it's valid
689*77c1e3ccSAndroid Build Coastguard Worker stride = 4 << rnd_(8);
690*77c1e3ccSAndroid Build Coastguard Worker }
691*77c1e3ccSAndroid Build Coastguard Worker if (is_random) {
692*77c1e3ccSAndroid Build Coastguard Worker GenRandomData(width, height, stride);
693*77c1e3ccSAndroid Build Coastguard Worker } else {
694*77c1e3ccSAndroid Build Coastguard Worker GenExtremeData(width, height, stride);
695*77c1e3ccSAndroid Build Coastguard Worker }
696*77c1e3ccSAndroid Build Coastguard Worker
697*77c1e3ccSAndroid Build Coastguard Worker const uint64_t res_ref = params_.ref_func(src_, stride, width, height);
698*77c1e3ccSAndroid Build Coastguard Worker uint64_t res_tst;
699*77c1e3ccSAndroid Build Coastguard Worker API_REGISTER_STATE_CHECK(res_tst =
700*77c1e3ccSAndroid Build Coastguard Worker params_.tst_func(src_, stride, width, height));
701*77c1e3ccSAndroid Build Coastguard Worker
702*77c1e3ccSAndroid Build Coastguard Worker if (!failed) {
703*77c1e3ccSAndroid Build Coastguard Worker failed = res_ref != res_tst;
704*77c1e3ccSAndroid Build Coastguard Worker EXPECT_EQ(res_ref, res_tst)
705*77c1e3ccSAndroid Build Coastguard Worker << "Error: Sum Squares Test [" << width << "x" << height
706*77c1e3ccSAndroid Build Coastguard Worker << "] C output does not match optimized output.";
707*77c1e3ccSAndroid Build Coastguard Worker }
708*77c1e3ccSAndroid Build Coastguard Worker }
709*77c1e3ccSAndroid Build Coastguard Worker }
710*77c1e3ccSAndroid Build Coastguard Worker
RunSpeedTest()711*77c1e3ccSAndroid Build Coastguard Worker void Lowbd2dVarTest::RunSpeedTest() {
712*77c1e3ccSAndroid Build Coastguard Worker for (int block = 0; block < 2; block++) {
713*77c1e3ccSAndroid Build Coastguard Worker const int width = test_block_size[block];
714*77c1e3ccSAndroid Build Coastguard Worker const int height = test_block_size[block];
715*77c1e3ccSAndroid Build Coastguard Worker int stride = 4 << rnd_(8); // Up to 512 stride
716*77c1e3ccSAndroid Build Coastguard Worker while (stride < width) { // Make sure it's valid
717*77c1e3ccSAndroid Build Coastguard Worker stride = 4 << rnd_(8);
718*77c1e3ccSAndroid Build Coastguard Worker }
719*77c1e3ccSAndroid Build Coastguard Worker GenExtremeData(width, height, stride);
720*77c1e3ccSAndroid Build Coastguard Worker const int num_loops = 1000000000 / (width + height);
721*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer timer;
722*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_start(&timer);
723*77c1e3ccSAndroid Build Coastguard Worker
724*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < num_loops; ++i)
725*77c1e3ccSAndroid Build Coastguard Worker params_.ref_func(src_, stride, width, height);
726*77c1e3ccSAndroid Build Coastguard Worker
727*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_mark(&timer);
728*77c1e3ccSAndroid Build Coastguard Worker const int elapsed_time = static_cast<int>(aom_usec_timer_elapsed(&timer));
729*77c1e3ccSAndroid Build Coastguard Worker
730*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer timer1;
731*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_start(&timer1);
732*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < num_loops; ++i)
733*77c1e3ccSAndroid Build Coastguard Worker params_.tst_func(src_, stride, width, height);
734*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_mark(&timer1);
735*77c1e3ccSAndroid Build Coastguard Worker const int elapsed_time1 = static_cast<int>(aom_usec_timer_elapsed(&timer1));
736*77c1e3ccSAndroid Build Coastguard Worker printf("%3dx%-3d: Scaling = %.2f\n", width, height,
737*77c1e3ccSAndroid Build Coastguard Worker (double)elapsed_time / elapsed_time1);
738*77c1e3ccSAndroid Build Coastguard Worker }
739*77c1e3ccSAndroid Build Coastguard Worker }
740*77c1e3ccSAndroid Build Coastguard Worker
// Blocks filled by GenRandomData().
TEST_P(Lowbd2dVarTest, OperationCheck) { RunTest(/*is_random=*/true); }

// Blocks filled by GenExtremeData().
TEST_P(Lowbd2dVarTest, ExtremeValues) { RunTest(/*is_random=*/false); }

// Disabled by default: prints timing ratios instead of checking results.
TEST_P(Lowbd2dVarTest, DISABLED_Speed) {
  RunSpeedTest();
}
750*77c1e3ccSAndroid Build Coastguard Worker
#if HAVE_SSE2
// SSE2 kernel checked against the C reference.
INSTANTIATE_TEST_SUITE_P(
    SSE2, Lowbd2dVarTest,
    ::testing::Values(TestFuncVar2D(&aom_var_2d_u8_c, &aom_var_2d_u8_sse2)));
#endif  // HAVE_SSE2
758*77c1e3ccSAndroid Build Coastguard Worker
#if HAVE_AVX2

// AVX2 kernel checked against the C reference.
INSTANTIATE_TEST_SUITE_P(AVX2, Lowbd2dVarTest,
                         ::testing::Values(TestFuncVar2D(&aom_var_2d_u8_c,
                                                         &aom_var_2d_u8_avx2)));

#endif  // HAVE_AVX2
766*77c1e3ccSAndroid Build Coastguard Worker
#if HAVE_NEON
// NEON kernel checked against the C reference.
INSTANTIATE_TEST_SUITE_P(
    NEON, Lowbd2dVarTest,
    ::testing::Values(TestFuncVar2D(&aom_var_2d_u8_c, &aom_var_2d_u8_neon)));
#endif  // HAVE_NEON

#if HAVE_NEON_DOTPROD
// NEON dot-product kernel checked against the C reference.
INSTANTIATE_TEST_SUITE_P(
    NEON_DOTPROD, Lowbd2dVarTest,
    ::testing::Values(TestFuncVar2D(&aom_var_2d_u8_c,
                                    &aom_var_2d_u8_neon_dotprod)));
#endif  // HAVE_NEON_DOTPROD
782*77c1e3ccSAndroid Build Coastguard Worker
783*77c1e3ccSAndroid Build Coastguard Worker #if CONFIG_AV1_HIGHBITDEPTH
784*77c1e3ccSAndroid Build Coastguard Worker class Highbd2dVarTest : public ::testing::TestWithParam<TestFuncVar2D> {
785*77c1e3ccSAndroid Build Coastguard Worker public:
786*77c1e3ccSAndroid Build Coastguard Worker ~Highbd2dVarTest() override = default;
SetUp()787*77c1e3ccSAndroid Build Coastguard Worker void SetUp() override {
788*77c1e3ccSAndroid Build Coastguard Worker params_ = this->GetParam();
789*77c1e3ccSAndroid Build Coastguard Worker rnd_.Reset(ACMRandom::DeterministicSeed());
790*77c1e3ccSAndroid Build Coastguard Worker src_ = reinterpret_cast<uint16_t *>(
791*77c1e3ccSAndroid Build Coastguard Worker aom_memalign(16, 512 * 512 * sizeof(uint16_t)));
792*77c1e3ccSAndroid Build Coastguard Worker ASSERT_NE(src_, nullptr);
793*77c1e3ccSAndroid Build Coastguard Worker }
794*77c1e3ccSAndroid Build Coastguard Worker
TearDown()795*77c1e3ccSAndroid Build Coastguard Worker void TearDown() override { aom_free(src_); }
796*77c1e3ccSAndroid Build Coastguard Worker void RunTest(bool is_random);
797*77c1e3ccSAndroid Build Coastguard Worker void RunSpeedTest();
798*77c1e3ccSAndroid Build Coastguard Worker
GenRandomData(int width,int height,int stride)799*77c1e3ccSAndroid Build Coastguard Worker void GenRandomData(int width, int height, int stride) {
800*77c1e3ccSAndroid Build Coastguard Worker const int msb = 11; // Up to 12 bit input
801*77c1e3ccSAndroid Build Coastguard Worker const int limit = 1 << (msb + 1);
802*77c1e3ccSAndroid Build Coastguard Worker for (int ii = 0; ii < height; ii++) {
803*77c1e3ccSAndroid Build Coastguard Worker for (int jj = 0; jj < width; jj++) {
804*77c1e3ccSAndroid Build Coastguard Worker src_[ii * stride + jj] = rnd_(limit);
805*77c1e3ccSAndroid Build Coastguard Worker }
806*77c1e3ccSAndroid Build Coastguard Worker }
807*77c1e3ccSAndroid Build Coastguard Worker }
808*77c1e3ccSAndroid Build Coastguard Worker
GenExtremeData(int width,int height,int stride)809*77c1e3ccSAndroid Build Coastguard Worker void GenExtremeData(int width, int height, int stride) {
810*77c1e3ccSAndroid Build Coastguard Worker const int msb = 11; // Up to 12 bit input
811*77c1e3ccSAndroid Build Coastguard Worker const int limit = 1 << (msb + 1);
812*77c1e3ccSAndroid Build Coastguard Worker const int val = rnd_(2) ? limit - 1 : 0;
813*77c1e3ccSAndroid Build Coastguard Worker for (int ii = 0; ii < height; ii++) {
814*77c1e3ccSAndroid Build Coastguard Worker for (int jj = 0; jj < width; jj++) {
815*77c1e3ccSAndroid Build Coastguard Worker src_[ii * stride + jj] = val;
816*77c1e3ccSAndroid Build Coastguard Worker }
817*77c1e3ccSAndroid Build Coastguard Worker }
818*77c1e3ccSAndroid Build Coastguard Worker }
819*77c1e3ccSAndroid Build Coastguard Worker
820*77c1e3ccSAndroid Build Coastguard Worker protected:
821*77c1e3ccSAndroid Build Coastguard Worker TestFuncVar2D params_;
822*77c1e3ccSAndroid Build Coastguard Worker uint16_t *src_;
823*77c1e3ccSAndroid Build Coastguard Worker ACMRandom rnd_;
824*77c1e3ccSAndroid Build Coastguard Worker };
825*77c1e3ccSAndroid Build Coastguard Worker GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(Highbd2dVarTest);
826*77c1e3ccSAndroid Build Coastguard Worker
RunTest(bool is_random)827*77c1e3ccSAndroid Build Coastguard Worker void Highbd2dVarTest::RunTest(bool is_random) {
828*77c1e3ccSAndroid Build Coastguard Worker int failed = 0;
829*77c1e3ccSAndroid Build Coastguard Worker for (int k = 0; k < kNumIterations; k++) {
830*77c1e3ccSAndroid Build Coastguard Worker const int width = 4 * (rnd_(63) + 1); // Up to 256x256
831*77c1e3ccSAndroid Build Coastguard Worker const int height = 4 * (rnd_(63) + 1); // Up to 256x256
832*77c1e3ccSAndroid Build Coastguard Worker int stride = 4 << rnd_(8); // Up to 512 stride
833*77c1e3ccSAndroid Build Coastguard Worker while (stride < width) { // Make sure it's valid
834*77c1e3ccSAndroid Build Coastguard Worker stride = 4 << rnd_(8);
835*77c1e3ccSAndroid Build Coastguard Worker }
836*77c1e3ccSAndroid Build Coastguard Worker if (is_random) {
837*77c1e3ccSAndroid Build Coastguard Worker GenRandomData(width, height, stride);
838*77c1e3ccSAndroid Build Coastguard Worker } else {
839*77c1e3ccSAndroid Build Coastguard Worker GenExtremeData(width, height, stride);
840*77c1e3ccSAndroid Build Coastguard Worker }
841*77c1e3ccSAndroid Build Coastguard Worker
842*77c1e3ccSAndroid Build Coastguard Worker const uint64_t res_ref =
843*77c1e3ccSAndroid Build Coastguard Worker params_.ref_func(CONVERT_TO_BYTEPTR(src_), stride, width, height);
844*77c1e3ccSAndroid Build Coastguard Worker uint64_t res_tst;
845*77c1e3ccSAndroid Build Coastguard Worker API_REGISTER_STATE_CHECK(
846*77c1e3ccSAndroid Build Coastguard Worker res_tst =
847*77c1e3ccSAndroid Build Coastguard Worker params_.tst_func(CONVERT_TO_BYTEPTR(src_), stride, width, height));
848*77c1e3ccSAndroid Build Coastguard Worker
849*77c1e3ccSAndroid Build Coastguard Worker if (!failed) {
850*77c1e3ccSAndroid Build Coastguard Worker failed = res_ref != res_tst;
851*77c1e3ccSAndroid Build Coastguard Worker EXPECT_EQ(res_ref, res_tst)
852*77c1e3ccSAndroid Build Coastguard Worker << "Error: Sum Squares Test [" << width << "x" << height
853*77c1e3ccSAndroid Build Coastguard Worker << "] C output does not match optimized output.";
854*77c1e3ccSAndroid Build Coastguard Worker }
855*77c1e3ccSAndroid Build Coastguard Worker }
856*77c1e3ccSAndroid Build Coastguard Worker }
857*77c1e3ccSAndroid Build Coastguard Worker
RunSpeedTest()858*77c1e3ccSAndroid Build Coastguard Worker void Highbd2dVarTest::RunSpeedTest() {
859*77c1e3ccSAndroid Build Coastguard Worker for (int block = 0; block < 2; block++) {
860*77c1e3ccSAndroid Build Coastguard Worker const int width = test_block_size[block];
861*77c1e3ccSAndroid Build Coastguard Worker const int height = test_block_size[block];
862*77c1e3ccSAndroid Build Coastguard Worker int stride = 4 << rnd_(8); // Up to 512 stride
863*77c1e3ccSAndroid Build Coastguard Worker while (stride < width) { // Make sure it's valid
864*77c1e3ccSAndroid Build Coastguard Worker stride = 4 << rnd_(8);
865*77c1e3ccSAndroid Build Coastguard Worker }
866*77c1e3ccSAndroid Build Coastguard Worker GenExtremeData(width, height, stride);
867*77c1e3ccSAndroid Build Coastguard Worker const int num_loops = 1000000000 / (width + height);
868*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer timer;
869*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_start(&timer);
870*77c1e3ccSAndroid Build Coastguard Worker
871*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < num_loops; ++i)
872*77c1e3ccSAndroid Build Coastguard Worker params_.ref_func(CONVERT_TO_BYTEPTR(src_), stride, width, height);
873*77c1e3ccSAndroid Build Coastguard Worker
874*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_mark(&timer);
875*77c1e3ccSAndroid Build Coastguard Worker const int elapsed_time = static_cast<int>(aom_usec_timer_elapsed(&timer));
876*77c1e3ccSAndroid Build Coastguard Worker
877*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer timer1;
878*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_start(&timer1);
879*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < num_loops; ++i)
880*77c1e3ccSAndroid Build Coastguard Worker params_.tst_func(CONVERT_TO_BYTEPTR(src_), stride, width, height);
881*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_mark(&timer1);
882*77c1e3ccSAndroid Build Coastguard Worker const int elapsed_time1 = static_cast<int>(aom_usec_timer_elapsed(&timer1));
883*77c1e3ccSAndroid Build Coastguard Worker printf("%3dx%-3d: Scaling = %.2f\n", width, height,
884*77c1e3ccSAndroid Build Coastguard Worker (double)elapsed_time / elapsed_time1);
885*77c1e3ccSAndroid Build Coastguard Worker }
886*77c1e3ccSAndroid Build Coastguard Worker }
887*77c1e3ccSAndroid Build Coastguard Worker
// Runs the reference-vs-optimized comparison with the random-data generator.
TEST_P(Highbd2dVarTest, OperationCheck) {
  const bool use_random_data = true;  // GenRandomData
  RunTest(use_random_data);
}
891*77c1e3ccSAndroid Build Coastguard Worker
// Runs the reference-vs-optimized comparison with the extreme-data generator.
TEST_P(Highbd2dVarTest, ExtremeValues) {
  const bool use_random_data = false;  // GenExtremeData
  RunTest(use_random_data);
}
895*77c1e3ccSAndroid Build Coastguard Worker
// Benchmark only. The DISABLED_ prefix keeps GoogleTest from running it unless
// --gtest_also_run_disabled_tests is passed.
TEST_P(Highbd2dVarTest, DISABLED_Speed) {
  RunSpeedTest();
}
897*77c1e3ccSAndroid Build Coastguard Worker
#if HAVE_SSE2
// Instantiates Highbd2dVarTest with the C and SSE2 versions of
// aom_var_2d_u16.
INSTANTIATE_TEST_SUITE_P(SSE2, Highbd2dVarTest,
                         ::testing::Values(TestFuncVar2D(
                             &aom_var_2d_u16_c, &aom_var_2d_u16_sse2)));
#endif  // HAVE_SSE2
905*77c1e3ccSAndroid Build Coastguard Worker
#if HAVE_AVX2

// Instantiates Highbd2dVarTest with the C and AVX2 versions of
// aom_var_2d_u16.
INSTANTIATE_TEST_SUITE_P(
    AVX2, Highbd2dVarTest,
    ::testing::Values(TestFuncVar2D(&aom_var_2d_u16_c, &aom_var_2d_u16_avx2)));

#endif  // HAVE_AVX2
913*77c1e3ccSAndroid Build Coastguard Worker
#if HAVE_NEON
// Instantiates Highbd2dVarTest with the C and NEON versions of
// aom_var_2d_u16.
INSTANTIATE_TEST_SUITE_P(NEON, Highbd2dVarTest,
                         ::testing::Values(TestFuncVar2D(
                             &aom_var_2d_u16_c, &aom_var_2d_u16_neon)));
#endif  // HAVE_NEON
921*77c1e3ccSAndroid Build Coastguard Worker
#if HAVE_SVE
// Instantiates Highbd2dVarTest with the C and SVE versions of
// aom_var_2d_u16.
INSTANTIATE_TEST_SUITE_P(
    SVE, Highbd2dVarTest,
    ::testing::Values(TestFuncVar2D(&aom_var_2d_u16_c, &aom_var_2d_u16_sve)));
#endif  // HAVE_SVE
929*77c1e3ccSAndroid Build Coastguard Worker #endif // CONFIG_AV1_HIGHBITDEPTH
930*77c1e3ccSAndroid Build Coastguard Worker } // namespace
931