xref: /aosp_15_r20/external/libaom/test/blend_a64_mask_test.cc (revision 77c1e3ccc04c968bd2bc212e87364f250e820521)
/*
 * Copyright (c) 2016, Alliance for Open Media. All rights reserved.
 *
 * This source code is subject to the terms of the BSD 2 Clause License and
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
 * was not distributed with this source code in the LICENSE file, you can
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
 * Media Patent License 1.0 was not distributed with this source code in the
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
 */
11*77c1e3ccSAndroid Build Coastguard Worker 
12*77c1e3ccSAndroid Build Coastguard Worker #include <math.h>
13*77c1e3ccSAndroid Build Coastguard Worker #include <stdlib.h>
14*77c1e3ccSAndroid Build Coastguard Worker #include <string.h>
15*77c1e3ccSAndroid Build Coastguard Worker 
16*77c1e3ccSAndroid Build Coastguard Worker #include "gtest/gtest.h"
17*77c1e3ccSAndroid Build Coastguard Worker #include "test/register_state_check.h"
18*77c1e3ccSAndroid Build Coastguard Worker #include "test/function_equivalence_test.h"
19*77c1e3ccSAndroid Build Coastguard Worker 
20*77c1e3ccSAndroid Build Coastguard Worker #include "config/aom_config.h"
21*77c1e3ccSAndroid Build Coastguard Worker #include "config/aom_dsp_rtcd.h"
22*77c1e3ccSAndroid Build Coastguard Worker #include "config/av1_rtcd.h"
23*77c1e3ccSAndroid Build Coastguard Worker 
24*77c1e3ccSAndroid Build Coastguard Worker #include "aom/aom_integer.h"
25*77c1e3ccSAndroid Build Coastguard Worker 
26*77c1e3ccSAndroid Build Coastguard Worker #include "av1/common/enums.h"
27*77c1e3ccSAndroid Build Coastguard Worker 
28*77c1e3ccSAndroid Build Coastguard Worker #include "aom_dsp/blend.h"
29*77c1e3ccSAndroid Build Coastguard Worker 
30*77c1e3ccSAndroid Build Coastguard Worker using libaom_test::FunctionEquivalenceTest;
31*77c1e3ccSAndroid Build Coastguard Worker 
32*77c1e3ccSAndroid Build Coastguard Worker namespace {
33*77c1e3ccSAndroid Build Coastguard Worker 
34*77c1e3ccSAndroid Build Coastguard Worker template <typename BlendA64Func, typename SrcPixel, typename DstPixel>
35*77c1e3ccSAndroid Build Coastguard Worker class BlendA64MaskTest : public FunctionEquivalenceTest<BlendA64Func> {
36*77c1e3ccSAndroid Build Coastguard Worker  protected:
37*77c1e3ccSAndroid Build Coastguard Worker   static const int kIterations = 10000;
38*77c1e3ccSAndroid Build Coastguard Worker   static const int kMaxWidth = MAX_SB_SIZE * 5;  // * 5 to cover longer strides
39*77c1e3ccSAndroid Build Coastguard Worker   static const int kMaxHeight = MAX_SB_SIZE;
40*77c1e3ccSAndroid Build Coastguard Worker   static const int kBufSize = kMaxWidth * kMaxHeight;
41*77c1e3ccSAndroid Build Coastguard Worker   static const int kMaxMaskWidth = 2 * MAX_SB_SIZE;
42*77c1e3ccSAndroid Build Coastguard Worker   static const int kMaxMaskSize = kMaxMaskWidth * kMaxMaskWidth;
43*77c1e3ccSAndroid Build Coastguard Worker 
44*77c1e3ccSAndroid Build Coastguard Worker   ~BlendA64MaskTest() override = default;
45*77c1e3ccSAndroid Build Coastguard Worker 
46*77c1e3ccSAndroid Build Coastguard Worker   virtual void Execute(const SrcPixel *p_src0, const SrcPixel *p_src1,
47*77c1e3ccSAndroid Build Coastguard Worker                        int run_times) = 0;
48*77c1e3ccSAndroid Build Coastguard Worker 
49*77c1e3ccSAndroid Build Coastguard Worker   template <typename Pixel>
GetSources(Pixel ** src0,Pixel ** src1,Pixel *,int run_times)50*77c1e3ccSAndroid Build Coastguard Worker   void GetSources(Pixel **src0, Pixel **src1, Pixel * /*dst*/, int run_times) {
51*77c1e3ccSAndroid Build Coastguard Worker     if (run_times > 1) {
52*77c1e3ccSAndroid Build Coastguard Worker       *src0 = src0_;
53*77c1e3ccSAndroid Build Coastguard Worker       *src1 = src1_;
54*77c1e3ccSAndroid Build Coastguard Worker       return;
55*77c1e3ccSAndroid Build Coastguard Worker     }
56*77c1e3ccSAndroid Build Coastguard Worker     switch (this->rng_(3)) {
57*77c1e3ccSAndroid Build Coastguard Worker       case 0:  // Separate sources
58*77c1e3ccSAndroid Build Coastguard Worker         *src0 = src0_;
59*77c1e3ccSAndroid Build Coastguard Worker         *src1 = src1_;
60*77c1e3ccSAndroid Build Coastguard Worker         break;
61*77c1e3ccSAndroid Build Coastguard Worker       case 1:  // src0 == dst
62*77c1e3ccSAndroid Build Coastguard Worker         *src0 = dst_tst_;
63*77c1e3ccSAndroid Build Coastguard Worker         src0_stride_ = dst_stride_;
64*77c1e3ccSAndroid Build Coastguard Worker         src0_offset_ = dst_offset_;
65*77c1e3ccSAndroid Build Coastguard Worker         *src1 = src1_;
66*77c1e3ccSAndroid Build Coastguard Worker         break;
67*77c1e3ccSAndroid Build Coastguard Worker       case 2:  // src1 == dst
68*77c1e3ccSAndroid Build Coastguard Worker         *src0 = src0_;
69*77c1e3ccSAndroid Build Coastguard Worker         *src1 = dst_tst_;
70*77c1e3ccSAndroid Build Coastguard Worker         src1_stride_ = dst_stride_;
71*77c1e3ccSAndroid Build Coastguard Worker         src1_offset_ = dst_offset_;
72*77c1e3ccSAndroid Build Coastguard Worker         break;
73*77c1e3ccSAndroid Build Coastguard Worker       default: FAIL();
74*77c1e3ccSAndroid Build Coastguard Worker     }
75*77c1e3ccSAndroid Build Coastguard Worker   }
76*77c1e3ccSAndroid Build Coastguard Worker 
GetSources(uint16_t ** src0,uint16_t ** src1,uint8_t *,int)77*77c1e3ccSAndroid Build Coastguard Worker   void GetSources(uint16_t **src0, uint16_t **src1, uint8_t * /*dst*/,
78*77c1e3ccSAndroid Build Coastguard Worker                   int /*run_times*/) {
79*77c1e3ccSAndroid Build Coastguard Worker     *src0 = src0_;
80*77c1e3ccSAndroid Build Coastguard Worker     *src1 = src1_;
81*77c1e3ccSAndroid Build Coastguard Worker   }
82*77c1e3ccSAndroid Build Coastguard Worker 
Rand1()83*77c1e3ccSAndroid Build Coastguard Worker   uint8_t Rand1() { return this->rng_.Rand8() & 1; }
84*77c1e3ccSAndroid Build Coastguard Worker 
RunOneTest(int block_size,int subx,int suby,int run_times)85*77c1e3ccSAndroid Build Coastguard Worker   void RunOneTest(int block_size, int subx, int suby, int run_times) {
86*77c1e3ccSAndroid Build Coastguard Worker     w_ = block_size_wide[block_size];
87*77c1e3ccSAndroid Build Coastguard Worker     h_ = block_size_high[block_size];
88*77c1e3ccSAndroid Build Coastguard Worker     run_times = run_times > 1 ? run_times / w_ : 1;
89*77c1e3ccSAndroid Build Coastguard Worker     ASSERT_GT(run_times, 0);
90*77c1e3ccSAndroid Build Coastguard Worker     subx_ = subx;
91*77c1e3ccSAndroid Build Coastguard Worker     suby_ = suby;
92*77c1e3ccSAndroid Build Coastguard Worker 
93*77c1e3ccSAndroid Build Coastguard Worker     dst_offset_ = this->rng_(33);
94*77c1e3ccSAndroid Build Coastguard Worker     dst_stride_ = this->rng_(kMaxWidth + 1 - w_) + w_;
95*77c1e3ccSAndroid Build Coastguard Worker 
96*77c1e3ccSAndroid Build Coastguard Worker     src0_offset_ = this->rng_(33);
97*77c1e3ccSAndroid Build Coastguard Worker     src0_stride_ = this->rng_(kMaxWidth + 1 - w_) + w_;
98*77c1e3ccSAndroid Build Coastguard Worker 
99*77c1e3ccSAndroid Build Coastguard Worker     src1_offset_ = this->rng_(33);
100*77c1e3ccSAndroid Build Coastguard Worker     src1_stride_ = this->rng_(kMaxWidth + 1 - w_) + w_;
101*77c1e3ccSAndroid Build Coastguard Worker 
102*77c1e3ccSAndroid Build Coastguard Worker     mask_stride_ =
103*77c1e3ccSAndroid Build Coastguard Worker         this->rng_(kMaxWidth + 1 - w_ * (subx_ ? 2 : 1)) + w_ * (subx_ ? 2 : 1);
104*77c1e3ccSAndroid Build Coastguard Worker 
105*77c1e3ccSAndroid Build Coastguard Worker     SrcPixel *p_src0;
106*77c1e3ccSAndroid Build Coastguard Worker     SrcPixel *p_src1;
107*77c1e3ccSAndroid Build Coastguard Worker 
108*77c1e3ccSAndroid Build Coastguard Worker     p_src0 = src0_;
109*77c1e3ccSAndroid Build Coastguard Worker     p_src1 = src1_;
110*77c1e3ccSAndroid Build Coastguard Worker 
111*77c1e3ccSAndroid Build Coastguard Worker     GetSources(&p_src0, &p_src1, &dst_ref_[0], run_times);
112*77c1e3ccSAndroid Build Coastguard Worker 
113*77c1e3ccSAndroid Build Coastguard Worker     Execute(p_src0, p_src1, run_times);
114*77c1e3ccSAndroid Build Coastguard Worker 
115*77c1e3ccSAndroid Build Coastguard Worker     for (int r = 0; r < h_; ++r) {
116*77c1e3ccSAndroid Build Coastguard Worker       for (int c = 0; c < w_; ++c) {
117*77c1e3ccSAndroid Build Coastguard Worker         ASSERT_EQ(dst_ref_[dst_offset_ + r * dst_stride_ + c],
118*77c1e3ccSAndroid Build Coastguard Worker                   dst_tst_[dst_offset_ + r * dst_stride_ + c])
119*77c1e3ccSAndroid Build Coastguard Worker             << w_ << "x" << h_ << " subx " << subx_ << " suby " << suby_
120*77c1e3ccSAndroid Build Coastguard Worker             << " r: " << r << " c: " << c;
121*77c1e3ccSAndroid Build Coastguard Worker       }
122*77c1e3ccSAndroid Build Coastguard Worker     }
123*77c1e3ccSAndroid Build Coastguard Worker   }
124*77c1e3ccSAndroid Build Coastguard Worker 
RunTest(int block_size,int run_times)125*77c1e3ccSAndroid Build Coastguard Worker   void RunTest(int block_size, int run_times) {
126*77c1e3ccSAndroid Build Coastguard Worker     for (subx_ = 0; subx_ <= 1; subx_++) {
127*77c1e3ccSAndroid Build Coastguard Worker       for (suby_ = 0; suby_ <= 1; suby_++) {
128*77c1e3ccSAndroid Build Coastguard Worker         RunOneTest(block_size, subx_, suby_, run_times);
129*77c1e3ccSAndroid Build Coastguard Worker       }
130*77c1e3ccSAndroid Build Coastguard Worker     }
131*77c1e3ccSAndroid Build Coastguard Worker   }
132*77c1e3ccSAndroid Build Coastguard Worker 
133*77c1e3ccSAndroid Build Coastguard Worker   DstPixel dst_ref_[kBufSize];
134*77c1e3ccSAndroid Build Coastguard Worker   DstPixel dst_tst_[kBufSize];
135*77c1e3ccSAndroid Build Coastguard Worker   uint32_t dst_stride_;
136*77c1e3ccSAndroid Build Coastguard Worker   uint32_t dst_offset_;
137*77c1e3ccSAndroid Build Coastguard Worker 
138*77c1e3ccSAndroid Build Coastguard Worker   SrcPixel src0_[kBufSize];
139*77c1e3ccSAndroid Build Coastguard Worker   uint32_t src0_stride_;
140*77c1e3ccSAndroid Build Coastguard Worker   uint32_t src0_offset_;
141*77c1e3ccSAndroid Build Coastguard Worker 
142*77c1e3ccSAndroid Build Coastguard Worker   SrcPixel src1_[kBufSize];
143*77c1e3ccSAndroid Build Coastguard Worker   uint32_t src1_stride_;
144*77c1e3ccSAndroid Build Coastguard Worker   uint32_t src1_offset_;
145*77c1e3ccSAndroid Build Coastguard Worker 
146*77c1e3ccSAndroid Build Coastguard Worker   uint8_t mask_[kMaxMaskSize];
147*77c1e3ccSAndroid Build Coastguard Worker   size_t mask_stride_;
148*77c1e3ccSAndroid Build Coastguard Worker 
149*77c1e3ccSAndroid Build Coastguard Worker   int w_;
150*77c1e3ccSAndroid Build Coastguard Worker   int h_;
151*77c1e3ccSAndroid Build Coastguard Worker 
152*77c1e3ccSAndroid Build Coastguard Worker   int suby_;
153*77c1e3ccSAndroid Build Coastguard Worker   int subx_;
154*77c1e3ccSAndroid Build Coastguard Worker };
155*77c1e3ccSAndroid Build Coastguard Worker 
//////////////////////////////////////////////////////////////////////////////
// 8 bit version
//////////////////////////////////////////////////////////////////////////////
159*77c1e3ccSAndroid Build Coastguard Worker 
160*77c1e3ccSAndroid Build Coastguard Worker typedef void (*F8B)(uint8_t *dst, uint32_t dst_stride, const uint8_t *src0,
161*77c1e3ccSAndroid Build Coastguard Worker                     uint32_t src0_stride, const uint8_t *src1,
162*77c1e3ccSAndroid Build Coastguard Worker                     uint32_t src1_stride, const uint8_t *mask,
163*77c1e3ccSAndroid Build Coastguard Worker                     uint32_t mask_stride, int w, int h, int subx, int suby);
164*77c1e3ccSAndroid Build Coastguard Worker typedef libaom_test::FuncParam<F8B> TestFuncs;
165*77c1e3ccSAndroid Build Coastguard Worker 
166*77c1e3ccSAndroid Build Coastguard Worker class BlendA64MaskTest8B : public BlendA64MaskTest<F8B, uint8_t, uint8_t> {
167*77c1e3ccSAndroid Build Coastguard Worker  protected:
Execute(const uint8_t * p_src0,const uint8_t * p_src1,int run_times)168*77c1e3ccSAndroid Build Coastguard Worker   void Execute(const uint8_t *p_src0, const uint8_t *p_src1,
169*77c1e3ccSAndroid Build Coastguard Worker                int run_times) override {
170*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer timer;
171*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer_start(&timer);
172*77c1e3ccSAndroid Build Coastguard Worker     for (int i = 0; i < run_times; ++i) {
173*77c1e3ccSAndroid Build Coastguard Worker       params_.ref_func(dst_ref_ + dst_offset_, dst_stride_,
174*77c1e3ccSAndroid Build Coastguard Worker                        p_src0 + src0_offset_, src0_stride_,
175*77c1e3ccSAndroid Build Coastguard Worker                        p_src1 + src1_offset_, src1_stride_, mask_,
176*77c1e3ccSAndroid Build Coastguard Worker                        kMaxMaskWidth, w_, h_, subx_, suby_);
177*77c1e3ccSAndroid Build Coastguard Worker     }
178*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer_mark(&timer);
179*77c1e3ccSAndroid Build Coastguard Worker     const double time1 = static_cast<double>(aom_usec_timer_elapsed(&timer));
180*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer_start(&timer);
181*77c1e3ccSAndroid Build Coastguard Worker     for (int i = 0; i < run_times; ++i) {
182*77c1e3ccSAndroid Build Coastguard Worker       params_.tst_func(dst_tst_ + dst_offset_, dst_stride_,
183*77c1e3ccSAndroid Build Coastguard Worker                        p_src0 + src0_offset_, src0_stride_,
184*77c1e3ccSAndroid Build Coastguard Worker                        p_src1 + src1_offset_, src1_stride_, mask_,
185*77c1e3ccSAndroid Build Coastguard Worker                        kMaxMaskWidth, w_, h_, subx_, suby_);
186*77c1e3ccSAndroid Build Coastguard Worker     }
187*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer_mark(&timer);
188*77c1e3ccSAndroid Build Coastguard Worker     const double time2 = static_cast<double>(aom_usec_timer_elapsed(&timer));
189*77c1e3ccSAndroid Build Coastguard Worker     if (run_times > 1) {
190*77c1e3ccSAndroid Build Coastguard Worker       printf("%3dx%-3d subx %d suby %d :%7.2f/%7.2fns", w_, h_, subx_, suby_,
191*77c1e3ccSAndroid Build Coastguard Worker              time1, time2);
192*77c1e3ccSAndroid Build Coastguard Worker       printf("(%3.2f)\n", time1 / time2);
193*77c1e3ccSAndroid Build Coastguard Worker     }
194*77c1e3ccSAndroid Build Coastguard Worker   }
195*77c1e3ccSAndroid Build Coastguard Worker };
196*77c1e3ccSAndroid Build Coastguard Worker GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(BlendA64MaskTest8B);
197*77c1e3ccSAndroid Build Coastguard Worker 
// Compares the two implementations on random pixels and random mask values,
// for every block size. All buffers are refilled before each block size.
TEST_P(BlendA64MaskTest8B, RandomValues) {
  for (int bsize = 0; bsize < BLOCK_SIZES_ALL; ++bsize) {
    // Stop once an earlier block size has reported a fatal failure.
    if (HasFatalFailure()) break;

    for (int px = 0; px < kBufSize; ++px) {
      dst_ref_[px] = rng_.Rand8();
      dst_tst_[px] = rng_.Rand8();
      src0_[px] = rng_.Rand8();
      src1_[px] = rng_.Rand8();
    }

    for (int m = 0; m < kMaxMaskSize; ++m) {
      mask_[m] = rng_(AOM_BLEND_A64_MAX_ALPHA + 1);
    }

    RunTest(bsize, 1);
  }
}
214*77c1e3ccSAndroid Build Coastguard Worker 
// Compares the two implementations on values at the top of the range:
// pixels are 254 plus a draw from rng_(2), mask values are
// AOM_BLEND_A64_MAX_ALPHA - 1 plus a draw from rng_(2). The buffers are
// filled once and reused for every block size.
TEST_P(BlendA64MaskTest8B, ExtremeValues) {
  for (int px = 0; px < kBufSize; ++px) {
    dst_ref_[px] = rng_(2) + 254;
    dst_tst_[px] = rng_(2) + 254;
    src0_[px] = rng_(2) + 254;
    src1_[px] = rng_(2) + 254;
  }

  for (int m = 0; m < kMaxMaskSize; ++m) {
    mask_[m] = rng_(2) + AOM_BLEND_A64_MAX_ALPHA - 1;
  }

  for (int bsize = 0; bsize < BLOCK_SIZES_ALL; ++bsize) {
    // Stop once an earlier block size has reported a fatal failure.
    if (HasFatalFailure()) break;
    RunTest(bsize, 1);
  }
}
229*77c1e3ccSAndroid Build Coastguard Worker 
// Timing run (disabled by default): random data, many repetitions per block
// size. RunOneTest() divides the repetition count by the block width.
TEST_P(BlendA64MaskTest8B, DISABLED_Speed) {
  const int kRunTimes = 10000000;
  for (int bsize = 0; bsize < BLOCK_SIZES_ALL; ++bsize) {
    for (int px = 0; px < kBufSize; ++px) {
      dst_ref_[px] = rng_.Rand8();
      dst_tst_[px] = rng_.Rand8();
      src0_[px] = rng_.Rand8();
      src1_[px] = rng_.Rand8();
    }

    for (int m = 0; m < kMaxMaskSize; ++m) {
      mask_[m] = rng_(AOM_BLEND_A64_MAX_ALPHA + 1);
    }

    RunTest(bsize, kRunTimes);
  }
}
// Instantiations of BlendA64MaskTest8B, one per enabled SIMD flavour.
// Each TestFuncs holds the two functions that are compared - presumably in
// (reference, tested) order; the FuncParam constructor is not visible here.
#if HAVE_SSE4_1
INSTANTIATE_TEST_SUITE_P(
    SSE4_1, BlendA64MaskTest8B,
    ::testing::Values(TestFuncs(aom_blend_a64_mask_c,
                                aom_blend_a64_mask_sse4_1)));
#endif  // HAVE_SSE4_1

#if HAVE_AVX2
// NOTE(review): unlike the other suites, the first function here is the
// SSE4.1 kernel rather than the C implementation - confirm this is intended.
INSTANTIATE_TEST_SUITE_P(
    AVX2, BlendA64MaskTest8B,
    ::testing::Values(TestFuncs(aom_blend_a64_mask_sse4_1,
                                aom_blend_a64_mask_avx2)));
#endif  // HAVE_AVX2

#if HAVE_NEON
INSTANTIATE_TEST_SUITE_P(
    NEON, BlendA64MaskTest8B,
    ::testing::Values(TestFuncs(aom_blend_a64_mask_c,
                                aom_blend_a64_mask_neon)));
#endif  // HAVE_NEON
264*77c1e3ccSAndroid Build Coastguard Worker 
//////////////////////////////////////////////////////////////////////////////
// 8 bit _d16 version
//////////////////////////////////////////////////////////////////////////////
268*77c1e3ccSAndroid Build Coastguard Worker 
269*77c1e3ccSAndroid Build Coastguard Worker typedef void (*F8B_D16)(uint8_t *dst, uint32_t dst_stride, const uint16_t *src0,
270*77c1e3ccSAndroid Build Coastguard Worker                         uint32_t src0_stride, const uint16_t *src1,
271*77c1e3ccSAndroid Build Coastguard Worker                         uint32_t src1_stride, const uint8_t *mask,
272*77c1e3ccSAndroid Build Coastguard Worker                         uint32_t mask_stride, int w, int h, int subx, int suby,
273*77c1e3ccSAndroid Build Coastguard Worker                         ConvolveParams *conv_params);
274*77c1e3ccSAndroid Build Coastguard Worker typedef libaom_test::FuncParam<F8B_D16> TestFuncs_d16;
275*77c1e3ccSAndroid Build Coastguard Worker 
276*77c1e3ccSAndroid Build Coastguard Worker class BlendA64MaskTest8B_d16
277*77c1e3ccSAndroid Build Coastguard Worker     : public BlendA64MaskTest<F8B_D16, uint16_t, uint8_t> {
278*77c1e3ccSAndroid Build Coastguard Worker  protected:
279*77c1e3ccSAndroid Build Coastguard Worker   // max number of bits used by the source
280*77c1e3ccSAndroid Build Coastguard Worker   static const int kSrcMaxBitsMask = 0x3fff;
281*77c1e3ccSAndroid Build Coastguard Worker 
Execute(const uint16_t * p_src0,const uint16_t * p_src1,int run_times)282*77c1e3ccSAndroid Build Coastguard Worker   void Execute(const uint16_t *p_src0, const uint16_t *p_src1,
283*77c1e3ccSAndroid Build Coastguard Worker                int run_times) override {
284*77c1e3ccSAndroid Build Coastguard Worker     ConvolveParams conv_params;
285*77c1e3ccSAndroid Build Coastguard Worker     conv_params.round_0 = ROUND0_BITS;
286*77c1e3ccSAndroid Build Coastguard Worker     conv_params.round_1 = COMPOUND_ROUND1_BITS;
287*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer timer;
288*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer_start(&timer);
289*77c1e3ccSAndroid Build Coastguard Worker     for (int i = 0; i < run_times; ++i) {
290*77c1e3ccSAndroid Build Coastguard Worker       params_.ref_func(dst_ref_ + dst_offset_, dst_stride_,
291*77c1e3ccSAndroid Build Coastguard Worker                        p_src0 + src0_offset_, src0_stride_,
292*77c1e3ccSAndroid Build Coastguard Worker                        p_src1 + src1_offset_, src1_stride_, mask_,
293*77c1e3ccSAndroid Build Coastguard Worker                        kMaxMaskWidth, w_, h_, subx_, suby_, &conv_params);
294*77c1e3ccSAndroid Build Coastguard Worker     }
295*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer_mark(&timer);
296*77c1e3ccSAndroid Build Coastguard Worker     const double time1 = static_cast<double>(aom_usec_timer_elapsed(&timer));
297*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer_start(&timer);
298*77c1e3ccSAndroid Build Coastguard Worker     for (int i = 0; i < run_times; ++i) {
299*77c1e3ccSAndroid Build Coastguard Worker       params_.tst_func(dst_tst_ + dst_offset_, dst_stride_,
300*77c1e3ccSAndroid Build Coastguard Worker                        p_src0 + src0_offset_, src0_stride_,
301*77c1e3ccSAndroid Build Coastguard Worker                        p_src1 + src1_offset_, src1_stride_, mask_,
302*77c1e3ccSAndroid Build Coastguard Worker                        kMaxMaskWidth, w_, h_, subx_, suby_, &conv_params);
303*77c1e3ccSAndroid Build Coastguard Worker     }
304*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer_mark(&timer);
305*77c1e3ccSAndroid Build Coastguard Worker     const double time2 = static_cast<double>(aom_usec_timer_elapsed(&timer));
306*77c1e3ccSAndroid Build Coastguard Worker     if (run_times > 1) {
307*77c1e3ccSAndroid Build Coastguard Worker       printf("%3dx%-3d subx %d suby %d :%7.2f/%7.2fns", w_, h_, subx_, suby_,
308*77c1e3ccSAndroid Build Coastguard Worker              time1, time2);
309*77c1e3ccSAndroid Build Coastguard Worker       printf("(%3.2f)\n", time1 / time2);
310*77c1e3ccSAndroid Build Coastguard Worker     }
311*77c1e3ccSAndroid Build Coastguard Worker   }
312*77c1e3ccSAndroid Build Coastguard Worker };
313*77c1e3ccSAndroid Build Coastguard Worker GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(BlendA64MaskTest8B_d16);
314*77c1e3ccSAndroid Build Coastguard Worker 
// Compares the two implementations on random data for every block size.
// Destination pixels are random bytes; source samples are random 16-bit
// values masked with kSrcMaxBitsMask. Buffers are refilled per block size.
TEST_P(BlendA64MaskTest8B_d16, RandomValues) {
  for (int bsize = 0; bsize < BLOCK_SIZES_ALL; ++bsize) {
    // Stop once an earlier block size has reported a fatal failure.
    if (HasFatalFailure()) break;

    for (int px = 0; px < kBufSize; ++px) {
      dst_ref_[px] = rng_.Rand8();
      dst_tst_[px] = rng_.Rand8();
      src0_[px] = rng_.Rand16() & kSrcMaxBitsMask;
      src1_[px] = rng_.Rand16() & kSrcMaxBitsMask;
    }

    for (int m = 0; m < kMaxMaskSize; ++m) {
      mask_[m] = rng_(AOM_BLEND_A64_MAX_ALPHA + 1);
    }

    RunTest(bsize, 1);
  }
}
331*77c1e3ccSAndroid Build Coastguard Worker 
// Compares the two implementations on fixed extreme inputs: destinations are
// 255, sources are kSrcMaxBitsMask and every mask value is
// AOM_BLEND_A64_MAX_ALPHA - 1. The buffers are filled once and reused for
// every block size.
TEST_P(BlendA64MaskTest8B_d16, ExtremeValues) {
  for (int px = 0; px < kBufSize; ++px) {
    dst_ref_[px] = 255;
    dst_tst_[px] = 255;
    src0_[px] = kSrcMaxBitsMask;
    src1_[px] = kSrcMaxBitsMask;
  }

  for (int m = 0; m < kMaxMaskSize; ++m) {
    mask_[m] = AOM_BLEND_A64_MAX_ALPHA - 1;
  }

  for (int bsize = 0; bsize < BLOCK_SIZES_ALL; ++bsize) {
    // Stop once an earlier block size has reported a fatal failure.
    if (HasFatalFailure()) break;
    RunTest(bsize, 1);
  }
}
346*77c1e3ccSAndroid Build Coastguard Worker 
// Timing run (disabled by default): random data, many repetitions per block
// size. RunOneTest() divides the repetition count by the block width.
TEST_P(BlendA64MaskTest8B_d16, DISABLED_Speed) {
  const int kRunTimes = 10000000;
  for (int bsize = 0; bsize < BLOCK_SIZES_ALL; ++bsize) {
    for (int px = 0; px < kBufSize; ++px) {
      dst_ref_[px] = rng_.Rand8();
      dst_tst_[px] = rng_.Rand8();
      src0_[px] = rng_.Rand16() & kSrcMaxBitsMask;
      src1_[px] = rng_.Rand16() & kSrcMaxBitsMask;
    }

    for (int m = 0; m < kMaxMaskSize; ++m) {
      mask_[m] = rng_(AOM_BLEND_A64_MAX_ALPHA + 1);
    }

    RunTest(bsize, kRunTimes);
  }
}
364*77c1e3ccSAndroid Build Coastguard Worker 
// Instantiations of BlendA64MaskTest8B_d16, one per enabled SIMD flavour.
// Every suite pairs the C implementation with one SIMD implementation.
#if HAVE_SSE4_1
INSTANTIATE_TEST_SUITE_P(SSE4_1, BlendA64MaskTest8B_d16,
                         ::testing::Values(TestFuncs_d16(
                             aom_lowbd_blend_a64_d16_mask_c,
                             aom_lowbd_blend_a64_d16_mask_sse4_1)));
#endif  // HAVE_SSE4_1

#if HAVE_AVX2
INSTANTIATE_TEST_SUITE_P(AVX2, BlendA64MaskTest8B_d16,
                         ::testing::Values(TestFuncs_d16(
                             aom_lowbd_blend_a64_d16_mask_c,
                             aom_lowbd_blend_a64_d16_mask_avx2)));
#endif  // HAVE_AVX2

#if HAVE_NEON
INSTANTIATE_TEST_SUITE_P(NEON, BlendA64MaskTest8B_d16,
                         ::testing::Values(TestFuncs_d16(
                             aom_lowbd_blend_a64_d16_mask_c,
                             aom_lowbd_blend_a64_d16_mask_neon)));
#endif  // HAVE_NEON
385*77c1e3ccSAndroid Build Coastguard Worker 
//////////////////////////////////////////////////////////////////////////////
// High bit-depth version
//////////////////////////////////////////////////////////////////////////////
389*77c1e3ccSAndroid Build Coastguard Worker #if CONFIG_AV1_HIGHBITDEPTH
390*77c1e3ccSAndroid Build Coastguard Worker typedef void (*FHBD)(uint8_t *dst, uint32_t dst_stride, const uint8_t *src0,
391*77c1e3ccSAndroid Build Coastguard Worker                      uint32_t src0_stride, const uint8_t *src1,
392*77c1e3ccSAndroid Build Coastguard Worker                      uint32_t src1_stride, const uint8_t *mask,
393*77c1e3ccSAndroid Build Coastguard Worker                      uint32_t mask_stride, int w, int h, int subx, int suby,
394*77c1e3ccSAndroid Build Coastguard Worker                      int bd);
395*77c1e3ccSAndroid Build Coastguard Worker typedef libaom_test::FuncParam<FHBD> TestFuncsHBD;
396*77c1e3ccSAndroid Build Coastguard Worker 
397*77c1e3ccSAndroid Build Coastguard Worker class BlendA64MaskTestHBD : public BlendA64MaskTest<FHBD, uint16_t, uint16_t> {
398*77c1e3ccSAndroid Build Coastguard Worker  protected:
Execute(const uint16_t * p_src0,const uint16_t * p_src1,int run_times)399*77c1e3ccSAndroid Build Coastguard Worker   void Execute(const uint16_t *p_src0, const uint16_t *p_src1,
400*77c1e3ccSAndroid Build Coastguard Worker                int run_times) override {
401*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer timer;
402*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer_start(&timer);
403*77c1e3ccSAndroid Build Coastguard Worker     for (int i = 0; i < run_times; ++i) {
404*77c1e3ccSAndroid Build Coastguard Worker       params_.ref_func(CONVERT_TO_BYTEPTR(dst_ref_ + dst_offset_), dst_stride_,
405*77c1e3ccSAndroid Build Coastguard Worker                        CONVERT_TO_BYTEPTR(p_src0 + src0_offset_), src0_stride_,
406*77c1e3ccSAndroid Build Coastguard Worker                        CONVERT_TO_BYTEPTR(p_src1 + src1_offset_), src1_stride_,
407*77c1e3ccSAndroid Build Coastguard Worker                        mask_, kMaxMaskWidth, w_, h_, subx_, suby_, bit_depth_);
408*77c1e3ccSAndroid Build Coastguard Worker     }
409*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer_mark(&timer);
410*77c1e3ccSAndroid Build Coastguard Worker     const double time1 = static_cast<double>(aom_usec_timer_elapsed(&timer));
411*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer_start(&timer);
412*77c1e3ccSAndroid Build Coastguard Worker     for (int i = 0; i < run_times; ++i) {
413*77c1e3ccSAndroid Build Coastguard Worker       params_.tst_func(CONVERT_TO_BYTEPTR(dst_tst_ + dst_offset_), dst_stride_,
414*77c1e3ccSAndroid Build Coastguard Worker                        CONVERT_TO_BYTEPTR(p_src0 + src0_offset_), src0_stride_,
415*77c1e3ccSAndroid Build Coastguard Worker                        CONVERT_TO_BYTEPTR(p_src1 + src1_offset_), src1_stride_,
416*77c1e3ccSAndroid Build Coastguard Worker                        mask_, kMaxMaskWidth, w_, h_, subx_, suby_, bit_depth_);
417*77c1e3ccSAndroid Build Coastguard Worker     }
418*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer_mark(&timer);
419*77c1e3ccSAndroid Build Coastguard Worker     const double time2 = static_cast<double>(aom_usec_timer_elapsed(&timer));
420*77c1e3ccSAndroid Build Coastguard Worker     if (run_times > 1) {
421*77c1e3ccSAndroid Build Coastguard Worker       printf("%3dx%-3d subx %d suby %d :%7.2f/%7.2fns", w_, h_, subx_, suby_,
422*77c1e3ccSAndroid Build Coastguard Worker              time1, time2);
423*77c1e3ccSAndroid Build Coastguard Worker       printf("(%3.2f)\n", time1 / time2);
424*77c1e3ccSAndroid Build Coastguard Worker     }
425*77c1e3ccSAndroid Build Coastguard Worker   }
426*77c1e3ccSAndroid Build Coastguard Worker 
427*77c1e3ccSAndroid Build Coastguard Worker   int bit_depth_;
428*77c1e3ccSAndroid Build Coastguard Worker };
429*77c1e3ccSAndroid Build Coastguard Worker GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(BlendA64MaskTestHBD);
430*77c1e3ccSAndroid Build Coastguard Worker 
// Compares the tested function with the reference on random samples and a
// random mask, for bit depths 8, 10 and 12 and for every block size.
TEST_P(BlendA64MaskTestHBD, RandomValues) {
  for (bit_depth_ = 8; bit_depth_ <= 12 && !HasFatalFailure();
       bit_depth_ += 2) {
    // Argument handed to rng_ for every sample at this bit depth
    // (presumably an exclusive upper bound -- confirm against the RNG helper).
    const int hi = 1 << bit_depth_;

    // Stop iterating block sizes as soon as a fatal failure is recorded, the
    // same way the ExtremeValues test of this suite does; otherwise every
    // remaining block size would still be run after the first failure.
    for (int bsize = 0; bsize < BLOCK_SIZES_ALL && !HasFatalFailure();
         ++bsize) {
      // Fresh contents for both destinations and both sources on every run.
      for (int i = 0; i < kBufSize; ++i) {
        dst_ref_[i] = rng_(hi);
        dst_tst_[i] = rng_(hi);
        src0_[i] = rng_(hi);
        src1_[i] = rng_(hi);
      }

      for (int i = 0; i < kMaxMaskSize; ++i)
        mask_[i] = rng_(AOM_BLEND_A64_MAX_ALPHA + 1);

      RunTest(bsize, 1);
    }
  }
}
451*77c1e3ccSAndroid Build Coastguard Worker 
// Compares the tested function with the reference on samples drawn from the
// top of the value range and mask entries drawn from the top of the alpha
// range, for bit depths 8, 10 and 12 and for every block size. Stops at the
// first fatal failure.
TEST_P(BlendA64MaskTestHBD, ExtremeValues) {
  bit_depth_ = 8;
  while (bit_depth_ <= 12 && !HasFatalFailure()) {
    // Samples are generated as range_begin + rng_(range_size).
    const int range_end = 1 << bit_depth_;
    const int range_begin = range_end - 2;
    const int range_size = range_end - range_begin;

    for (int block = 0; block < BLOCK_SIZES_ALL && !HasFatalFailure();
         ++block) {
      for (int idx = 0; idx < kBufSize; ++idx) {
        dst_ref_[idx] = range_begin + rng_(range_size);
        dst_tst_[idx] = range_begin + rng_(range_size);
        src0_[idx] = range_begin + rng_(range_size);
        src1_[idx] = range_begin + rng_(range_size);
      }

      for (int idx = 0; idx < kMaxMaskSize; ++idx) {
        mask_[idx] = AOM_BLEND_A64_MAX_ALPHA - 1 + rng_(2);
      }

      RunTest(block, 1);
    }

    bit_depth_ += 2;
  }
}
474*77c1e3ccSAndroid Build Coastguard Worker 
#if HAVE_SSE4_1
// SSE4.1 implementation checked against the C reference.
INSTANTIATE_TEST_SUITE_P(SSE4_1, BlendA64MaskTestHBD,
                         ::testing::Values(TestFuncsHBD(
                             aom_highbd_blend_a64_mask_c,
                             aom_highbd_blend_a64_mask_sse4_1)));
#endif  // HAVE_SSE4_1

#if HAVE_NEON
// Neon implementation checked against the C reference.
INSTANTIATE_TEST_SUITE_P(NEON, BlendA64MaskTestHBD,
                         ::testing::Values(TestFuncsHBD(
                             aom_highbd_blend_a64_mask_c,
                             aom_highbd_blend_a64_mask_neon)));
#endif  // HAVE_NEON
488*77c1e3ccSAndroid Build Coastguard Worker 
489*77c1e3ccSAndroid Build Coastguard Worker //////////////////////////////////////////////////////////////////////////////
490*77c1e3ccSAndroid Build Coastguard Worker // HBD _d16 version
491*77c1e3ccSAndroid Build Coastguard Worker //////////////////////////////////////////////////////////////////////////////
492*77c1e3ccSAndroid Build Coastguard Worker 
493*77c1e3ccSAndroid Build Coastguard Worker typedef void (*FHBD_D16)(uint8_t *dst, uint32_t dst_stride,
494*77c1e3ccSAndroid Build Coastguard Worker                          const CONV_BUF_TYPE *src0, uint32_t src0_stride,
495*77c1e3ccSAndroid Build Coastguard Worker                          const CONV_BUF_TYPE *src1, uint32_t src1_stride,
496*77c1e3ccSAndroid Build Coastguard Worker                          const uint8_t *mask, uint32_t mask_stride, int w,
497*77c1e3ccSAndroid Build Coastguard Worker                          int h, int subx, int suby, ConvolveParams *conv_params,
498*77c1e3ccSAndroid Build Coastguard Worker                          const int bd);
499*77c1e3ccSAndroid Build Coastguard Worker typedef libaom_test::FuncParam<FHBD_D16> TestFuncsHBD_d16;
500*77c1e3ccSAndroid Build Coastguard Worker 
501*77c1e3ccSAndroid Build Coastguard Worker class BlendA64MaskTestHBD_d16
502*77c1e3ccSAndroid Build Coastguard Worker     : public BlendA64MaskTest<FHBD_D16, uint16_t, uint16_t> {
503*77c1e3ccSAndroid Build Coastguard Worker  protected:
504*77c1e3ccSAndroid Build Coastguard Worker   // max number of bits used by the source
505*77c1e3ccSAndroid Build Coastguard Worker   static const int kSrcMaxBitsMask = (1 << 14) - 1;
506*77c1e3ccSAndroid Build Coastguard Worker   static const int kSrcMaxBitsMaskHBD = (1 << 16) - 1;
507*77c1e3ccSAndroid Build Coastguard Worker 
Execute(const uint16_t * p_src0,const uint16_t * p_src1,int run_times)508*77c1e3ccSAndroid Build Coastguard Worker   void Execute(const uint16_t *p_src0, const uint16_t *p_src1,
509*77c1e3ccSAndroid Build Coastguard Worker                int run_times) override {
510*77c1e3ccSAndroid Build Coastguard Worker     ASSERT_GT(run_times, 0) << "Cannot run 0 iterations of the test.";
511*77c1e3ccSAndroid Build Coastguard Worker     ConvolveParams conv_params;
512*77c1e3ccSAndroid Build Coastguard Worker     conv_params.round_0 = (bit_depth_ == 12) ? ROUND0_BITS + 2 : ROUND0_BITS;
513*77c1e3ccSAndroid Build Coastguard Worker     conv_params.round_1 = COMPOUND_ROUND1_BITS;
514*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer timer;
515*77c1e3ccSAndroid Build Coastguard Worker     aom_usec_timer_start(&timer);
516*77c1e3ccSAndroid Build Coastguard Worker     for (int i = 0; i < run_times; ++i) {
517*77c1e3ccSAndroid Build Coastguard Worker       params_.ref_func(CONVERT_TO_BYTEPTR(dst_ref_ + dst_offset_), dst_stride_,
518*77c1e3ccSAndroid Build Coastguard Worker                        p_src0 + src0_offset_, src0_stride_,
519*77c1e3ccSAndroid Build Coastguard Worker                        p_src1 + src1_offset_, src1_stride_, mask_,
520*77c1e3ccSAndroid Build Coastguard Worker                        kMaxMaskWidth, w_, h_, subx_, suby_, &conv_params,
521*77c1e3ccSAndroid Build Coastguard Worker                        bit_depth_);
522*77c1e3ccSAndroid Build Coastguard Worker     }
523*77c1e3ccSAndroid Build Coastguard Worker     if (params_.tst_func) {
524*77c1e3ccSAndroid Build Coastguard Worker       aom_usec_timer_mark(&timer);
525*77c1e3ccSAndroid Build Coastguard Worker       const double time1 = static_cast<double>(aom_usec_timer_elapsed(&timer));
526*77c1e3ccSAndroid Build Coastguard Worker       aom_usec_timer_start(&timer);
527*77c1e3ccSAndroid Build Coastguard Worker       for (int i = 0; i < run_times; ++i) {
528*77c1e3ccSAndroid Build Coastguard Worker         params_.tst_func(CONVERT_TO_BYTEPTR(dst_tst_ + dst_offset_),
529*77c1e3ccSAndroid Build Coastguard Worker                          dst_stride_, p_src0 + src0_offset_, src0_stride_,
530*77c1e3ccSAndroid Build Coastguard Worker                          p_src1 + src1_offset_, src1_stride_, mask_,
531*77c1e3ccSAndroid Build Coastguard Worker                          kMaxMaskWidth, w_, h_, subx_, suby_, &conv_params,
532*77c1e3ccSAndroid Build Coastguard Worker                          bit_depth_);
533*77c1e3ccSAndroid Build Coastguard Worker       }
534*77c1e3ccSAndroid Build Coastguard Worker       aom_usec_timer_mark(&timer);
535*77c1e3ccSAndroid Build Coastguard Worker       const double time2 = static_cast<double>(aom_usec_timer_elapsed(&timer));
536*77c1e3ccSAndroid Build Coastguard Worker       if (run_times > 1) {
537*77c1e3ccSAndroid Build Coastguard Worker         printf("%3dx%-3d subx %d suby %d :%7.2f/%7.2fns", w_, h_, subx_, suby_,
538*77c1e3ccSAndroid Build Coastguard Worker                time1, time2);
539*77c1e3ccSAndroid Build Coastguard Worker         printf("(%3.2f)\n", time1 / time2);
540*77c1e3ccSAndroid Build Coastguard Worker       }
541*77c1e3ccSAndroid Build Coastguard Worker     }
542*77c1e3ccSAndroid Build Coastguard Worker   }
543*77c1e3ccSAndroid Build Coastguard Worker 
544*77c1e3ccSAndroid Build Coastguard Worker   int bit_depth_;
545*77c1e3ccSAndroid Build Coastguard Worker   int src_max_bits_mask_;
546*77c1e3ccSAndroid Build Coastguard Worker };
547*77c1e3ccSAndroid Build Coastguard Worker 
// Compares the tested function with the reference on random sources and a
// random mask, for bit depths 8, 10 and 12 and for every block size. Does
// nothing when no tested function was supplied and stops at the first fatal
// failure.
TEST_P(BlendA64MaskTestHBD_d16, RandomValues) {
  if (!params_.tst_func) return;

  bit_depth_ = 8;
  while (bit_depth_ <= 12 && !HasFatalFailure()) {
    // Source samples are limited to 14 bits at bit depth 8, 16 bits otherwise.
    if (bit_depth_ == 8) {
      src_max_bits_mask_ = kSrcMaxBitsMask;
    } else {
      src_max_bits_mask_ = kSrcMaxBitsMaskHBD;
    }

    for (int block = 0; block < BLOCK_SIZES_ALL && !HasFatalFailure();
         ++block) {
      for (int idx = 0; idx < kBufSize; ++idx) {
        dst_ref_[idx] = rng_.Rand8();
        dst_tst_[idx] = rng_.Rand8();

        src0_[idx] = rng_.Rand16() & src_max_bits_mask_;
        src1_[idx] = rng_.Rand16() & src_max_bits_mask_;
      }

      for (int idx = 0; idx < kMaxMaskSize; ++idx) {
        mask_[idx] = rng_(AOM_BLEND_A64_MAX_ALPHA + 1);
      }

      RunTest(block, 1);
    }

    bit_depth_ += 2;
  }
}
572*77c1e3ccSAndroid Build Coastguard Worker 
// Compares the tested function with the reference when every source sample
// is at its maximum and every mask entry is AOM_BLEND_A64_MAX_ALPHA, for bit
// depths 8, 10 and 12 and for every block size.
TEST_P(BlendA64MaskTestHBD_d16, ExtremeValues) {
  // Execute() skips the tested call when no tested function is supplied,
  // which would leave dst_tst_ at its fill value below (deliberately
  // different from dst_ref_). Bail out like the RandomValues test does.
  if (params_.tst_func == nullptr) return;
  for (bit_depth_ = 8; bit_depth_ <= 12 && !HasFatalFailure();
       bit_depth_ += 2) {
    src_max_bits_mask_ =
        (bit_depth_ == 8) ? kSrcMaxBitsMask : kSrcMaxBitsMaskHBD;

    // The buffers are filled once per bit depth and reused across block
    // sizes. The two destinations start out with different contents, so a
    // function that fails to write its output cannot go unnoticed.
    for (int i = 0; i < kBufSize; ++i) {
      dst_ref_[i] = 0;
      dst_tst_[i] = (1 << bit_depth_) - 1;

      src0_[i] = src_max_bits_mask_;
      src1_[i] = src_max_bits_mask_;
    }

    for (int i = 0; i < kMaxMaskSize; ++i) mask_[i] = AOM_BLEND_A64_MAX_ALPHA;
    // Stop at the first fatal failure instead of running every remaining
    // block size.
    for (int bsize = 0; bsize < BLOCK_SIZES_ALL && !HasFatalFailure();
         ++bsize) {
      RunTest(bsize, 1);
    }
  }
}
592*77c1e3ccSAndroid Build Coastguard Worker 
// Timing run (disabled by default through the DISABLED_ prefix): for every
// block size and for bit depths 8, 10 and 12, fills the buffers with random
// data and runs the blend functions kRunTimes times each.
TEST_P(BlendA64MaskTestHBD_d16, DISABLED_Speed) {
  const int kRunTimes = 10000000;
  for (int block = 0; block < BLOCK_SIZES_ALL; ++block) {
    bit_depth_ = 8;
    while (bit_depth_ <= 12) {
      // Destination samples are reduced modulo this value.
      const int dst_modulus = 1 << bit_depth_;

      for (int idx = 0; idx < kBufSize; ++idx) {
        dst_ref_[idx] = rng_.Rand12() % dst_modulus;
        dst_tst_[idx] = rng_.Rand12() % dst_modulus;

        src0_[idx] = rng_.Rand16();
        src1_[idx] = rng_.Rand16();
      }

      for (int idx = 0; idx < kMaxMaskSize; ++idx) {
        mask_[idx] = rng_(AOM_BLEND_A64_MAX_ALPHA + 1);
      }

      RunTest(block, kRunTimes);

      bit_depth_ += 2;
    }
  }
}
612*77c1e3ccSAndroid Build Coastguard Worker 
613*77c1e3ccSAndroid Build Coastguard Worker INSTANTIATE_TEST_SUITE_P(
614*77c1e3ccSAndroid Build Coastguard Worker     C, BlendA64MaskTestHBD_d16,
615*77c1e3ccSAndroid Build Coastguard Worker     ::testing::Values(TestFuncsHBD_d16(aom_highbd_blend_a64_d16_mask_c,
616*77c1e3ccSAndroid Build Coastguard Worker                                        aom_highbd_blend_a64_d16_mask_c)));
617*77c1e3ccSAndroid Build Coastguard Worker 
618*77c1e3ccSAndroid Build Coastguard Worker #if HAVE_SSE4_1
619*77c1e3ccSAndroid Build Coastguard Worker INSTANTIATE_TEST_SUITE_P(
620*77c1e3ccSAndroid Build Coastguard Worker     SSE4_1, BlendA64MaskTestHBD_d16,
621*77c1e3ccSAndroid Build Coastguard Worker     ::testing::Values(TestFuncsHBD_d16(aom_highbd_blend_a64_d16_mask_c,
622*77c1e3ccSAndroid Build Coastguard Worker                                        aom_highbd_blend_a64_d16_mask_sse4_1)));
623*77c1e3ccSAndroid Build Coastguard Worker #endif  // HAVE_SSE4_1
624*77c1e3ccSAndroid Build Coastguard Worker 
625*77c1e3ccSAndroid Build Coastguard Worker #if HAVE_AVX2
626*77c1e3ccSAndroid Build Coastguard Worker INSTANTIATE_TEST_SUITE_P(
627*77c1e3ccSAndroid Build Coastguard Worker     AVX2, BlendA64MaskTestHBD_d16,
628*77c1e3ccSAndroid Build Coastguard Worker     ::testing::Values(TestFuncsHBD_d16(aom_highbd_blend_a64_d16_mask_c,
629*77c1e3ccSAndroid Build Coastguard Worker                                        aom_highbd_blend_a64_d16_mask_avx2)));
630*77c1e3ccSAndroid Build Coastguard Worker #endif  // HAVE_AVX2
631*77c1e3ccSAndroid Build Coastguard Worker 
632*77c1e3ccSAndroid Build Coastguard Worker #if HAVE_NEON
633*77c1e3ccSAndroid Build Coastguard Worker INSTANTIATE_TEST_SUITE_P(
634*77c1e3ccSAndroid Build Coastguard Worker     NEON, BlendA64MaskTestHBD_d16,
635*77c1e3ccSAndroid Build Coastguard Worker     ::testing::Values(TestFuncsHBD_d16(aom_highbd_blend_a64_d16_mask_c,
636*77c1e3ccSAndroid Build Coastguard Worker                                        aom_highbd_blend_a64_d16_mask_neon)));
637*77c1e3ccSAndroid Build Coastguard Worker #endif  // HAVE_NEON
638*77c1e3ccSAndroid Build Coastguard Worker 
// TODO(slavarnway): Enable the following in the avx2 commit. (56501)
// Still compiled out. The instantiation is registered under the AVX2 prefix:
// reusing SSE4_1 here would clash with the SSE4_1 instantiation of the same
// suite as soon as this block is enabled on a build that has both.
#if 0
#if HAVE_AVX2
INSTANTIATE_TEST_SUITE_P(
    AVX2, BlendA64MaskTestHBD,
    ::testing::Values(TestFuncsHBD(aom_highbd_blend_a64_mask_c,
                                   aom_highbd_blend_a64_mask_avx2)));
#endif  // HAVE_AVX2
#endif  // 0
648*77c1e3ccSAndroid Build Coastguard Worker #endif  // CONFIG_AV1_HIGHBITDEPTH
649*77c1e3ccSAndroid Build Coastguard Worker }  // namespace
650