xref: /aosp_15_r20/external/libdav1d/tests/checkasm/refmvs.c (revision c09093415860a1c2373dacd84c4fde00c507cdfd)
1*c0909341SAndroid Build Coastguard Worker /*
2*c0909341SAndroid Build Coastguard Worker  * Copyright © 2021, VideoLAN and dav1d authors
3*c0909341SAndroid Build Coastguard Worker  * All rights reserved.
4*c0909341SAndroid Build Coastguard Worker  *
5*c0909341SAndroid Build Coastguard Worker  * Redistribution and use in source and binary forms, with or without
6*c0909341SAndroid Build Coastguard Worker  * modification, are permitted provided that the following conditions are met:
7*c0909341SAndroid Build Coastguard Worker  *
8*c0909341SAndroid Build Coastguard Worker  * 1. Redistributions of source code must retain the above copyright notice, this
9*c0909341SAndroid Build Coastguard Worker  *    list of conditions and the following disclaimer.
10*c0909341SAndroid Build Coastguard Worker  *
11*c0909341SAndroid Build Coastguard Worker  * 2. Redistributions in binary form must reproduce the above copyright notice,
12*c0909341SAndroid Build Coastguard Worker  *    this list of conditions and the following disclaimer in the documentation
13*c0909341SAndroid Build Coastguard Worker  *    and/or other materials provided with the distribution.
14*c0909341SAndroid Build Coastguard Worker  *
15*c0909341SAndroid Build Coastguard Worker  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
16*c0909341SAndroid Build Coastguard Worker  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
17*c0909341SAndroid Build Coastguard Worker  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18*c0909341SAndroid Build Coastguard Worker  * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
19*c0909341SAndroid Build Coastguard Worker  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
20*c0909341SAndroid Build Coastguard Worker  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
21*c0909341SAndroid Build Coastguard Worker  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
22*c0909341SAndroid Build Coastguard Worker  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
23*c0909341SAndroid Build Coastguard Worker  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
24*c0909341SAndroid Build Coastguard Worker  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
25*c0909341SAndroid Build Coastguard Worker  */
26*c0909341SAndroid Build Coastguard Worker 
27*c0909341SAndroid Build Coastguard Worker #include "tests/checkasm/checkasm.h"
28*c0909341SAndroid Build Coastguard Worker #include "src/refmvs.h"
29*c0909341SAndroid Build Coastguard Worker 
30*c0909341SAndroid Build Coastguard Worker #include <stdio.h>
31*c0909341SAndroid Build Coastguard Worker 
gen_mv(const int total_bits,int spel_bits)32*c0909341SAndroid Build Coastguard Worker static inline int gen_mv(const int total_bits, int spel_bits) {
33*c0909341SAndroid Build Coastguard Worker     int bits = rnd() & ((1 << spel_bits) - 1);
34*c0909341SAndroid Build Coastguard Worker     do {
35*c0909341SAndroid Build Coastguard Worker         bits |= (rnd() & 1) << spel_bits;
36*c0909341SAndroid Build Coastguard Worker     } while (rnd() & 1 && ++spel_bits < total_bits);
37*c0909341SAndroid Build Coastguard Worker     // the do/while makes it relatively more likely to be close to zero (fpel)
38*c0909341SAndroid Build Coastguard Worker     // than far away
39*c0909341SAndroid Build Coastguard Worker     return rnd() & 1 ? -bits : bits;
40*c0909341SAndroid Build Coastguard Worker }
41*c0909341SAndroid Build Coastguard Worker 
// Number of elements in a true array (not valid on pointers).
#define ARRAY_SIZE(arr) (sizeof(arr) / sizeof((arr)[0]))
43*c0909341SAndroid Build Coastguard Worker 
/*
 * Maps a bucket index to the lower bound of its value range.
 *
 * Indices are grouped in runs of nine per decade: 0..9 map to themselves,
 * 10..18 to 10..90 (step 10), 19..27 to 100..900 (step 100), 28..36 to
 * 1000..9000 (step 1000), and everything above 36 uses a step of 10000.
 */
static inline int get_min_mv_val(const int idx) {
    int base = 0;  // last index of the previous decade
    int scale = 1; // step size within the current decade

    // Advance one decade at a time; the 10000 decade is open-ended.
    while (scale < 10000 && idx > base + 9) {
        base += 9;
        scale *= 10;
    }
    return (idx - base) * scale;
}
51*c0909341SAndroid Build Coastguard Worker 
/*
 * Fills *rb with a random temporal block.
 *
 * rb->ref is drawn from 0..6. When it is 0 the function returns right away
 * and rb->mv is left untouched. Otherwise a single draw in [0, 100000000)
 * selects a magnitude bucket for x and, independently of the table used,
 * the same draw selects the bucket for y. Each table's weights add up to
 * exactly 100000000, so a bucket is always found. The value picked inside
 * the bucket is scaled by ref2ref[rb->ref] and clipped to the 16-bit signed
 * range before being stored.
 *
 * ref2ref must be indexable by every non-zero value rb->ref can take (1..6).
 */
static inline void gen_tmv(refmvs_temporal_block *const rb, const int *ref2ref) {
    // Per-bucket weights (out of 100000000) for the horizontal component.
    static const int x_prob[] = {
        26447556, 6800591, 3708783,  2198592, 1635940, 1145901, 1052602, 1261759,
         1099739,  755108, 6075404,  4355916, 3254908, 2897157, 2273676, 2154432,
         1937436, 1694818, 1466863, 10203087, 5241546, 3328819, 2187483, 1458997,
         1030842,  806863,  587219,   525024, 1858953,  422368,  114626,   16992
    };
    // Per-bucket weights (out of 100000000) for the vertical component.
    static const int y_prob[] = {
        33845001, 7591218,  6425971, 4115838, 4032161, 2515962, 2614601, 2343656,
         2898897, 1397254, 10125350, 5124449, 3232914, 2185499, 1608775, 1342585,
          980208,  795714,   649665, 3369250, 1298716,  486002,  279588,  235990,
          110318,   89372,    66895,   46980,  153322,   32960,    4500,     389
    };

    rb->ref = rnd() % 7;
    if (rb->ref == 0)
        return;

    const int roll = rnd() % 100000000;
    const int mv_lo = -(1 << 15);
    const int mv_hi = (1 << 15) - 1;
    int upper;

    // Horizontal component: walk the cumulative weights until roll fits.
    upper = 0;
    for (unsigned bucket = 0; bucket < ARRAY_SIZE(x_prob); bucket++) {
        upper += x_prob[bucket];
        if (roll >= upper)
            continue;
        const int lo = get_min_mv_val(bucket);
        const int span = get_min_mv_val(bucket + 1) - lo;
        const int picked = lo + rnd() % span;
        rb->mv.x = iclip(picked * ref2ref[rb->ref], mv_lo, mv_hi);
        break;
    }

    // Vertical component: same draw, different weight table.
    upper = 0;
    for (unsigned bucket = 0; bucket < ARRAY_SIZE(y_prob); bucket++) {
        upper += y_prob[bucket];
        if (roll >= upper)
            continue;
        const int lo = get_min_mv_val(bucket);
        const int span = get_min_mv_val(bucket + 1) - lo;
        const int picked = lo + rnd() % span;
        rb->mv.y = iclip(picked * ref2ref[rb->ref], mv_lo, mv_hi);
        break;
    }
}
91*c0909341SAndroid Build Coastguard Worker 
/*
 * Draws a random signed distance with magnitude 1..11.
 *
 * The magnitude follows the cumulative percentages in the table below
 * (35% for 1, 20% for 2, ...); the sign is a coin flip. The trailing
 * "return 0" cannot be reached because the last table entry is 100 and
 * the draw is always below 100.
 */
static inline int get_ref2cur(void) {
    static const uint8_t cdf[11] = { 35, 55, 67, 73, 78, 83, 84, 87, 90, 93, 100 };
    const int roll = rnd() % 100;

    int slot = 0;
    while (slot < 11 && roll >= cdf[slot])
        slot++;
    if (slot == 11)
        return 0;

    const int dist = slot + 1;
    if (rnd() & 1)
        return -dist;
    return dist;
}
100*c0909341SAndroid Build Coastguard Worker 
/*
 * Draws a random run length in 1..240.
 *
 * Reference statistics (percent of total) the distribution is modelled on:
 *
 *   =1 =2 =3 =4  <8  =8 <16 =16 <32 =32 <48 =48 <64 =64 >64 eq240
 *    5 17 1.5 16  5  10  5   7   4   3  1.5  2   1    2   20   15   chimera blocks
 *   25 38 2.5 19 3.5 5.5 2 1.87 .86 .4  .18 .2 .067 .165 .478 .28   chimera sequences
 *
 * The cumulative thresholds in the table below correspond to the
 * "chimera sequences" row, expressed in units of 1/100000.
 */
static inline int get_seqlen(void) {
    static const struct {
        int below;   // entry applies when the draw is below this value
        int exact;   // fixed length to return, or 0 for a ranged entry
        int at_most; // ranged entry: length is uniform in 1..at_most
    } dist[] = {
        {  25000,   1,   0 }, // =1
        {  63000,   2,   0 }, // =2
        {  65500,   3,   0 }, // =3
        {  84500,   4,   0 }, // =4
        {  88000,   0,   7 }, // <8
        {  93500,   8,   0 }, // =8
        {  95500,   0,  15 }, // <16
        {  97370,  16,   0 }, // =16
        {  98230,   0,  31 }, // <32
        {  98630,  32,   0 }, // =32
        {  98810,   0,  47 }, // <48
        {  99010,  48,   0 }, // =48
        {  99077,   0,  63 }, // <64
        {  99242,  64,   0 }, // =64
        {  99720,   0, 239 }, // <240
        { 100000, 240,   0 }, // =240 (catch-all: the draw is always < 100000)
    };

    const int roll = rnd() % 100000;

    unsigned k = 0;
    while (roll >= dist[k].below)
        k++;

    if (dist[k].exact)
        return dist[k].exact;
    return 1 + rnd() % dist[k].at_most;
}
128*c0909341SAndroid Build Coastguard Worker 
/*
 * Populates the reference temporal-block planes used by rf with random data.
 *
 * For each of the rf->n_mfmvs references, rows [row_start8, min(row_end8,
 * rf->ih8)) are filled over the column range widened by 8 on each side and
 * clamped to [0, rf->iw8). Each row is written as a sequence of runs: one
 * random block from gen_tmv() repeated get_seqlen() times (truncated at the
 * end of the column range). Entries are addressed with rf->iw8 as the row
 * pitch.
 */
static inline void init_rp_ref(refmvs_frame const *const rf,
                               const int col_start8, const int col_end8,
                               const int row_start8, const int row_end8)
{
    const int first_col = imax(col_start8 - 8, 0);
    const int last_col = imin(col_end8 + 8, rf->iw8);
    const int last_row = imin(row_end8, rf->ih8);

    for (int n = 0; n < rf->n_mfmvs; n++) {
        refmvs_temporal_block *const plane = rf->rp_ref[rf->mfmv_ref[n]];

        for (int row = row_start8; row < last_row; row++) {
            const int row_off = row * rf->iw8;
            int col = first_col;

            while (col < last_col) {
                // One random block, then the length of the run that repeats it.
                refmvs_temporal_block rb;
                gen_tmv(&rb, rf->mfmv_ref2ref[n]);
                int run = get_seqlen();

                while (run != 0 && col < last_col) {
                    plane[row_off + col] = rb;
                    run--;
                    col++;
                }
            }
        }
    }
}
147*c0909341SAndroid Build Coastguard Worker 
check_load_tmvs(const Dav1dRefmvsDSPContext * const c)148*c0909341SAndroid Build Coastguard Worker static void check_load_tmvs(const Dav1dRefmvsDSPContext *const c) {
149*c0909341SAndroid Build Coastguard Worker     refmvs_temporal_block *rp_ref[7] = {0};
150*c0909341SAndroid Build Coastguard Worker     refmvs_temporal_block c_rp_proj[240 * 63];
151*c0909341SAndroid Build Coastguard Worker     refmvs_temporal_block a_rp_proj[240 * 63];
152*c0909341SAndroid Build Coastguard Worker     refmvs_frame rf = {
153*c0909341SAndroid Build Coastguard Worker         .rp_ref = rp_ref,
154*c0909341SAndroid Build Coastguard Worker         .rp_stride = 240, .iw8 = 240, .ih8 = 63,
155*c0909341SAndroid Build Coastguard Worker         .n_mfmvs = 3
156*c0909341SAndroid Build Coastguard Worker     };
157*c0909341SAndroid Build Coastguard Worker     const size_t rp_ref_sz = rf.ih8 * rf.rp_stride * sizeof(refmvs_temporal_block);
158*c0909341SAndroid Build Coastguard Worker 
159*c0909341SAndroid Build Coastguard Worker     declare_func(void, const refmvs_frame *rf, int tile_row_idx,
160*c0909341SAndroid Build Coastguard Worker                  int col_start8, int col_end8, int row_start8, int row_end8);
161*c0909341SAndroid Build Coastguard Worker 
162*c0909341SAndroid Build Coastguard Worker     if (check_func(c->load_tmvs, "load_tmvs")) {
163*c0909341SAndroid Build Coastguard Worker         const int row_start8 = (rnd() & 3) << 4;
164*c0909341SAndroid Build Coastguard Worker         const int row_end8 = row_start8 + 16;
165*c0909341SAndroid Build Coastguard Worker         const int col_start8 = rnd() & 31;
166*c0909341SAndroid Build Coastguard Worker         const int col_end8 = rf.iw8 - (rnd() & 31);
167*c0909341SAndroid Build Coastguard Worker 
168*c0909341SAndroid Build Coastguard Worker         for (int n = 0; n < rf.n_mfmvs; n++) {
169*c0909341SAndroid Build Coastguard Worker             rf.mfmv_ref[n] = rnd() % 7;
170*c0909341SAndroid Build Coastguard Worker             rf.mfmv_ref2cur[n] = get_ref2cur();
171*c0909341SAndroid Build Coastguard Worker             for (int r = 0; r < 7; r++)
172*c0909341SAndroid Build Coastguard Worker                 rf.mfmv_ref2ref[n][r] = rnd() & 31;
173*c0909341SAndroid Build Coastguard Worker         }
174*c0909341SAndroid Build Coastguard Worker         for (int n = 0; n < rf.n_mfmvs; n++) {
175*c0909341SAndroid Build Coastguard Worker             refmvs_temporal_block **p_rp_ref = &rp_ref[rf.mfmv_ref[n]];
176*c0909341SAndroid Build Coastguard Worker             if (!*p_rp_ref)
177*c0909341SAndroid Build Coastguard Worker                 *p_rp_ref = malloc(rp_ref_sz);
178*c0909341SAndroid Build Coastguard Worker         }
179*c0909341SAndroid Build Coastguard Worker         init_rp_ref(&rf, 0, rf.iw8, row_start8, row_end8);
180*c0909341SAndroid Build Coastguard Worker         for (int i = 0; i < rf.iw8 * rf.ih8; i++) {
181*c0909341SAndroid Build Coastguard Worker             c_rp_proj[i].mv.n = a_rp_proj[i].mv.n = 0xdeadbeef;
182*c0909341SAndroid Build Coastguard Worker             c_rp_proj[i].ref = a_rp_proj[i].ref = 0xdd;
183*c0909341SAndroid Build Coastguard Worker         }
184*c0909341SAndroid Build Coastguard Worker 
185*c0909341SAndroid Build Coastguard Worker         rf.n_tile_threads = 1;
186*c0909341SAndroid Build Coastguard Worker 
187*c0909341SAndroid Build Coastguard Worker         rf.rp_proj = c_rp_proj;
188*c0909341SAndroid Build Coastguard Worker         call_ref(&rf, 0, col_start8, col_end8, row_start8, row_end8);
189*c0909341SAndroid Build Coastguard Worker         rf.rp_proj = a_rp_proj;
190*c0909341SAndroid Build Coastguard Worker         call_new(&rf, 0, col_start8, col_end8, row_start8, row_end8);
191*c0909341SAndroid Build Coastguard Worker 
192*c0909341SAndroid Build Coastguard Worker         for (int i = 0; i < rf.ih8; i++)
193*c0909341SAndroid Build Coastguard Worker             for (int j = 0; j < rf.iw8; j++)
194*c0909341SAndroid Build Coastguard Worker                 if (c_rp_proj[i * rf.iw8 + j].mv.n != a_rp_proj[i * rf.iw8 + j].mv.n ||
195*c0909341SAndroid Build Coastguard Worker                     (c_rp_proj[i * rf.iw8 + j].ref != a_rp_proj[i * rf.iw8 + j].ref &&
196*c0909341SAndroid Build Coastguard Worker                      c_rp_proj[i * rf.iw8 + j].mv.n != INVALID_MV))
197*c0909341SAndroid Build Coastguard Worker                 {
198*c0909341SAndroid Build Coastguard Worker                     if (fail()) {
199*c0909341SAndroid Build Coastguard Worker                         fprintf(stderr, "[%d][%d] c_rp.mv.x = 0x%x a_rp.mv.x = 0x%x\n",
200*c0909341SAndroid Build Coastguard Worker                                 i, j, c_rp_proj[i * rf.iw8 + j].mv.x, a_rp_proj[i * rf.iw8 + j].mv.x);
201*c0909341SAndroid Build Coastguard Worker                         fprintf(stderr, "[%d][%d] c_rp.mv.y = 0x%x a_rp.mv.y = 0x%x\n",
202*c0909341SAndroid Build Coastguard Worker                                 i, j, c_rp_proj[i * rf.iw8 + j].mv.y, a_rp_proj[i * rf.iw8 + j].mv.y);
203*c0909341SAndroid Build Coastguard Worker                         fprintf(stderr, "[%d][%d] c_rp.ref = %u a_rp.ref = %u\n",
204*c0909341SAndroid Build Coastguard Worker                                 i, j, c_rp_proj[i * rf.iw8 + j].ref, a_rp_proj[i * rf.iw8 + j].ref);
205*c0909341SAndroid Build Coastguard Worker                     }
206*c0909341SAndroid Build Coastguard Worker                 }
207*c0909341SAndroid Build Coastguard Worker 
208*c0909341SAndroid Build Coastguard Worker         if (checkasm_bench_func()) {
209*c0909341SAndroid Build Coastguard Worker             for (int n = 0; n < rf.n_mfmvs; n++) {
210*c0909341SAndroid Build Coastguard Worker                 rf.mfmv_ref2cur[n] = 1;
211*c0909341SAndroid Build Coastguard Worker                 for (int r = 0; r < 7; r++)
212*c0909341SAndroid Build Coastguard Worker                     rf.mfmv_ref2ref[n][r] = 1;
213*c0909341SAndroid Build Coastguard Worker             }
214*c0909341SAndroid Build Coastguard Worker             bench_new(&rf, 0, 0, rf.iw8, row_start8, row_end8);
215*c0909341SAndroid Build Coastguard Worker         }
216*c0909341SAndroid Build Coastguard Worker 
217*c0909341SAndroid Build Coastguard Worker         for (int n = 0; n < rf.n_mfmvs; n++) {
218*c0909341SAndroid Build Coastguard Worker             free(rp_ref[rf.mfmv_ref[n]]);
219*c0909341SAndroid Build Coastguard Worker             rp_ref[rf.mfmv_ref[n]] = NULL;
220*c0909341SAndroid Build Coastguard Worker         }
221*c0909341SAndroid Build Coastguard Worker     }
222*c0909341SAndroid Build Coastguard Worker 
223*c0909341SAndroid Build Coastguard Worker     report("load_tmvs");
224*c0909341SAndroid Build Coastguard Worker }
225*c0909341SAndroid Build Coastguard Worker 
check_save_tmvs(const Dav1dRefmvsDSPContext * const c)226*c0909341SAndroid Build Coastguard Worker static void check_save_tmvs(const Dav1dRefmvsDSPContext *const c) {
227*c0909341SAndroid Build Coastguard Worker     refmvs_block *rr[31];
228*c0909341SAndroid Build Coastguard Worker     refmvs_block r[31 * 256];
229*c0909341SAndroid Build Coastguard Worker     ALIGN_STK_64(refmvs_temporal_block, c_rp, 128 * 16,);
230*c0909341SAndroid Build Coastguard Worker     ALIGN_STK_64(refmvs_temporal_block, a_rp, 128 * 16,);
231*c0909341SAndroid Build Coastguard Worker     uint8_t ref_sign[7];
232*c0909341SAndroid Build Coastguard Worker 
233*c0909341SAndroid Build Coastguard Worker     for (int i = 0; i < 31; i++)
234*c0909341SAndroid Build Coastguard Worker         rr[i] = &r[i * 256];
235*c0909341SAndroid Build Coastguard Worker 
236*c0909341SAndroid Build Coastguard Worker     declare_func(void, refmvs_temporal_block *rp, const ptrdiff_t stride,
237*c0909341SAndroid Build Coastguard Worker                  refmvs_block *const *const rr, const uint8_t *const ref_sign,
238*c0909341SAndroid Build Coastguard Worker                  int col_end8, int row_end8, int col_start8, int row_start8);
239*c0909341SAndroid Build Coastguard Worker 
240*c0909341SAndroid Build Coastguard Worker     if (check_func(c->save_tmvs, "save_tmvs")) {
241*c0909341SAndroid Build Coastguard Worker         const int row_start8 = rnd() & 7;
242*c0909341SAndroid Build Coastguard Worker         const int row_end8 = 8 + (rnd() & 7);
243*c0909341SAndroid Build Coastguard Worker         const int col_start8 = rnd() & 31;
244*c0909341SAndroid Build Coastguard Worker         const int col_end8 = 96 + (rnd() & 31);
245*c0909341SAndroid Build Coastguard Worker 
246*c0909341SAndroid Build Coastguard Worker         for (int i = 0; i < 7; i++)
247*c0909341SAndroid Build Coastguard Worker             ref_sign[i] = rnd() & 1;
248*c0909341SAndroid Build Coastguard Worker 
249*c0909341SAndroid Build Coastguard Worker         for (int i = row_start8; i < row_end8; i++)
250*c0909341SAndroid Build Coastguard Worker             for (int j = col_start8; j < col_end8;) {
251*c0909341SAndroid Build Coastguard Worker                 int bs = rnd() % N_BS_SIZES;
252*c0909341SAndroid Build Coastguard Worker                 while (j + ((dav1d_block_dimensions[bs][0] + 1) >> 1) > col_end8)
253*c0909341SAndroid Build Coastguard Worker                     bs++;
254*c0909341SAndroid Build Coastguard Worker                 rr[i * 2][j * 2 + 1] = (refmvs_block) {
255*c0909341SAndroid Build Coastguard Worker                     .mv.mv[0].x = gen_mv(14, 10),
256*c0909341SAndroid Build Coastguard Worker                     .mv.mv[0].y = gen_mv(14, 10),
257*c0909341SAndroid Build Coastguard Worker                     .mv.mv[1].x = gen_mv(14, 10),
258*c0909341SAndroid Build Coastguard Worker                     .mv.mv[1].y = gen_mv(14, 10),
259*c0909341SAndroid Build Coastguard Worker                     .ref.ref = { (rnd() % 9) - 1, (rnd() % 9) - 1 },
260*c0909341SAndroid Build Coastguard Worker                     .bs = bs
261*c0909341SAndroid Build Coastguard Worker                 };
262*c0909341SAndroid Build Coastguard Worker                 for (int k = 0; k < (dav1d_block_dimensions[bs][0] + 1) >> 1; k++, j++) {
263*c0909341SAndroid Build Coastguard Worker                     c_rp[i * 128 + j].mv.n = 0xdeadbeef;
264*c0909341SAndroid Build Coastguard Worker                     c_rp[i * 128 + j].ref = 0xdd;
265*c0909341SAndroid Build Coastguard Worker                 }
266*c0909341SAndroid Build Coastguard Worker             }
267*c0909341SAndroid Build Coastguard Worker 
268*c0909341SAndroid Build Coastguard Worker         call_ref(c_rp + row_start8 * 128, 128, rr, ref_sign,
269*c0909341SAndroid Build Coastguard Worker                  col_end8, row_end8, col_start8, row_start8);
270*c0909341SAndroid Build Coastguard Worker         call_new(a_rp + row_start8 * 128, 128, rr, ref_sign,
271*c0909341SAndroid Build Coastguard Worker                  col_end8, row_end8, col_start8, row_start8);
272*c0909341SAndroid Build Coastguard Worker         for (int i = row_start8; i < row_end8; i++)
273*c0909341SAndroid Build Coastguard Worker             for (int j = col_start8; j < col_end8; j++)
274*c0909341SAndroid Build Coastguard Worker                 if (c_rp[i * 128 + j].mv.n != a_rp[i * 128 + j].mv.n ||
275*c0909341SAndroid Build Coastguard Worker                     c_rp[i * 128 + j].ref != a_rp[i * 128 + j].ref)
276*c0909341SAndroid Build Coastguard Worker                 {
277*c0909341SAndroid Build Coastguard Worker                     if (fail()) {
278*c0909341SAndroid Build Coastguard Worker                         fprintf(stderr, "[%d][%d] c_rp.mv.x = 0x%x a_rp.mv.x = 0x%x\n",
279*c0909341SAndroid Build Coastguard Worker                                 i, j, c_rp[i * 128 + j].mv.x, a_rp[i * 128 + j].mv.x);
280*c0909341SAndroid Build Coastguard Worker                         fprintf(stderr, "[%d][%d] c_rp.mv.y = 0x%x a_rp.mv.y = 0x%x\n",
281*c0909341SAndroid Build Coastguard Worker                                 i, j, c_rp[i * 128 + j].mv.y, a_rp[i * 128 + j].mv.y);
282*c0909341SAndroid Build Coastguard Worker                         fprintf(stderr, "[%d][%d] c_rp.ref = %u a_rp.ref = %u\n",
283*c0909341SAndroid Build Coastguard Worker                                 i, j, c_rp[i * 128 + j].ref, a_rp[i * 128 + j].ref);
284*c0909341SAndroid Build Coastguard Worker                     }
285*c0909341SAndroid Build Coastguard Worker                 }
286*c0909341SAndroid Build Coastguard Worker 
287*c0909341SAndroid Build Coastguard Worker         for (int bs = BS_4x4; bs < N_BS_SIZES; bs++) {
288*c0909341SAndroid Build Coastguard Worker             const int bw8 = (dav1d_block_dimensions[bs][0] + 1) >> 1;
289*c0909341SAndroid Build Coastguard Worker             for (int i = 0; i < 16; i++)
290*c0909341SAndroid Build Coastguard Worker                 for (int j = 0; j < 128; j += bw8) {
291*c0909341SAndroid Build Coastguard Worker                     rr[i * 2][j * 2 + 1].ref.ref[0] = (rnd() % 9) - 1;
292*c0909341SAndroid Build Coastguard Worker                     rr[i * 2][j * 2 + 1].ref.ref[1] = (rnd() % 9) - 1;
293*c0909341SAndroid Build Coastguard Worker                     rr[i * 2][j * 2 + 1].bs = bs;
294*c0909341SAndroid Build Coastguard Worker                 }
295*c0909341SAndroid Build Coastguard Worker             bench_new(alternate(c_rp, a_rp), 128, rr, ref_sign, 128, 16, 0, 0);
296*c0909341SAndroid Build Coastguard Worker         }
297*c0909341SAndroid Build Coastguard Worker     }
298*c0909341SAndroid Build Coastguard Worker 
299*c0909341SAndroid Build Coastguard Worker     report("save_tmvs");
300*c0909341SAndroid Build Coastguard Worker }
301*c0909341SAndroid Build Coastguard Worker 
check_splat_mv(const Dav1dRefmvsDSPContext * const c)302*c0909341SAndroid Build Coastguard Worker static void check_splat_mv(const Dav1dRefmvsDSPContext *const c) {
303*c0909341SAndroid Build Coastguard Worker     ALIGN_STK_64(refmvs_block, c_buf, 32 * 32,);
304*c0909341SAndroid Build Coastguard Worker     ALIGN_STK_64(refmvs_block, a_buf, 32 * 32,);
305*c0909341SAndroid Build Coastguard Worker     refmvs_block *c_dst[32];
306*c0909341SAndroid Build Coastguard Worker     refmvs_block *a_dst[32];
307*c0909341SAndroid Build Coastguard Worker     const size_t stride = 32 * sizeof(refmvs_block);
308*c0909341SAndroid Build Coastguard Worker 
309*c0909341SAndroid Build Coastguard Worker     for (int i = 0; i < 32; i++) {
310*c0909341SAndroid Build Coastguard Worker         c_dst[i] = c_buf + 32 * i;
311*c0909341SAndroid Build Coastguard Worker         a_dst[i] = a_buf + 32 * i;
312*c0909341SAndroid Build Coastguard Worker     }
313*c0909341SAndroid Build Coastguard Worker 
314*c0909341SAndroid Build Coastguard Worker     declare_func(void, refmvs_block **rr, const refmvs_block *rmv,
315*c0909341SAndroid Build Coastguard Worker                  int bx4, int bw4, int bh4);
316*c0909341SAndroid Build Coastguard Worker 
317*c0909341SAndroid Build Coastguard Worker     for (int w = 1; w <= 32; w *= 2) {
318*c0909341SAndroid Build Coastguard Worker         if (check_func(c->splat_mv, "splat_mv_w%d", w)) {
319*c0909341SAndroid Build Coastguard Worker             const int h_min = imax(w / 4, 1);
320*c0909341SAndroid Build Coastguard Worker             const int h_max = imin(w * 4, 32);
321*c0909341SAndroid Build Coastguard Worker             const int w_uint32 = w * sizeof(refmvs_block) / sizeof(uint32_t);
322*c0909341SAndroid Build Coastguard Worker             for (int h = h_min; h <= h_max; h *= 2) {
323*c0909341SAndroid Build Coastguard Worker                 const int offset = (int) ((unsigned) w * rnd()) & 31;
324*c0909341SAndroid Build Coastguard Worker                 union {
325*c0909341SAndroid Build Coastguard Worker                     refmvs_block rmv;
326*c0909341SAndroid Build Coastguard Worker                     uint32_t u32[3];
327*c0909341SAndroid Build Coastguard Worker                 } ALIGN(tmp, 16);
328*c0909341SAndroid Build Coastguard Worker                 tmp.u32[0] = rnd();
329*c0909341SAndroid Build Coastguard Worker                 tmp.u32[1] = rnd();
330*c0909341SAndroid Build Coastguard Worker                 tmp.u32[2] = rnd();
331*c0909341SAndroid Build Coastguard Worker 
332*c0909341SAndroid Build Coastguard Worker                 call_ref(c_dst, &tmp.rmv, offset, w, h);
333*c0909341SAndroid Build Coastguard Worker                 call_new(a_dst, &tmp.rmv, offset, w, h);
334*c0909341SAndroid Build Coastguard Worker                 checkasm_check(uint32_t, (uint32_t*)(c_buf + offset), stride,
335*c0909341SAndroid Build Coastguard Worker                                          (uint32_t*)(a_buf + offset), stride,
336*c0909341SAndroid Build Coastguard Worker                                          w_uint32, h, "dst");
337*c0909341SAndroid Build Coastguard Worker 
338*c0909341SAndroid Build Coastguard Worker                 bench_new(a_dst, &tmp.rmv, 0, w, h);
339*c0909341SAndroid Build Coastguard Worker             }
340*c0909341SAndroid Build Coastguard Worker         }
341*c0909341SAndroid Build Coastguard Worker     }
342*c0909341SAndroid Build Coastguard Worker     report("splat_mv");
343*c0909341SAndroid Build Coastguard Worker }
344*c0909341SAndroid Build Coastguard Worker 
checkasm_check_refmvs(void)345*c0909341SAndroid Build Coastguard Worker void checkasm_check_refmvs(void) {
346*c0909341SAndroid Build Coastguard Worker     Dav1dRefmvsDSPContext c;
347*c0909341SAndroid Build Coastguard Worker     dav1d_refmvs_dsp_init(&c);
348*c0909341SAndroid Build Coastguard Worker 
349*c0909341SAndroid Build Coastguard Worker     check_load_tmvs(&c);
350*c0909341SAndroid Build Coastguard Worker     check_save_tmvs(&c);
351*c0909341SAndroid Build Coastguard Worker     check_splat_mv(&c);
352*c0909341SAndroid Build Coastguard Worker }
353