xref: /aosp_15_r20/external/XNNPACK/test/f32-igemm-relu.cc (revision 4bdc94577ba0e567308109d787f7fec7b531ce36)
1*4bdc9457SAndroid Build Coastguard Worker // Copyright (c) Facebook, Inc. and its affiliates.
2*4bdc9457SAndroid Build Coastguard Worker // All rights reserved.
3*4bdc9457SAndroid Build Coastguard Worker //
4*4bdc9457SAndroid Build Coastguard Worker // Copyright 2019 Google LLC
5*4bdc9457SAndroid Build Coastguard Worker //
6*4bdc9457SAndroid Build Coastguard Worker // This source code is licensed under the BSD-style license found in the
7*4bdc9457SAndroid Build Coastguard Worker // LICENSE file in the root directory of this source tree.
8*4bdc9457SAndroid Build Coastguard Worker //
9*4bdc9457SAndroid Build Coastguard Worker // Auto-generated file. Do not edit!
10*4bdc9457SAndroid Build Coastguard Worker //   Specification: test/f32-igemm-relu.yaml
11*4bdc9457SAndroid Build Coastguard Worker //   Generator: tools/generate-gemm-test.py
12*4bdc9457SAndroid Build Coastguard Worker 
13*4bdc9457SAndroid Build Coastguard Worker 
14*4bdc9457SAndroid Build Coastguard Worker #include <gtest/gtest.h>
15*4bdc9457SAndroid Build Coastguard Worker 
16*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/allocator.h>
17*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/common.h>
18*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/isa-checks.h>
19*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/microparams-init.h>
20*4bdc9457SAndroid Build Coastguard Worker 
21*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/gemm.h>
22*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/igemm.h>
23*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/ppmm.h>
24*4bdc9457SAndroid Build Coastguard Worker #include "gemm-microkernel-tester.h"
25*4bdc9457SAndroid Build Coastguard Worker 
26*4bdc9457SAndroid Build Coastguard Worker 
27*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,k_eq_4)28*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, k_eq_4) {
29*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
30*4bdc9457SAndroid Build Coastguard Worker       .mr(1)
31*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
32*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
33*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
34*4bdc9457SAndroid Build Coastguard Worker       .m(1)
35*4bdc9457SAndroid Build Coastguard Worker       .n(8)
36*4bdc9457SAndroid Build Coastguard Worker       .k(4)
37*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
38*4bdc9457SAndroid Build Coastguard Worker   }
39*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,strided_cn)40*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, strided_cn) {
41*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
42*4bdc9457SAndroid Build Coastguard Worker       .mr(1)
43*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
44*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
45*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
46*4bdc9457SAndroid Build Coastguard Worker       .m(1)
47*4bdc9457SAndroid Build Coastguard Worker       .n(8)
48*4bdc9457SAndroid Build Coastguard Worker       .k(4)
49*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(11)
50*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
51*4bdc9457SAndroid Build Coastguard Worker   }
52*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,k_eq_4_subtile)53*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, k_eq_4_subtile) {
54*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
55*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 1; m++) {
56*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
57*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
58*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
59*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
60*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
61*4bdc9457SAndroid Build Coastguard Worker           .m(m)
62*4bdc9457SAndroid Build Coastguard Worker           .n(n)
63*4bdc9457SAndroid Build Coastguard Worker           .k(4)
64*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
65*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
66*4bdc9457SAndroid Build Coastguard Worker       }
67*4bdc9457SAndroid Build Coastguard Worker     }
68*4bdc9457SAndroid Build Coastguard Worker   }
69*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,k_eq_4_subtile_m)70*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, k_eq_4_subtile_m) {
71*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 1; m++) {
72*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
73*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
74*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
75*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
76*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
77*4bdc9457SAndroid Build Coastguard Worker         .m(m)
78*4bdc9457SAndroid Build Coastguard Worker         .n(8)
79*4bdc9457SAndroid Build Coastguard Worker         .k(4)
80*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
81*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
82*4bdc9457SAndroid Build Coastguard Worker     }
83*4bdc9457SAndroid Build Coastguard Worker   }
84*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,k_eq_4_subtile_n)85*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, k_eq_4_subtile_n) {
86*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
87*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
88*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
89*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
90*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
91*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
92*4bdc9457SAndroid Build Coastguard Worker         .m(1)
93*4bdc9457SAndroid Build Coastguard Worker         .n(n)
94*4bdc9457SAndroid Build Coastguard Worker         .k(4)
95*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
96*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
97*4bdc9457SAndroid Build Coastguard Worker     }
98*4bdc9457SAndroid Build Coastguard Worker   }
99*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,k_lt_4)100*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, k_lt_4) {
101*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
102*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
103*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
104*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
105*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
106*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
107*4bdc9457SAndroid Build Coastguard Worker         .m(1)
108*4bdc9457SAndroid Build Coastguard Worker         .n(8)
109*4bdc9457SAndroid Build Coastguard Worker         .k(k)
110*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
111*4bdc9457SAndroid Build Coastguard Worker     }
112*4bdc9457SAndroid Build Coastguard Worker   }
113*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,k_lt_4_subtile)114*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, k_lt_4_subtile) {
115*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
116*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
117*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
118*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
119*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
120*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
121*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
122*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
123*4bdc9457SAndroid Build Coastguard Worker             .m(m)
124*4bdc9457SAndroid Build Coastguard Worker             .n(n)
125*4bdc9457SAndroid Build Coastguard Worker             .k(k)
126*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
127*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
128*4bdc9457SAndroid Build Coastguard Worker         }
129*4bdc9457SAndroid Build Coastguard Worker       }
130*4bdc9457SAndroid Build Coastguard Worker     }
131*4bdc9457SAndroid Build Coastguard Worker   }
132*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,k_gt_4)133*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, k_gt_4) {
134*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
135*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
136*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
137*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
138*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
139*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
140*4bdc9457SAndroid Build Coastguard Worker         .m(1)
141*4bdc9457SAndroid Build Coastguard Worker         .n(8)
142*4bdc9457SAndroid Build Coastguard Worker         .k(k)
143*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
144*4bdc9457SAndroid Build Coastguard Worker     }
145*4bdc9457SAndroid Build Coastguard Worker   }
146*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,k_gt_4_subtile)147*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, k_gt_4_subtile) {
148*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
149*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
150*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
151*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
152*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
153*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
154*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
155*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
156*4bdc9457SAndroid Build Coastguard Worker             .m(m)
157*4bdc9457SAndroid Build Coastguard Worker             .n(n)
158*4bdc9457SAndroid Build Coastguard Worker             .k(k)
159*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
160*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
161*4bdc9457SAndroid Build Coastguard Worker         }
162*4bdc9457SAndroid Build Coastguard Worker       }
163*4bdc9457SAndroid Build Coastguard Worker     }
164*4bdc9457SAndroid Build Coastguard Worker   }
165*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,k_div_4)166*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, k_div_4) {
167*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
168*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
169*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
170*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
171*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
172*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
173*4bdc9457SAndroid Build Coastguard Worker         .m(1)
174*4bdc9457SAndroid Build Coastguard Worker         .n(8)
175*4bdc9457SAndroid Build Coastguard Worker         .k(k)
176*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
177*4bdc9457SAndroid Build Coastguard Worker     }
178*4bdc9457SAndroid Build Coastguard Worker   }
179*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,k_div_4_subtile)180*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, k_div_4_subtile) {
181*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
182*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
183*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
184*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
185*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
186*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
187*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
188*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
189*4bdc9457SAndroid Build Coastguard Worker             .m(m)
190*4bdc9457SAndroid Build Coastguard Worker             .n(n)
191*4bdc9457SAndroid Build Coastguard Worker             .k(k)
192*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
193*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
194*4bdc9457SAndroid Build Coastguard Worker         }
195*4bdc9457SAndroid Build Coastguard Worker       }
196*4bdc9457SAndroid Build Coastguard Worker     }
197*4bdc9457SAndroid Build Coastguard Worker   }
198*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,n_gt_8)199*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, n_gt_8) {
200*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
201*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
202*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
203*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
204*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
205*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
206*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
207*4bdc9457SAndroid Build Coastguard Worker           .m(1)
208*4bdc9457SAndroid Build Coastguard Worker           .n(n)
209*4bdc9457SAndroid Build Coastguard Worker           .k(k)
210*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
211*4bdc9457SAndroid Build Coastguard Worker       }
212*4bdc9457SAndroid Build Coastguard Worker     }
213*4bdc9457SAndroid Build Coastguard Worker   }
214*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,n_gt_8_strided_cn)215*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, n_gt_8_strided_cn) {
216*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
217*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
218*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
219*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
220*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
221*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
222*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
223*4bdc9457SAndroid Build Coastguard Worker           .m(1)
224*4bdc9457SAndroid Build Coastguard Worker           .n(n)
225*4bdc9457SAndroid Build Coastguard Worker           .k(k)
226*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
227*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
228*4bdc9457SAndroid Build Coastguard Worker       }
229*4bdc9457SAndroid Build Coastguard Worker     }
230*4bdc9457SAndroid Build Coastguard Worker   }
231*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,n_gt_8_subtile)232*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, n_gt_8_subtile) {
233*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
234*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
235*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
236*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
237*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
238*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
239*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
240*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
241*4bdc9457SAndroid Build Coastguard Worker             .m(m)
242*4bdc9457SAndroid Build Coastguard Worker             .n(n)
243*4bdc9457SAndroid Build Coastguard Worker             .k(k)
244*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
245*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
246*4bdc9457SAndroid Build Coastguard Worker         }
247*4bdc9457SAndroid Build Coastguard Worker       }
248*4bdc9457SAndroid Build Coastguard Worker     }
249*4bdc9457SAndroid Build Coastguard Worker   }
250*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,n_div_8)251*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, n_div_8) {
252*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
253*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
254*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
255*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
256*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
257*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
258*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
259*4bdc9457SAndroid Build Coastguard Worker           .m(1)
260*4bdc9457SAndroid Build Coastguard Worker           .n(n)
261*4bdc9457SAndroid Build Coastguard Worker           .k(k)
262*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
263*4bdc9457SAndroid Build Coastguard Worker       }
264*4bdc9457SAndroid Build Coastguard Worker     }
265*4bdc9457SAndroid Build Coastguard Worker   }
266*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,n_div_8_strided_cn)267*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, n_div_8_strided_cn) {
268*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
269*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
270*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
271*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
272*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
273*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
274*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
275*4bdc9457SAndroid Build Coastguard Worker           .m(1)
276*4bdc9457SAndroid Build Coastguard Worker           .n(n)
277*4bdc9457SAndroid Build Coastguard Worker           .k(k)
278*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
279*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
280*4bdc9457SAndroid Build Coastguard Worker       }
281*4bdc9457SAndroid Build Coastguard Worker     }
282*4bdc9457SAndroid Build Coastguard Worker   }
283*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,n_div_8_subtile)284*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, n_div_8_subtile) {
285*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
286*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
287*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
288*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
289*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
290*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
291*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
292*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
293*4bdc9457SAndroid Build Coastguard Worker             .m(m)
294*4bdc9457SAndroid Build Coastguard Worker             .n(n)
295*4bdc9457SAndroid Build Coastguard Worker             .k(k)
296*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
297*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
298*4bdc9457SAndroid Build Coastguard Worker         }
299*4bdc9457SAndroid Build Coastguard Worker       }
300*4bdc9457SAndroid Build Coastguard Worker     }
301*4bdc9457SAndroid Build Coastguard Worker   }
302*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,small_kernel)303*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, small_kernel) {
304*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
305*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
306*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
307*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
308*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
309*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
310*4bdc9457SAndroid Build Coastguard Worker         .m(1)
311*4bdc9457SAndroid Build Coastguard Worker         .n(8)
312*4bdc9457SAndroid Build Coastguard Worker         .k(k)
313*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
314*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
315*4bdc9457SAndroid Build Coastguard Worker     }
316*4bdc9457SAndroid Build Coastguard Worker   }
317*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,small_kernel_subtile)318*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, small_kernel_subtile) {
319*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
320*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
321*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
322*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
323*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
324*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
325*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
326*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
327*4bdc9457SAndroid Build Coastguard Worker             .m(m)
328*4bdc9457SAndroid Build Coastguard Worker             .n(n)
329*4bdc9457SAndroid Build Coastguard Worker             .k(k)
330*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
331*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
332*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
333*4bdc9457SAndroid Build Coastguard Worker         }
334*4bdc9457SAndroid Build Coastguard Worker       }
335*4bdc9457SAndroid Build Coastguard Worker     }
336*4bdc9457SAndroid Build Coastguard Worker   }
337*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,n_gt_8_small_kernel)338*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, n_gt_8_small_kernel) {
339*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
340*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
341*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
342*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
343*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
344*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
345*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
346*4bdc9457SAndroid Build Coastguard Worker           .m(1)
347*4bdc9457SAndroid Build Coastguard Worker           .n(n)
348*4bdc9457SAndroid Build Coastguard Worker           .k(k)
349*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
350*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
351*4bdc9457SAndroid Build Coastguard Worker       }
352*4bdc9457SAndroid Build Coastguard Worker     }
353*4bdc9457SAndroid Build Coastguard Worker   }
354*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,n_div_8_small_kernel)355*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, n_div_8_small_kernel) {
356*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
357*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
358*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
359*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
360*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
361*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
362*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
363*4bdc9457SAndroid Build Coastguard Worker           .m(1)
364*4bdc9457SAndroid Build Coastguard Worker           .n(n)
365*4bdc9457SAndroid Build Coastguard Worker           .k(k)
366*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
367*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
368*4bdc9457SAndroid Build Coastguard Worker       }
369*4bdc9457SAndroid Build Coastguard Worker     }
370*4bdc9457SAndroid Build Coastguard Worker   }
371*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,strided_cm_subtile)372*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, strided_cm_subtile) {
373*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
374*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
375*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
376*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
377*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
378*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
379*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
380*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
381*4bdc9457SAndroid Build Coastguard Worker             .m(m)
382*4bdc9457SAndroid Build Coastguard Worker             .n(n)
383*4bdc9457SAndroid Build Coastguard Worker             .k(k)
384*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(11)
385*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
386*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
387*4bdc9457SAndroid Build Coastguard Worker         }
388*4bdc9457SAndroid Build Coastguard Worker       }
389*4bdc9457SAndroid Build Coastguard Worker     }
390*4bdc9457SAndroid Build Coastguard Worker   }
391*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,a_offset)392*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, a_offset) {
393*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
394*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
395*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
396*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
397*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
398*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
399*4bdc9457SAndroid Build Coastguard Worker         .m(1)
400*4bdc9457SAndroid Build Coastguard Worker         .n(8)
401*4bdc9457SAndroid Build Coastguard Worker         .k(k)
402*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
403*4bdc9457SAndroid Build Coastguard Worker         .a_offset(23)
404*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
405*4bdc9457SAndroid Build Coastguard Worker     }
406*4bdc9457SAndroid Build Coastguard Worker   }
407*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,zero)408*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, zero) {
409*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
410*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 1; mz++) {
411*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
412*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
413*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
414*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
415*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
416*4bdc9457SAndroid Build Coastguard Worker           .m(1)
417*4bdc9457SAndroid Build Coastguard Worker           .n(8)
418*4bdc9457SAndroid Build Coastguard Worker           .k(k)
419*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
420*4bdc9457SAndroid Build Coastguard Worker           .a_offset(23)
421*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
422*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
423*4bdc9457SAndroid Build Coastguard Worker       }
424*4bdc9457SAndroid Build Coastguard Worker     }
425*4bdc9457SAndroid Build Coastguard Worker   }
426*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT,strided_cm)427*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMSIMD_SPLAT, strided_cm) {
428*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
429*4bdc9457SAndroid Build Coastguard Worker       .mr(1)
430*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
431*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
432*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
433*4bdc9457SAndroid Build Coastguard Worker       .m(1)
434*4bdc9457SAndroid Build Coastguard Worker       .n(8)
435*4bdc9457SAndroid Build Coastguard Worker       .k(4)
436*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(11)
437*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat);
438*4bdc9457SAndroid Build Coastguard Worker   }
439*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
440*4bdc9457SAndroid Build Coastguard Worker 
441*4bdc9457SAndroid Build Coastguard Worker 
442*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,k_eq_4)443*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, k_eq_4) {
444*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
445*4bdc9457SAndroid Build Coastguard Worker       .mr(1)
446*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
447*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
448*4bdc9457SAndroid Build Coastguard Worker       .sr(4)
449*4bdc9457SAndroid Build Coastguard Worker       .m(1)
450*4bdc9457SAndroid Build Coastguard Worker       .n(8)
451*4bdc9457SAndroid Build Coastguard Worker       .k(4)
452*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
453*4bdc9457SAndroid Build Coastguard Worker   }
454*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,strided_cn)455*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, strided_cn) {
456*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
457*4bdc9457SAndroid Build Coastguard Worker       .mr(1)
458*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
459*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
460*4bdc9457SAndroid Build Coastguard Worker       .sr(4)
461*4bdc9457SAndroid Build Coastguard Worker       .m(1)
462*4bdc9457SAndroid Build Coastguard Worker       .n(8)
463*4bdc9457SAndroid Build Coastguard Worker       .k(4)
464*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(11)
465*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
466*4bdc9457SAndroid Build Coastguard Worker   }
467*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,k_eq_4_subtile)468*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, k_eq_4_subtile) {
469*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
470*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 1; m++) {
471*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
472*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
473*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
474*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
475*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
476*4bdc9457SAndroid Build Coastguard Worker           .m(m)
477*4bdc9457SAndroid Build Coastguard Worker           .n(n)
478*4bdc9457SAndroid Build Coastguard Worker           .k(4)
479*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
480*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
481*4bdc9457SAndroid Build Coastguard Worker       }
482*4bdc9457SAndroid Build Coastguard Worker     }
483*4bdc9457SAndroid Build Coastguard Worker   }
484*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,k_eq_4_subtile_m)485*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, k_eq_4_subtile_m) {
486*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 1; m++) {
487*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
488*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
489*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
490*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
491*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
492*4bdc9457SAndroid Build Coastguard Worker         .m(m)
493*4bdc9457SAndroid Build Coastguard Worker         .n(8)
494*4bdc9457SAndroid Build Coastguard Worker         .k(4)
495*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
496*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
497*4bdc9457SAndroid Build Coastguard Worker     }
498*4bdc9457SAndroid Build Coastguard Worker   }
499*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,k_eq_4_subtile_n)500*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, k_eq_4_subtile_n) {
501*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
502*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
503*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
504*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
505*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
506*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
507*4bdc9457SAndroid Build Coastguard Worker         .m(1)
508*4bdc9457SAndroid Build Coastguard Worker         .n(n)
509*4bdc9457SAndroid Build Coastguard Worker         .k(4)
510*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
511*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
512*4bdc9457SAndroid Build Coastguard Worker     }
513*4bdc9457SAndroid Build Coastguard Worker   }
514*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,k_lt_4)515*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, k_lt_4) {
516*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
517*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
518*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
519*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
520*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
521*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
522*4bdc9457SAndroid Build Coastguard Worker         .m(1)
523*4bdc9457SAndroid Build Coastguard Worker         .n(8)
524*4bdc9457SAndroid Build Coastguard Worker         .k(k)
525*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
526*4bdc9457SAndroid Build Coastguard Worker     }
527*4bdc9457SAndroid Build Coastguard Worker   }
528*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,k_lt_4_subtile)529*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, k_lt_4_subtile) {
530*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
531*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
532*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
533*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
534*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
535*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
536*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
537*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
538*4bdc9457SAndroid Build Coastguard Worker             .m(m)
539*4bdc9457SAndroid Build Coastguard Worker             .n(n)
540*4bdc9457SAndroid Build Coastguard Worker             .k(k)
541*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
542*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
543*4bdc9457SAndroid Build Coastguard Worker         }
544*4bdc9457SAndroid Build Coastguard Worker       }
545*4bdc9457SAndroid Build Coastguard Worker     }
546*4bdc9457SAndroid Build Coastguard Worker   }
547*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,k_gt_4)548*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, k_gt_4) {
549*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
550*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
551*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
552*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
553*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
554*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
555*4bdc9457SAndroid Build Coastguard Worker         .m(1)
556*4bdc9457SAndroid Build Coastguard Worker         .n(8)
557*4bdc9457SAndroid Build Coastguard Worker         .k(k)
558*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
559*4bdc9457SAndroid Build Coastguard Worker     }
560*4bdc9457SAndroid Build Coastguard Worker   }
561*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,k_gt_4_subtile)562*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, k_gt_4_subtile) {
563*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
564*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
565*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
566*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
567*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
568*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
569*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
570*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
571*4bdc9457SAndroid Build Coastguard Worker             .m(m)
572*4bdc9457SAndroid Build Coastguard Worker             .n(n)
573*4bdc9457SAndroid Build Coastguard Worker             .k(k)
574*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
575*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
576*4bdc9457SAndroid Build Coastguard Worker         }
577*4bdc9457SAndroid Build Coastguard Worker       }
578*4bdc9457SAndroid Build Coastguard Worker     }
579*4bdc9457SAndroid Build Coastguard Worker   }
580*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,k_div_4)581*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, k_div_4) {
582*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
583*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
584*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
585*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
586*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
587*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
588*4bdc9457SAndroid Build Coastguard Worker         .m(1)
589*4bdc9457SAndroid Build Coastguard Worker         .n(8)
590*4bdc9457SAndroid Build Coastguard Worker         .k(k)
591*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
592*4bdc9457SAndroid Build Coastguard Worker     }
593*4bdc9457SAndroid Build Coastguard Worker   }
594*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,k_div_4_subtile)595*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, k_div_4_subtile) {
596*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
597*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
598*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
599*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
600*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
601*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
602*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
603*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
604*4bdc9457SAndroid Build Coastguard Worker             .m(m)
605*4bdc9457SAndroid Build Coastguard Worker             .n(n)
606*4bdc9457SAndroid Build Coastguard Worker             .k(k)
607*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
608*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
609*4bdc9457SAndroid Build Coastguard Worker         }
610*4bdc9457SAndroid Build Coastguard Worker       }
611*4bdc9457SAndroid Build Coastguard Worker     }
612*4bdc9457SAndroid Build Coastguard Worker   }
613*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,n_gt_8)614*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, n_gt_8) {
615*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
616*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
617*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
618*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
619*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
620*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
621*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
622*4bdc9457SAndroid Build Coastguard Worker           .m(1)
623*4bdc9457SAndroid Build Coastguard Worker           .n(n)
624*4bdc9457SAndroid Build Coastguard Worker           .k(k)
625*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
626*4bdc9457SAndroid Build Coastguard Worker       }
627*4bdc9457SAndroid Build Coastguard Worker     }
628*4bdc9457SAndroid Build Coastguard Worker   }
629*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,n_gt_8_strided_cn)630*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, n_gt_8_strided_cn) {
631*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
632*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
633*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
634*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
635*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
636*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
637*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
638*4bdc9457SAndroid Build Coastguard Worker           .m(1)
639*4bdc9457SAndroid Build Coastguard Worker           .n(n)
640*4bdc9457SAndroid Build Coastguard Worker           .k(k)
641*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
642*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
643*4bdc9457SAndroid Build Coastguard Worker       }
644*4bdc9457SAndroid Build Coastguard Worker     }
645*4bdc9457SAndroid Build Coastguard Worker   }
646*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,n_gt_8_subtile)647*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, n_gt_8_subtile) {
648*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
649*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
650*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
651*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
652*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
653*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
654*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
655*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
656*4bdc9457SAndroid Build Coastguard Worker             .m(m)
657*4bdc9457SAndroid Build Coastguard Worker             .n(n)
658*4bdc9457SAndroid Build Coastguard Worker             .k(k)
659*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
660*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
661*4bdc9457SAndroid Build Coastguard Worker         }
662*4bdc9457SAndroid Build Coastguard Worker       }
663*4bdc9457SAndroid Build Coastguard Worker     }
664*4bdc9457SAndroid Build Coastguard Worker   }
665*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,n_div_8)666*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, n_div_8) {
667*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
668*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
669*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
670*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
671*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
672*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
673*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
674*4bdc9457SAndroid Build Coastguard Worker           .m(1)
675*4bdc9457SAndroid Build Coastguard Worker           .n(n)
676*4bdc9457SAndroid Build Coastguard Worker           .k(k)
677*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
678*4bdc9457SAndroid Build Coastguard Worker       }
679*4bdc9457SAndroid Build Coastguard Worker     }
680*4bdc9457SAndroid Build Coastguard Worker   }
681*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,n_div_8_strided_cn)682*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, n_div_8_strided_cn) {
683*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
684*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
685*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
686*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
687*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
688*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
689*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
690*4bdc9457SAndroid Build Coastguard Worker           .m(1)
691*4bdc9457SAndroid Build Coastguard Worker           .n(n)
692*4bdc9457SAndroid Build Coastguard Worker           .k(k)
693*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
694*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
695*4bdc9457SAndroid Build Coastguard Worker       }
696*4bdc9457SAndroid Build Coastguard Worker     }
697*4bdc9457SAndroid Build Coastguard Worker   }
698*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,n_div_8_subtile)699*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, n_div_8_subtile) {
700*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
701*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
702*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
703*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
704*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
705*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
706*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
707*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
708*4bdc9457SAndroid Build Coastguard Worker             .m(m)
709*4bdc9457SAndroid Build Coastguard Worker             .n(n)
710*4bdc9457SAndroid Build Coastguard Worker             .k(k)
711*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
712*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
713*4bdc9457SAndroid Build Coastguard Worker         }
714*4bdc9457SAndroid Build Coastguard Worker       }
715*4bdc9457SAndroid Build Coastguard Worker     }
716*4bdc9457SAndroid Build Coastguard Worker   }
717*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,small_kernel)718*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, small_kernel) {
719*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
720*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
721*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
722*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
723*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
724*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
725*4bdc9457SAndroid Build Coastguard Worker         .m(1)
726*4bdc9457SAndroid Build Coastguard Worker         .n(8)
727*4bdc9457SAndroid Build Coastguard Worker         .k(k)
728*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
729*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
730*4bdc9457SAndroid Build Coastguard Worker     }
731*4bdc9457SAndroid Build Coastguard Worker   }
732*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,small_kernel_subtile)733*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, small_kernel_subtile) {
734*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
735*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
736*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
737*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
738*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
739*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
740*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
741*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
742*4bdc9457SAndroid Build Coastguard Worker             .m(m)
743*4bdc9457SAndroid Build Coastguard Worker             .n(n)
744*4bdc9457SAndroid Build Coastguard Worker             .k(k)
745*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
746*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
747*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
748*4bdc9457SAndroid Build Coastguard Worker         }
749*4bdc9457SAndroid Build Coastguard Worker       }
750*4bdc9457SAndroid Build Coastguard Worker     }
751*4bdc9457SAndroid Build Coastguard Worker   }
752*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,n_gt_8_small_kernel)753*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, n_gt_8_small_kernel) {
754*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
755*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
756*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
757*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
758*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
759*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
760*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
761*4bdc9457SAndroid Build Coastguard Worker           .m(1)
762*4bdc9457SAndroid Build Coastguard Worker           .n(n)
763*4bdc9457SAndroid Build Coastguard Worker           .k(k)
764*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
765*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
766*4bdc9457SAndroid Build Coastguard Worker       }
767*4bdc9457SAndroid Build Coastguard Worker     }
768*4bdc9457SAndroid Build Coastguard Worker   }
769*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,n_div_8_small_kernel)770*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, n_div_8_small_kernel) {
771*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
772*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
773*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
774*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
775*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
776*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
777*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
778*4bdc9457SAndroid Build Coastguard Worker           .m(1)
779*4bdc9457SAndroid Build Coastguard Worker           .n(n)
780*4bdc9457SAndroid Build Coastguard Worker           .k(k)
781*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
782*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
783*4bdc9457SAndroid Build Coastguard Worker       }
784*4bdc9457SAndroid Build Coastguard Worker     }
785*4bdc9457SAndroid Build Coastguard Worker   }
786*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,strided_cm_subtile)787*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, strided_cm_subtile) {
788*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
789*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
790*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
791*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
792*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
793*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
794*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
795*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
796*4bdc9457SAndroid Build Coastguard Worker             .m(m)
797*4bdc9457SAndroid Build Coastguard Worker             .n(n)
798*4bdc9457SAndroid Build Coastguard Worker             .k(k)
799*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(11)
800*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
801*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
802*4bdc9457SAndroid Build Coastguard Worker         }
803*4bdc9457SAndroid Build Coastguard Worker       }
804*4bdc9457SAndroid Build Coastguard Worker     }
805*4bdc9457SAndroid Build Coastguard Worker   }
806*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,a_offset)807*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, a_offset) {
808*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
809*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
810*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
811*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
812*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
813*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
814*4bdc9457SAndroid Build Coastguard Worker         .m(1)
815*4bdc9457SAndroid Build Coastguard Worker         .n(8)
816*4bdc9457SAndroid Build Coastguard Worker         .k(k)
817*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
818*4bdc9457SAndroid Build Coastguard Worker         .a_offset(23)
819*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
820*4bdc9457SAndroid Build Coastguard Worker     }
821*4bdc9457SAndroid Build Coastguard Worker   }
822*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,zero)823*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, zero) {
824*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
825*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 1; mz++) {
826*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
827*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
828*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
829*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
830*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
831*4bdc9457SAndroid Build Coastguard Worker           .m(1)
832*4bdc9457SAndroid Build Coastguard Worker           .n(8)
833*4bdc9457SAndroid Build Coastguard Worker           .k(k)
834*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
835*4bdc9457SAndroid Build Coastguard Worker           .a_offset(23)
836*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
837*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
838*4bdc9457SAndroid Build Coastguard Worker       }
839*4bdc9457SAndroid Build Coastguard Worker     }
840*4bdc9457SAndroid Build Coastguard Worker   }
841*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD,strided_cm)842*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMSIMD, strided_cm) {
843*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
844*4bdc9457SAndroid Build Coastguard Worker       .mr(1)
845*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
846*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
847*4bdc9457SAndroid Build Coastguard Worker       .sr(4)
848*4bdc9457SAndroid Build Coastguard Worker       .m(1)
849*4bdc9457SAndroid Build Coastguard Worker       .n(8)
850*4bdc9457SAndroid Build Coastguard Worker       .k(4)
851*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(11)
852*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd);
853*4bdc9457SAndroid Build Coastguard Worker   }
854*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
855*4bdc9457SAndroid Build Coastguard Worker 
856*4bdc9457SAndroid Build Coastguard Worker 
857*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,k_eq_1)858*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, k_eq_1) {
859*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
860*4bdc9457SAndroid Build Coastguard Worker       .mr(3)
861*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
862*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
863*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
864*4bdc9457SAndroid Build Coastguard Worker       .m(3)
865*4bdc9457SAndroid Build Coastguard Worker       .n(8)
866*4bdc9457SAndroid Build Coastguard Worker       .k(1)
867*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
868*4bdc9457SAndroid Build Coastguard Worker   }
869*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,strided_cn)870*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, strided_cn) {
871*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
872*4bdc9457SAndroid Build Coastguard Worker       .mr(3)
873*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
874*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
875*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
876*4bdc9457SAndroid Build Coastguard Worker       .m(3)
877*4bdc9457SAndroid Build Coastguard Worker       .n(8)
878*4bdc9457SAndroid Build Coastguard Worker       .k(1)
879*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(11)
880*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
881*4bdc9457SAndroid Build Coastguard Worker   }
882*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile)883*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile) {
884*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
885*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 3; m++) {
886*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
887*4bdc9457SAndroid Build Coastguard Worker           .mr(3)
888*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
889*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
890*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
891*4bdc9457SAndroid Build Coastguard Worker           .m(m)
892*4bdc9457SAndroid Build Coastguard Worker           .n(n)
893*4bdc9457SAndroid Build Coastguard Worker           .k(1)
894*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
895*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
896*4bdc9457SAndroid Build Coastguard Worker       }
897*4bdc9457SAndroid Build Coastguard Worker     }
898*4bdc9457SAndroid Build Coastguard Worker   }
899*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile_m)900*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_m) {
901*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 3; m++) {
902*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
903*4bdc9457SAndroid Build Coastguard Worker         .mr(3)
904*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
905*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
906*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
907*4bdc9457SAndroid Build Coastguard Worker         .m(m)
908*4bdc9457SAndroid Build Coastguard Worker         .n(8)
909*4bdc9457SAndroid Build Coastguard Worker         .k(1)
910*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
911*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
912*4bdc9457SAndroid Build Coastguard Worker     }
913*4bdc9457SAndroid Build Coastguard Worker   }
914*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile_n)915*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_n) {
916*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
917*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
918*4bdc9457SAndroid Build Coastguard Worker         .mr(3)
919*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
920*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
921*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
922*4bdc9457SAndroid Build Coastguard Worker         .m(3)
923*4bdc9457SAndroid Build Coastguard Worker         .n(n)
924*4bdc9457SAndroid Build Coastguard Worker         .k(1)
925*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
926*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
927*4bdc9457SAndroid Build Coastguard Worker     }
928*4bdc9457SAndroid Build Coastguard Worker   }
929*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,k_gt_1)930*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, k_gt_1) {
931*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 2; k < 10; k++) {
932*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
933*4bdc9457SAndroid Build Coastguard Worker         .mr(3)
934*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
935*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
936*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
937*4bdc9457SAndroid Build Coastguard Worker         .m(3)
938*4bdc9457SAndroid Build Coastguard Worker         .n(8)
939*4bdc9457SAndroid Build Coastguard Worker         .k(k)
940*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
941*4bdc9457SAndroid Build Coastguard Worker     }
942*4bdc9457SAndroid Build Coastguard Worker   }
943*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,k_gt_1_subtile)944*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, k_gt_1_subtile) {
945*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 2; k < 10; k++) {
946*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
947*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 3; m++) {
948*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
949*4bdc9457SAndroid Build Coastguard Worker             .mr(3)
950*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
951*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
952*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
953*4bdc9457SAndroid Build Coastguard Worker             .m(m)
954*4bdc9457SAndroid Build Coastguard Worker             .n(n)
955*4bdc9457SAndroid Build Coastguard Worker             .k(k)
956*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
957*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
958*4bdc9457SAndroid Build Coastguard Worker         }
959*4bdc9457SAndroid Build Coastguard Worker       }
960*4bdc9457SAndroid Build Coastguard Worker     }
961*4bdc9457SAndroid Build Coastguard Worker   }
962*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,n_gt_8)963*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, n_gt_8) {
964*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
965*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
966*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
967*4bdc9457SAndroid Build Coastguard Worker           .mr(3)
968*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
969*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
970*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
971*4bdc9457SAndroid Build Coastguard Worker           .m(3)
972*4bdc9457SAndroid Build Coastguard Worker           .n(n)
973*4bdc9457SAndroid Build Coastguard Worker           .k(k)
974*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
975*4bdc9457SAndroid Build Coastguard Worker       }
976*4bdc9457SAndroid Build Coastguard Worker     }
977*4bdc9457SAndroid Build Coastguard Worker   }
978*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,n_gt_8_strided_cn)979*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_cn) {
980*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
981*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
982*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
983*4bdc9457SAndroid Build Coastguard Worker           .mr(3)
984*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
985*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
986*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
987*4bdc9457SAndroid Build Coastguard Worker           .m(3)
988*4bdc9457SAndroid Build Coastguard Worker           .n(n)
989*4bdc9457SAndroid Build Coastguard Worker           .k(k)
990*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
991*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
992*4bdc9457SAndroid Build Coastguard Worker       }
993*4bdc9457SAndroid Build Coastguard Worker     }
994*4bdc9457SAndroid Build Coastguard Worker   }
995*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,n_gt_8_subtile)996*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, n_gt_8_subtile) {
997*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
998*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
999*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 3; m++) {
1000*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
1001*4bdc9457SAndroid Build Coastguard Worker             .mr(3)
1002*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
1003*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
1004*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
1005*4bdc9457SAndroid Build Coastguard Worker             .m(m)
1006*4bdc9457SAndroid Build Coastguard Worker             .n(n)
1007*4bdc9457SAndroid Build Coastguard Worker             .k(k)
1008*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
1009*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
1010*4bdc9457SAndroid Build Coastguard Worker         }
1011*4bdc9457SAndroid Build Coastguard Worker       }
1012*4bdc9457SAndroid Build Coastguard Worker     }
1013*4bdc9457SAndroid Build Coastguard Worker   }
1014*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,n_div_8)1015*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, n_div_8) {
1016*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
1017*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
1018*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1019*4bdc9457SAndroid Build Coastguard Worker           .mr(3)
1020*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1021*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1022*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1023*4bdc9457SAndroid Build Coastguard Worker           .m(3)
1024*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1025*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1026*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
1027*4bdc9457SAndroid Build Coastguard Worker       }
1028*4bdc9457SAndroid Build Coastguard Worker     }
1029*4bdc9457SAndroid Build Coastguard Worker   }
1030*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,n_div_8_strided_cn)1031*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, n_div_8_strided_cn) {
1032*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
1033*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
1034*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1035*4bdc9457SAndroid Build Coastguard Worker           .mr(3)
1036*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1037*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1038*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1039*4bdc9457SAndroid Build Coastguard Worker           .m(3)
1040*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1041*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1042*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
1043*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
1044*4bdc9457SAndroid Build Coastguard Worker       }
1045*4bdc9457SAndroid Build Coastguard Worker     }
1046*4bdc9457SAndroid Build Coastguard Worker   }
1047*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,n_div_8_subtile)1048*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, n_div_8_subtile) {
1049*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
1050*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
1051*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 3; m++) {
1052*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
1053*4bdc9457SAndroid Build Coastguard Worker             .mr(3)
1054*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
1055*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
1056*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
1057*4bdc9457SAndroid Build Coastguard Worker             .m(m)
1058*4bdc9457SAndroid Build Coastguard Worker             .n(n)
1059*4bdc9457SAndroid Build Coastguard Worker             .k(k)
1060*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
1061*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
1062*4bdc9457SAndroid Build Coastguard Worker         }
1063*4bdc9457SAndroid Build Coastguard Worker       }
1064*4bdc9457SAndroid Build Coastguard Worker     }
1065*4bdc9457SAndroid Build Coastguard Worker   }
1066*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,small_kernel)1067*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, small_kernel) {
1068*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
1069*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
1070*4bdc9457SAndroid Build Coastguard Worker         .mr(3)
1071*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
1072*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
1073*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
1074*4bdc9457SAndroid Build Coastguard Worker         .m(3)
1075*4bdc9457SAndroid Build Coastguard Worker         .n(8)
1076*4bdc9457SAndroid Build Coastguard Worker         .k(k)
1077*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
1078*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
1079*4bdc9457SAndroid Build Coastguard Worker     }
1080*4bdc9457SAndroid Build Coastguard Worker   }
1081*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,small_kernel_subtile)1082*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, small_kernel_subtile) {
1083*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
1084*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
1085*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 3; m++) {
1086*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
1087*4bdc9457SAndroid Build Coastguard Worker             .mr(3)
1088*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
1089*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
1090*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
1091*4bdc9457SAndroid Build Coastguard Worker             .m(m)
1092*4bdc9457SAndroid Build Coastguard Worker             .n(n)
1093*4bdc9457SAndroid Build Coastguard Worker             .k(k)
1094*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
1095*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
1096*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
1097*4bdc9457SAndroid Build Coastguard Worker         }
1098*4bdc9457SAndroid Build Coastguard Worker       }
1099*4bdc9457SAndroid Build Coastguard Worker     }
1100*4bdc9457SAndroid Build Coastguard Worker   }
1101*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,n_gt_8_small_kernel)1102*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, n_gt_8_small_kernel) {
1103*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
1104*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
1105*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1106*4bdc9457SAndroid Build Coastguard Worker           .mr(3)
1107*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1108*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1109*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1110*4bdc9457SAndroid Build Coastguard Worker           .m(3)
1111*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1112*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1113*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
1114*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
1115*4bdc9457SAndroid Build Coastguard Worker       }
1116*4bdc9457SAndroid Build Coastguard Worker     }
1117*4bdc9457SAndroid Build Coastguard Worker   }
1118*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,n_div_8_small_kernel)1119*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, n_div_8_small_kernel) {
1120*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
1121*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
1122*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1123*4bdc9457SAndroid Build Coastguard Worker           .mr(3)
1124*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1125*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1126*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1127*4bdc9457SAndroid Build Coastguard Worker           .m(3)
1128*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1129*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1130*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
1131*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
1132*4bdc9457SAndroid Build Coastguard Worker       }
1133*4bdc9457SAndroid Build Coastguard Worker     }
1134*4bdc9457SAndroid Build Coastguard Worker   }
1135*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,strided_cm_subtile)1136*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, strided_cm_subtile) {
1137*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
1138*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
1139*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 3; m++) {
1140*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
1141*4bdc9457SAndroid Build Coastguard Worker             .mr(3)
1142*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
1143*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
1144*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
1145*4bdc9457SAndroid Build Coastguard Worker             .m(m)
1146*4bdc9457SAndroid Build Coastguard Worker             .n(n)
1147*4bdc9457SAndroid Build Coastguard Worker             .k(k)
1148*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(11)
1149*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
1150*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
1151*4bdc9457SAndroid Build Coastguard Worker         }
1152*4bdc9457SAndroid Build Coastguard Worker       }
1153*4bdc9457SAndroid Build Coastguard Worker     }
1154*4bdc9457SAndroid Build Coastguard Worker   }
1155*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,a_offset)1156*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, a_offset) {
1157*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
1158*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
1159*4bdc9457SAndroid Build Coastguard Worker         .mr(3)
1160*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
1161*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
1162*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
1163*4bdc9457SAndroid Build Coastguard Worker         .m(3)
1164*4bdc9457SAndroid Build Coastguard Worker         .n(8)
1165*4bdc9457SAndroid Build Coastguard Worker         .k(k)
1166*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
1167*4bdc9457SAndroid Build Coastguard Worker         .a_offset(17)
1168*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
1169*4bdc9457SAndroid Build Coastguard Worker     }
1170*4bdc9457SAndroid Build Coastguard Worker   }
1171*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,zero)1172*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, zero) {
1173*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
1174*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 3; mz++) {
1175*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1176*4bdc9457SAndroid Build Coastguard Worker           .mr(3)
1177*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1178*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1179*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1180*4bdc9457SAndroid Build Coastguard Worker           .m(3)
1181*4bdc9457SAndroid Build Coastguard Worker           .n(8)
1182*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1183*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
1184*4bdc9457SAndroid Build Coastguard Worker           .a_offset(17)
1185*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
1186*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
1187*4bdc9457SAndroid Build Coastguard Worker       }
1188*4bdc9457SAndroid Build Coastguard Worker     }
1189*4bdc9457SAndroid Build Coastguard Worker   }
1190*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT,strided_cm)1191*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMSIMD_LOADSPLAT, strided_cm) {
1192*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
1193*4bdc9457SAndroid Build Coastguard Worker       .mr(3)
1194*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
1195*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
1196*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
1197*4bdc9457SAndroid Build Coastguard Worker       .m(3)
1198*4bdc9457SAndroid Build Coastguard Worker       .n(8)
1199*4bdc9457SAndroid Build Coastguard Worker       .k(1)
1200*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(11)
1201*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat);
1202*4bdc9457SAndroid Build Coastguard Worker   }
1203*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
1204*4bdc9457SAndroid Build Coastguard Worker 
1205*4bdc9457SAndroid Build Coastguard Worker 
1206*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,k_eq_1)1207*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, k_eq_1) {
1208*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
1209*4bdc9457SAndroid Build Coastguard Worker       .mr(4)
1210*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
1211*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
1212*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
1213*4bdc9457SAndroid Build Coastguard Worker       .m(4)
1214*4bdc9457SAndroid Build Coastguard Worker       .n(8)
1215*4bdc9457SAndroid Build Coastguard Worker       .k(1)
1216*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1217*4bdc9457SAndroid Build Coastguard Worker   }
1218*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,strided_cn)1219*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, strided_cn) {
1220*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
1221*4bdc9457SAndroid Build Coastguard Worker       .mr(4)
1222*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
1223*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
1224*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
1225*4bdc9457SAndroid Build Coastguard Worker       .m(4)
1226*4bdc9457SAndroid Build Coastguard Worker       .n(8)
1227*4bdc9457SAndroid Build Coastguard Worker       .k(1)
1228*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(11)
1229*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1230*4bdc9457SAndroid Build Coastguard Worker   }
1231*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile)1232*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile) {
1233*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
1234*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 4; m++) {
1235*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1236*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
1237*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1238*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1239*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1240*4bdc9457SAndroid Build Coastguard Worker           .m(m)
1241*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1242*4bdc9457SAndroid Build Coastguard Worker           .k(1)
1243*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
1244*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1245*4bdc9457SAndroid Build Coastguard Worker       }
1246*4bdc9457SAndroid Build Coastguard Worker     }
1247*4bdc9457SAndroid Build Coastguard Worker   }
1248*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile_m)1249*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_m) {
1250*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 4; m++) {
1251*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
1252*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
1253*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
1254*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
1255*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
1256*4bdc9457SAndroid Build Coastguard Worker         .m(m)
1257*4bdc9457SAndroid Build Coastguard Worker         .n(8)
1258*4bdc9457SAndroid Build Coastguard Worker         .k(1)
1259*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
1260*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1261*4bdc9457SAndroid Build Coastguard Worker     }
1262*4bdc9457SAndroid Build Coastguard Worker   }
1263*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile_n)1264*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_n) {
1265*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
1266*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
1267*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
1268*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
1269*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
1270*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
1271*4bdc9457SAndroid Build Coastguard Worker         .m(4)
1272*4bdc9457SAndroid Build Coastguard Worker         .n(n)
1273*4bdc9457SAndroid Build Coastguard Worker         .k(1)
1274*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
1275*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1276*4bdc9457SAndroid Build Coastguard Worker     }
1277*4bdc9457SAndroid Build Coastguard Worker   }
1278*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,k_gt_1)1279*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, k_gt_1) {
1280*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 2; k < 10; k++) {
1281*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
1282*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
1283*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
1284*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
1285*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
1286*4bdc9457SAndroid Build Coastguard Worker         .m(4)
1287*4bdc9457SAndroid Build Coastguard Worker         .n(8)
1288*4bdc9457SAndroid Build Coastguard Worker         .k(k)
1289*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1290*4bdc9457SAndroid Build Coastguard Worker     }
1291*4bdc9457SAndroid Build Coastguard Worker   }
1292*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,k_gt_1_subtile)1293*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, k_gt_1_subtile) {
1294*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 2; k < 10; k++) {
1295*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
1296*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
1297*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
1298*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
1299*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
1300*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
1301*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
1302*4bdc9457SAndroid Build Coastguard Worker             .m(m)
1303*4bdc9457SAndroid Build Coastguard Worker             .n(n)
1304*4bdc9457SAndroid Build Coastguard Worker             .k(k)
1305*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
1306*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1307*4bdc9457SAndroid Build Coastguard Worker         }
1308*4bdc9457SAndroid Build Coastguard Worker       }
1309*4bdc9457SAndroid Build Coastguard Worker     }
1310*4bdc9457SAndroid Build Coastguard Worker   }
1311*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,n_gt_8)1312*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, n_gt_8) {
1313*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
1314*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
1315*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1316*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
1317*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1318*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1319*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1320*4bdc9457SAndroid Build Coastguard Worker           .m(4)
1321*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1322*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1323*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1324*4bdc9457SAndroid Build Coastguard Worker       }
1325*4bdc9457SAndroid Build Coastguard Worker     }
1326*4bdc9457SAndroid Build Coastguard Worker   }
1327*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,n_gt_8_strided_cn)1328*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_cn) {
1329*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
1330*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
1331*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1332*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
1333*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1334*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1335*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1336*4bdc9457SAndroid Build Coastguard Worker           .m(4)
1337*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1338*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1339*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
1340*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1341*4bdc9457SAndroid Build Coastguard Worker       }
1342*4bdc9457SAndroid Build Coastguard Worker     }
1343*4bdc9457SAndroid Build Coastguard Worker   }
1344*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,n_gt_8_subtile)1345*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, n_gt_8_subtile) {
1346*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
1347*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
1348*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
1349*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
1350*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
1351*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
1352*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
1353*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
1354*4bdc9457SAndroid Build Coastguard Worker             .m(m)
1355*4bdc9457SAndroid Build Coastguard Worker             .n(n)
1356*4bdc9457SAndroid Build Coastguard Worker             .k(k)
1357*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
1358*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1359*4bdc9457SAndroid Build Coastguard Worker         }
1360*4bdc9457SAndroid Build Coastguard Worker       }
1361*4bdc9457SAndroid Build Coastguard Worker     }
1362*4bdc9457SAndroid Build Coastguard Worker   }
1363*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,n_div_8)1364*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, n_div_8) {
1365*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
1366*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
1367*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1368*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
1369*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1370*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1371*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1372*4bdc9457SAndroid Build Coastguard Worker           .m(4)
1373*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1374*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1375*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1376*4bdc9457SAndroid Build Coastguard Worker       }
1377*4bdc9457SAndroid Build Coastguard Worker     }
1378*4bdc9457SAndroid Build Coastguard Worker   }
1379*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,n_div_8_strided_cn)1380*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, n_div_8_strided_cn) {
1381*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
1382*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
1383*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1384*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
1385*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1386*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1387*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1388*4bdc9457SAndroid Build Coastguard Worker           .m(4)
1389*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1390*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1391*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
1392*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1393*4bdc9457SAndroid Build Coastguard Worker       }
1394*4bdc9457SAndroid Build Coastguard Worker     }
1395*4bdc9457SAndroid Build Coastguard Worker   }
1396*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,n_div_8_subtile)1397*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, n_div_8_subtile) {
1398*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
1399*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
1400*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
1401*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
1402*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
1403*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
1404*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
1405*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
1406*4bdc9457SAndroid Build Coastguard Worker             .m(m)
1407*4bdc9457SAndroid Build Coastguard Worker             .n(n)
1408*4bdc9457SAndroid Build Coastguard Worker             .k(k)
1409*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
1410*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1411*4bdc9457SAndroid Build Coastguard Worker         }
1412*4bdc9457SAndroid Build Coastguard Worker       }
1413*4bdc9457SAndroid Build Coastguard Worker     }
1414*4bdc9457SAndroid Build Coastguard Worker   }
1415*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,small_kernel)1416*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, small_kernel) {
1417*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
1418*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
1419*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
1420*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
1421*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
1422*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
1423*4bdc9457SAndroid Build Coastguard Worker         .m(4)
1424*4bdc9457SAndroid Build Coastguard Worker         .n(8)
1425*4bdc9457SAndroid Build Coastguard Worker         .k(k)
1426*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
1427*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1428*4bdc9457SAndroid Build Coastguard Worker     }
1429*4bdc9457SAndroid Build Coastguard Worker   }
1430*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,small_kernel_subtile)1431*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, small_kernel_subtile) {
1432*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
1433*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
1434*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
1435*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
1436*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
1437*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
1438*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
1439*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
1440*4bdc9457SAndroid Build Coastguard Worker             .m(m)
1441*4bdc9457SAndroid Build Coastguard Worker             .n(n)
1442*4bdc9457SAndroid Build Coastguard Worker             .k(k)
1443*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
1444*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
1445*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1446*4bdc9457SAndroid Build Coastguard Worker         }
1447*4bdc9457SAndroid Build Coastguard Worker       }
1448*4bdc9457SAndroid Build Coastguard Worker     }
1449*4bdc9457SAndroid Build Coastguard Worker   }
1450*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,n_gt_8_small_kernel)1451*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, n_gt_8_small_kernel) {
1452*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
1453*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
1454*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1455*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
1456*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1457*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1458*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1459*4bdc9457SAndroid Build Coastguard Worker           .m(4)
1460*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1461*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1462*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
1463*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1464*4bdc9457SAndroid Build Coastguard Worker       }
1465*4bdc9457SAndroid Build Coastguard Worker     }
1466*4bdc9457SAndroid Build Coastguard Worker   }
1467*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,n_div_8_small_kernel)1468*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, n_div_8_small_kernel) {
1469*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
1470*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
1471*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1472*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
1473*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1474*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1475*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1476*4bdc9457SAndroid Build Coastguard Worker           .m(4)
1477*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1478*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1479*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
1480*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1481*4bdc9457SAndroid Build Coastguard Worker       }
1482*4bdc9457SAndroid Build Coastguard Worker     }
1483*4bdc9457SAndroid Build Coastguard Worker   }
1484*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,strided_cm_subtile)1485*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, strided_cm_subtile) {
1486*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
1487*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
1488*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
1489*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
1490*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
1491*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
1492*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
1493*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
1494*4bdc9457SAndroid Build Coastguard Worker             .m(m)
1495*4bdc9457SAndroid Build Coastguard Worker             .n(n)
1496*4bdc9457SAndroid Build Coastguard Worker             .k(k)
1497*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(11)
1498*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
1499*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1500*4bdc9457SAndroid Build Coastguard Worker         }
1501*4bdc9457SAndroid Build Coastguard Worker       }
1502*4bdc9457SAndroid Build Coastguard Worker     }
1503*4bdc9457SAndroid Build Coastguard Worker   }
1504*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,a_offset)1505*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, a_offset) {
1506*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
1507*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
1508*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
1509*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
1510*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
1511*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
1512*4bdc9457SAndroid Build Coastguard Worker         .m(4)
1513*4bdc9457SAndroid Build Coastguard Worker         .n(8)
1514*4bdc9457SAndroid Build Coastguard Worker         .k(k)
1515*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
1516*4bdc9457SAndroid Build Coastguard Worker         .a_offset(23)
1517*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1518*4bdc9457SAndroid Build Coastguard Worker     }
1519*4bdc9457SAndroid Build Coastguard Worker   }
1520*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,zero)1521*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, zero) {
1522*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
1523*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 4; mz++) {
1524*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1525*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
1526*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1527*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1528*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1529*4bdc9457SAndroid Build Coastguard Worker           .m(4)
1530*4bdc9457SAndroid Build Coastguard Worker           .n(8)
1531*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1532*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
1533*4bdc9457SAndroid Build Coastguard Worker           .a_offset(23)
1534*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
1535*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1536*4bdc9457SAndroid Build Coastguard Worker       }
1537*4bdc9457SAndroid Build Coastguard Worker     }
1538*4bdc9457SAndroid Build Coastguard Worker   }
1539*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT,strided_cm)1540*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_LOADSPLAT, strided_cm) {
1541*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
1542*4bdc9457SAndroid Build Coastguard Worker       .mr(4)
1543*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
1544*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
1545*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
1546*4bdc9457SAndroid Build Coastguard Worker       .m(4)
1547*4bdc9457SAndroid Build Coastguard Worker       .n(8)
1548*4bdc9457SAndroid Build Coastguard Worker       .k(1)
1549*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(11)
1550*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1551*4bdc9457SAndroid Build Coastguard Worker   }
1552*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
1553*4bdc9457SAndroid Build Coastguard Worker 
1554*4bdc9457SAndroid Build Coastguard Worker 
1555*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,k_eq_4)1556*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, k_eq_4) {
1557*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
1558*4bdc9457SAndroid Build Coastguard Worker       .mr(4)
1559*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
1560*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
1561*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
1562*4bdc9457SAndroid Build Coastguard Worker       .m(4)
1563*4bdc9457SAndroid Build Coastguard Worker       .n(8)
1564*4bdc9457SAndroid Build Coastguard Worker       .k(4)
1565*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1566*4bdc9457SAndroid Build Coastguard Worker   }
1567*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,strided_cn)1568*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, strided_cn) {
1569*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
1570*4bdc9457SAndroid Build Coastguard Worker       .mr(4)
1571*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
1572*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
1573*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
1574*4bdc9457SAndroid Build Coastguard Worker       .m(4)
1575*4bdc9457SAndroid Build Coastguard Worker       .n(8)
1576*4bdc9457SAndroid Build Coastguard Worker       .k(4)
1577*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(11)
1578*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1579*4bdc9457SAndroid Build Coastguard Worker   }
1580*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,k_eq_4_subtile)1581*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, k_eq_4_subtile) {
1582*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
1583*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 4; m++) {
1584*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1585*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
1586*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1587*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1588*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1589*4bdc9457SAndroid Build Coastguard Worker           .m(m)
1590*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1591*4bdc9457SAndroid Build Coastguard Worker           .k(4)
1592*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
1593*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1594*4bdc9457SAndroid Build Coastguard Worker       }
1595*4bdc9457SAndroid Build Coastguard Worker     }
1596*4bdc9457SAndroid Build Coastguard Worker   }
1597*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,k_eq_4_subtile_m)1598*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, k_eq_4_subtile_m) {
1599*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 4; m++) {
1600*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
1601*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
1602*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
1603*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
1604*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
1605*4bdc9457SAndroid Build Coastguard Worker         .m(m)
1606*4bdc9457SAndroid Build Coastguard Worker         .n(8)
1607*4bdc9457SAndroid Build Coastguard Worker         .k(4)
1608*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
1609*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1610*4bdc9457SAndroid Build Coastguard Worker     }
1611*4bdc9457SAndroid Build Coastguard Worker   }
1612*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,k_eq_4_subtile_n)1613*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, k_eq_4_subtile_n) {
1614*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
1615*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
1616*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
1617*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
1618*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
1619*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
1620*4bdc9457SAndroid Build Coastguard Worker         .m(4)
1621*4bdc9457SAndroid Build Coastguard Worker         .n(n)
1622*4bdc9457SAndroid Build Coastguard Worker         .k(4)
1623*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
1624*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1625*4bdc9457SAndroid Build Coastguard Worker     }
1626*4bdc9457SAndroid Build Coastguard Worker   }
1627*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,k_lt_4)1628*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, k_lt_4) {
1629*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
1630*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
1631*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
1632*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
1633*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
1634*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
1635*4bdc9457SAndroid Build Coastguard Worker         .m(4)
1636*4bdc9457SAndroid Build Coastguard Worker         .n(8)
1637*4bdc9457SAndroid Build Coastguard Worker         .k(k)
1638*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1639*4bdc9457SAndroid Build Coastguard Worker     }
1640*4bdc9457SAndroid Build Coastguard Worker   }
1641*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,k_lt_4_subtile)1642*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, k_lt_4_subtile) {
1643*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
1644*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
1645*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
1646*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
1647*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
1648*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
1649*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
1650*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
1651*4bdc9457SAndroid Build Coastguard Worker             .m(m)
1652*4bdc9457SAndroid Build Coastguard Worker             .n(n)
1653*4bdc9457SAndroid Build Coastguard Worker             .k(k)
1654*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
1655*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1656*4bdc9457SAndroid Build Coastguard Worker         }
1657*4bdc9457SAndroid Build Coastguard Worker       }
1658*4bdc9457SAndroid Build Coastguard Worker     }
1659*4bdc9457SAndroid Build Coastguard Worker   }
1660*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,k_gt_4)1661*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, k_gt_4) {
1662*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
1663*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
1664*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
1665*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
1666*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
1667*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
1668*4bdc9457SAndroid Build Coastguard Worker         .m(4)
1669*4bdc9457SAndroid Build Coastguard Worker         .n(8)
1670*4bdc9457SAndroid Build Coastguard Worker         .k(k)
1671*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1672*4bdc9457SAndroid Build Coastguard Worker     }
1673*4bdc9457SAndroid Build Coastguard Worker   }
1674*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,k_gt_4_subtile)1675*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, k_gt_4_subtile) {
1676*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
1677*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
1678*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
1679*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
1680*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
1681*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
1682*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
1683*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
1684*4bdc9457SAndroid Build Coastguard Worker             .m(m)
1685*4bdc9457SAndroid Build Coastguard Worker             .n(n)
1686*4bdc9457SAndroid Build Coastguard Worker             .k(k)
1687*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
1688*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1689*4bdc9457SAndroid Build Coastguard Worker         }
1690*4bdc9457SAndroid Build Coastguard Worker       }
1691*4bdc9457SAndroid Build Coastguard Worker     }
1692*4bdc9457SAndroid Build Coastguard Worker   }
1693*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,k_div_4)1694*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, k_div_4) {
1695*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
1696*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
1697*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
1698*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
1699*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
1700*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
1701*4bdc9457SAndroid Build Coastguard Worker         .m(4)
1702*4bdc9457SAndroid Build Coastguard Worker         .n(8)
1703*4bdc9457SAndroid Build Coastguard Worker         .k(k)
1704*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1705*4bdc9457SAndroid Build Coastguard Worker     }
1706*4bdc9457SAndroid Build Coastguard Worker   }
1707*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,k_div_4_subtile)1708*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, k_div_4_subtile) {
1709*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
1710*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
1711*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
1712*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
1713*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
1714*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
1715*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
1716*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
1717*4bdc9457SAndroid Build Coastguard Worker             .m(m)
1718*4bdc9457SAndroid Build Coastguard Worker             .n(n)
1719*4bdc9457SAndroid Build Coastguard Worker             .k(k)
1720*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
1721*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1722*4bdc9457SAndroid Build Coastguard Worker         }
1723*4bdc9457SAndroid Build Coastguard Worker       }
1724*4bdc9457SAndroid Build Coastguard Worker     }
1725*4bdc9457SAndroid Build Coastguard Worker   }
1726*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,n_gt_8)1727*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, n_gt_8) {
1728*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
1729*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
1730*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1731*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
1732*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1733*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1734*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1735*4bdc9457SAndroid Build Coastguard Worker           .m(4)
1736*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1737*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1738*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1739*4bdc9457SAndroid Build Coastguard Worker       }
1740*4bdc9457SAndroid Build Coastguard Worker     }
1741*4bdc9457SAndroid Build Coastguard Worker   }
1742*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,n_gt_8_strided_cn)1743*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, n_gt_8_strided_cn) {
1744*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
1745*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
1746*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1747*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
1748*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1749*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1750*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1751*4bdc9457SAndroid Build Coastguard Worker           .m(4)
1752*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1753*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1754*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
1755*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1756*4bdc9457SAndroid Build Coastguard Worker       }
1757*4bdc9457SAndroid Build Coastguard Worker     }
1758*4bdc9457SAndroid Build Coastguard Worker   }
1759*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,n_gt_8_subtile)1760*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, n_gt_8_subtile) {
1761*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
1762*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
1763*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
1764*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
1765*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
1766*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
1767*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
1768*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
1769*4bdc9457SAndroid Build Coastguard Worker             .m(m)
1770*4bdc9457SAndroid Build Coastguard Worker             .n(n)
1771*4bdc9457SAndroid Build Coastguard Worker             .k(k)
1772*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
1773*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1774*4bdc9457SAndroid Build Coastguard Worker         }
1775*4bdc9457SAndroid Build Coastguard Worker       }
1776*4bdc9457SAndroid Build Coastguard Worker     }
1777*4bdc9457SAndroid Build Coastguard Worker   }
1778*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,n_div_8)1779*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, n_div_8) {
1780*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
1781*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
1782*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1783*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
1784*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1785*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1786*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1787*4bdc9457SAndroid Build Coastguard Worker           .m(4)
1788*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1789*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1790*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1791*4bdc9457SAndroid Build Coastguard Worker       }
1792*4bdc9457SAndroid Build Coastguard Worker     }
1793*4bdc9457SAndroid Build Coastguard Worker   }
1794*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,n_div_8_strided_cn)1795*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, n_div_8_strided_cn) {
1796*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
1797*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
1798*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1799*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
1800*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1801*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1802*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1803*4bdc9457SAndroid Build Coastguard Worker           .m(4)
1804*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1805*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1806*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
1807*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1808*4bdc9457SAndroid Build Coastguard Worker       }
1809*4bdc9457SAndroid Build Coastguard Worker     }
1810*4bdc9457SAndroid Build Coastguard Worker   }
1811*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,n_div_8_subtile)1812*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, n_div_8_subtile) {
1813*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
1814*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
1815*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
1816*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
1817*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
1818*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
1819*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
1820*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
1821*4bdc9457SAndroid Build Coastguard Worker             .m(m)
1822*4bdc9457SAndroid Build Coastguard Worker             .n(n)
1823*4bdc9457SAndroid Build Coastguard Worker             .k(k)
1824*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
1825*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1826*4bdc9457SAndroid Build Coastguard Worker         }
1827*4bdc9457SAndroid Build Coastguard Worker       }
1828*4bdc9457SAndroid Build Coastguard Worker     }
1829*4bdc9457SAndroid Build Coastguard Worker   }
1830*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,small_kernel)1831*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, small_kernel) {
1832*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
1833*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
1834*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
1835*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
1836*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
1837*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
1838*4bdc9457SAndroid Build Coastguard Worker         .m(4)
1839*4bdc9457SAndroid Build Coastguard Worker         .n(8)
1840*4bdc9457SAndroid Build Coastguard Worker         .k(k)
1841*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
1842*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1843*4bdc9457SAndroid Build Coastguard Worker     }
1844*4bdc9457SAndroid Build Coastguard Worker   }
1845*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,small_kernel_subtile)1846*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, small_kernel_subtile) {
1847*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
1848*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
1849*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
1850*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
1851*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
1852*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
1853*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
1854*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
1855*4bdc9457SAndroid Build Coastguard Worker             .m(m)
1856*4bdc9457SAndroid Build Coastguard Worker             .n(n)
1857*4bdc9457SAndroid Build Coastguard Worker             .k(k)
1858*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
1859*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
1860*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1861*4bdc9457SAndroid Build Coastguard Worker         }
1862*4bdc9457SAndroid Build Coastguard Worker       }
1863*4bdc9457SAndroid Build Coastguard Worker     }
1864*4bdc9457SAndroid Build Coastguard Worker   }
1865*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,n_gt_8_small_kernel)1866*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, n_gt_8_small_kernel) {
1867*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
1868*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
1869*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1870*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
1871*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1872*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1873*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1874*4bdc9457SAndroid Build Coastguard Worker           .m(4)
1875*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1876*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1877*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
1878*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1879*4bdc9457SAndroid Build Coastguard Worker       }
1880*4bdc9457SAndroid Build Coastguard Worker     }
1881*4bdc9457SAndroid Build Coastguard Worker   }
1882*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,n_div_8_small_kernel)1883*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, n_div_8_small_kernel) {
1884*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
1885*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
1886*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1887*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
1888*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1889*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1890*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1891*4bdc9457SAndroid Build Coastguard Worker           .m(4)
1892*4bdc9457SAndroid Build Coastguard Worker           .n(n)
1893*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1894*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
1895*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1896*4bdc9457SAndroid Build Coastguard Worker       }
1897*4bdc9457SAndroid Build Coastguard Worker     }
1898*4bdc9457SAndroid Build Coastguard Worker   }
1899*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,strided_cm_subtile)1900*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, strided_cm_subtile) {
1901*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
1902*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
1903*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
1904*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
1905*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
1906*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
1907*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
1908*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
1909*4bdc9457SAndroid Build Coastguard Worker             .m(m)
1910*4bdc9457SAndroid Build Coastguard Worker             .n(n)
1911*4bdc9457SAndroid Build Coastguard Worker             .k(k)
1912*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(11)
1913*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
1914*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1915*4bdc9457SAndroid Build Coastguard Worker         }
1916*4bdc9457SAndroid Build Coastguard Worker       }
1917*4bdc9457SAndroid Build Coastguard Worker     }
1918*4bdc9457SAndroid Build Coastguard Worker   }
1919*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,a_offset)1920*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, a_offset) {
1921*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
1922*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
1923*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
1924*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
1925*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
1926*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
1927*4bdc9457SAndroid Build Coastguard Worker         .m(4)
1928*4bdc9457SAndroid Build Coastguard Worker         .n(8)
1929*4bdc9457SAndroid Build Coastguard Worker         .k(k)
1930*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
1931*4bdc9457SAndroid Build Coastguard Worker         .a_offset(83)
1932*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1933*4bdc9457SAndroid Build Coastguard Worker     }
1934*4bdc9457SAndroid Build Coastguard Worker   }
1935*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,zero)1936*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, zero) {
1937*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
1938*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 4; mz++) {
1939*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
1940*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
1941*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
1942*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
1943*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
1944*4bdc9457SAndroid Build Coastguard Worker           .m(4)
1945*4bdc9457SAndroid Build Coastguard Worker           .n(8)
1946*4bdc9457SAndroid Build Coastguard Worker           .k(k)
1947*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
1948*4bdc9457SAndroid Build Coastguard Worker           .a_offset(83)
1949*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
1950*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1951*4bdc9457SAndroid Build Coastguard Worker       }
1952*4bdc9457SAndroid Build Coastguard Worker     }
1953*4bdc9457SAndroid Build Coastguard Worker   }
1954*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT,strided_cm)1955*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMSIMD_SPLAT, strided_cm) {
1956*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
1957*4bdc9457SAndroid Build Coastguard Worker       .mr(4)
1958*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
1959*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
1960*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
1961*4bdc9457SAndroid Build Coastguard Worker       .m(4)
1962*4bdc9457SAndroid Build Coastguard Worker       .n(8)
1963*4bdc9457SAndroid Build Coastguard Worker       .k(4)
1964*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(11)
1965*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmsimd_splat);
1966*4bdc9457SAndroid Build Coastguard Worker   }
1967*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
1968*4bdc9457SAndroid Build Coastguard Worker 
1969*4bdc9457SAndroid Build Coastguard Worker 
1970*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,k_eq_1)1971*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, k_eq_1) {
1972*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
1973*4bdc9457SAndroid Build Coastguard Worker       .mr(5)
1974*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
1975*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
1976*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
1977*4bdc9457SAndroid Build Coastguard Worker       .m(5)
1978*4bdc9457SAndroid Build Coastguard Worker       .n(8)
1979*4bdc9457SAndroid Build Coastguard Worker       .k(1)
1980*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
1981*4bdc9457SAndroid Build Coastguard Worker   }
1982*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,strided_cn)1983*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, strided_cn) {
1984*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
1985*4bdc9457SAndroid Build Coastguard Worker       .mr(5)
1986*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
1987*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
1988*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
1989*4bdc9457SAndroid Build Coastguard Worker       .m(5)
1990*4bdc9457SAndroid Build Coastguard Worker       .n(8)
1991*4bdc9457SAndroid Build Coastguard Worker       .k(1)
1992*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(11)
1993*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
1994*4bdc9457SAndroid Build Coastguard Worker   }
1995*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile)1996*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile) {
1997*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
1998*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 5; m++) {
1999*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2000*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
2001*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2002*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2003*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
2004*4bdc9457SAndroid Build Coastguard Worker           .m(m)
2005*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2006*4bdc9457SAndroid Build Coastguard Worker           .k(1)
2007*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
2008*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2009*4bdc9457SAndroid Build Coastguard Worker       }
2010*4bdc9457SAndroid Build Coastguard Worker     }
2011*4bdc9457SAndroid Build Coastguard Worker   }
2012*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile_m)2013*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_m) {
2014*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 5; m++) {
2015*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2016*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
2017*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2018*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2019*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
2020*4bdc9457SAndroid Build Coastguard Worker         .m(m)
2021*4bdc9457SAndroid Build Coastguard Worker         .n(8)
2022*4bdc9457SAndroid Build Coastguard Worker         .k(1)
2023*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
2024*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2025*4bdc9457SAndroid Build Coastguard Worker     }
2026*4bdc9457SAndroid Build Coastguard Worker   }
2027*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile_n)2028*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_n) {
2029*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
2030*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2031*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
2032*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2033*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2034*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
2035*4bdc9457SAndroid Build Coastguard Worker         .m(5)
2036*4bdc9457SAndroid Build Coastguard Worker         .n(n)
2037*4bdc9457SAndroid Build Coastguard Worker         .k(1)
2038*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
2039*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2040*4bdc9457SAndroid Build Coastguard Worker     }
2041*4bdc9457SAndroid Build Coastguard Worker   }
2042*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,k_gt_1)2043*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, k_gt_1) {
2044*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 2; k < 10; k++) {
2045*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2046*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
2047*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2048*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2049*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
2050*4bdc9457SAndroid Build Coastguard Worker         .m(5)
2051*4bdc9457SAndroid Build Coastguard Worker         .n(8)
2052*4bdc9457SAndroid Build Coastguard Worker         .k(k)
2053*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2054*4bdc9457SAndroid Build Coastguard Worker     }
2055*4bdc9457SAndroid Build Coastguard Worker   }
2056*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,k_gt_1_subtile)2057*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, k_gt_1_subtile) {
2058*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 2; k < 10; k++) {
2059*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
2060*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
2061*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2062*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
2063*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2064*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2065*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
2066*4bdc9457SAndroid Build Coastguard Worker             .m(m)
2067*4bdc9457SAndroid Build Coastguard Worker             .n(n)
2068*4bdc9457SAndroid Build Coastguard Worker             .k(k)
2069*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
2070*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2071*4bdc9457SAndroid Build Coastguard Worker         }
2072*4bdc9457SAndroid Build Coastguard Worker       }
2073*4bdc9457SAndroid Build Coastguard Worker     }
2074*4bdc9457SAndroid Build Coastguard Worker   }
2075*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,n_gt_8)2076*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, n_gt_8) {
2077*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
2078*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
2079*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2080*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
2081*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2082*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2083*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
2084*4bdc9457SAndroid Build Coastguard Worker           .m(5)
2085*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2086*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2087*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2088*4bdc9457SAndroid Build Coastguard Worker       }
2089*4bdc9457SAndroid Build Coastguard Worker     }
2090*4bdc9457SAndroid Build Coastguard Worker   }
2091*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,n_gt_8_strided_cn)2092*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_cn) {
2093*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
2094*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
2095*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2096*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
2097*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2098*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2099*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
2100*4bdc9457SAndroid Build Coastguard Worker           .m(5)
2101*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2102*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2103*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
2104*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2105*4bdc9457SAndroid Build Coastguard Worker       }
2106*4bdc9457SAndroid Build Coastguard Worker     }
2107*4bdc9457SAndroid Build Coastguard Worker   }
2108*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,n_gt_8_subtile)2109*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, n_gt_8_subtile) {
2110*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
2111*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
2112*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
2113*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2114*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
2115*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2116*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2117*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
2118*4bdc9457SAndroid Build Coastguard Worker             .m(m)
2119*4bdc9457SAndroid Build Coastguard Worker             .n(n)
2120*4bdc9457SAndroid Build Coastguard Worker             .k(k)
2121*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
2122*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2123*4bdc9457SAndroid Build Coastguard Worker         }
2124*4bdc9457SAndroid Build Coastguard Worker       }
2125*4bdc9457SAndroid Build Coastguard Worker     }
2126*4bdc9457SAndroid Build Coastguard Worker   }
2127*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,n_div_8)2128*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, n_div_8) {
2129*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
2130*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
2131*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2132*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
2133*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2134*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2135*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
2136*4bdc9457SAndroid Build Coastguard Worker           .m(5)
2137*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2138*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2139*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2140*4bdc9457SAndroid Build Coastguard Worker       }
2141*4bdc9457SAndroid Build Coastguard Worker     }
2142*4bdc9457SAndroid Build Coastguard Worker   }
2143*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,n_div_8_strided_cn)2144*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, n_div_8_strided_cn) {
2145*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
2146*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
2147*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2148*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
2149*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2150*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2151*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
2152*4bdc9457SAndroid Build Coastguard Worker           .m(5)
2153*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2154*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2155*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
2156*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2157*4bdc9457SAndroid Build Coastguard Worker       }
2158*4bdc9457SAndroid Build Coastguard Worker     }
2159*4bdc9457SAndroid Build Coastguard Worker   }
2160*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,n_div_8_subtile)2161*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, n_div_8_subtile) {
2162*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
2163*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
2164*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
2165*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2166*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
2167*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2168*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2169*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
2170*4bdc9457SAndroid Build Coastguard Worker             .m(m)
2171*4bdc9457SAndroid Build Coastguard Worker             .n(n)
2172*4bdc9457SAndroid Build Coastguard Worker             .k(k)
2173*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
2174*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2175*4bdc9457SAndroid Build Coastguard Worker         }
2176*4bdc9457SAndroid Build Coastguard Worker       }
2177*4bdc9457SAndroid Build Coastguard Worker     }
2178*4bdc9457SAndroid Build Coastguard Worker   }
2179*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,small_kernel)2180*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, small_kernel) {
2181*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
2182*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2183*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
2184*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2185*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2186*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
2187*4bdc9457SAndroid Build Coastguard Worker         .m(5)
2188*4bdc9457SAndroid Build Coastguard Worker         .n(8)
2189*4bdc9457SAndroid Build Coastguard Worker         .k(k)
2190*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
2191*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2192*4bdc9457SAndroid Build Coastguard Worker     }
2193*4bdc9457SAndroid Build Coastguard Worker   }
2194*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,small_kernel_subtile)2195*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, small_kernel_subtile) {
2196*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
2197*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
2198*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
2199*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2200*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
2201*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2202*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2203*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
2204*4bdc9457SAndroid Build Coastguard Worker             .m(m)
2205*4bdc9457SAndroid Build Coastguard Worker             .n(n)
2206*4bdc9457SAndroid Build Coastguard Worker             .k(k)
2207*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
2208*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
2209*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2210*4bdc9457SAndroid Build Coastguard Worker         }
2211*4bdc9457SAndroid Build Coastguard Worker       }
2212*4bdc9457SAndroid Build Coastguard Worker     }
2213*4bdc9457SAndroid Build Coastguard Worker   }
2214*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,n_gt_8_small_kernel)2215*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, n_gt_8_small_kernel) {
2216*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
2217*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
2218*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2219*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
2220*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2221*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2222*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
2223*4bdc9457SAndroid Build Coastguard Worker           .m(5)
2224*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2225*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2226*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
2227*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2228*4bdc9457SAndroid Build Coastguard Worker       }
2229*4bdc9457SAndroid Build Coastguard Worker     }
2230*4bdc9457SAndroid Build Coastguard Worker   }
2231*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,n_div_8_small_kernel)2232*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, n_div_8_small_kernel) {
2233*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
2234*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
2235*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2236*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
2237*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2238*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2239*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
2240*4bdc9457SAndroid Build Coastguard Worker           .m(5)
2241*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2242*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2243*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
2244*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2245*4bdc9457SAndroid Build Coastguard Worker       }
2246*4bdc9457SAndroid Build Coastguard Worker     }
2247*4bdc9457SAndroid Build Coastguard Worker   }
2248*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,strided_cm_subtile)2249*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, strided_cm_subtile) {
2250*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
2251*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
2252*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
2253*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2254*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
2255*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2256*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2257*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
2258*4bdc9457SAndroid Build Coastguard Worker             .m(m)
2259*4bdc9457SAndroid Build Coastguard Worker             .n(n)
2260*4bdc9457SAndroid Build Coastguard Worker             .k(k)
2261*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(11)
2262*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
2263*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2264*4bdc9457SAndroid Build Coastguard Worker         }
2265*4bdc9457SAndroid Build Coastguard Worker       }
2266*4bdc9457SAndroid Build Coastguard Worker     }
2267*4bdc9457SAndroid Build Coastguard Worker   }
2268*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,a_offset)2269*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, a_offset) {
2270*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
2271*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2272*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
2273*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2274*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2275*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
2276*4bdc9457SAndroid Build Coastguard Worker         .m(5)
2277*4bdc9457SAndroid Build Coastguard Worker         .n(8)
2278*4bdc9457SAndroid Build Coastguard Worker         .k(k)
2279*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
2280*4bdc9457SAndroid Build Coastguard Worker         .a_offset(29)
2281*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2282*4bdc9457SAndroid Build Coastguard Worker     }
2283*4bdc9457SAndroid Build Coastguard Worker   }
2284*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,zero)2285*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, zero) {
2286*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
2287*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 5; mz++) {
2288*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2289*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
2290*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2291*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2292*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
2293*4bdc9457SAndroid Build Coastguard Worker           .m(5)
2294*4bdc9457SAndroid Build Coastguard Worker           .n(8)
2295*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2296*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
2297*4bdc9457SAndroid Build Coastguard Worker           .a_offset(29)
2298*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
2299*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2300*4bdc9457SAndroid Build Coastguard Worker       }
2301*4bdc9457SAndroid Build Coastguard Worker     }
2302*4bdc9457SAndroid Build Coastguard Worker   }
2303*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT,strided_cm)2304*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_LOADSPLAT, strided_cm) {
2305*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
2306*4bdc9457SAndroid Build Coastguard Worker       .mr(5)
2307*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
2308*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
2309*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
2310*4bdc9457SAndroid Build Coastguard Worker       .m(5)
2311*4bdc9457SAndroid Build Coastguard Worker       .n(8)
2312*4bdc9457SAndroid Build Coastguard Worker       .k(1)
2313*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(11)
2314*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2315*4bdc9457SAndroid Build Coastguard Worker   }
2316*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
2317*4bdc9457SAndroid Build Coastguard Worker 
2318*4bdc9457SAndroid Build Coastguard Worker 
2319*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,k_eq_4)2320*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, k_eq_4) {
2321*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
2322*4bdc9457SAndroid Build Coastguard Worker       .mr(5)
2323*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
2324*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
2325*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
2326*4bdc9457SAndroid Build Coastguard Worker       .m(5)
2327*4bdc9457SAndroid Build Coastguard Worker       .n(8)
2328*4bdc9457SAndroid Build Coastguard Worker       .k(4)
2329*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2330*4bdc9457SAndroid Build Coastguard Worker   }
2331*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,strided_cn)2332*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, strided_cn) {
2333*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
2334*4bdc9457SAndroid Build Coastguard Worker       .mr(5)
2335*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
2336*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
2337*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
2338*4bdc9457SAndroid Build Coastguard Worker       .m(5)
2339*4bdc9457SAndroid Build Coastguard Worker       .n(8)
2340*4bdc9457SAndroid Build Coastguard Worker       .k(4)
2341*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(11)
2342*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2343*4bdc9457SAndroid Build Coastguard Worker   }
2344*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,k_eq_4_subtile)2345*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, k_eq_4_subtile) {
2346*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
2347*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 5; m++) {
2348*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2349*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
2350*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2351*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2352*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
2353*4bdc9457SAndroid Build Coastguard Worker           .m(m)
2354*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2355*4bdc9457SAndroid Build Coastguard Worker           .k(4)
2356*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
2357*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2358*4bdc9457SAndroid Build Coastguard Worker       }
2359*4bdc9457SAndroid Build Coastguard Worker     }
2360*4bdc9457SAndroid Build Coastguard Worker   }
2361*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,k_eq_4_subtile_m)2362*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, k_eq_4_subtile_m) {
2363*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 5; m++) {
2364*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2365*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
2366*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2367*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2368*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
2369*4bdc9457SAndroid Build Coastguard Worker         .m(m)
2370*4bdc9457SAndroid Build Coastguard Worker         .n(8)
2371*4bdc9457SAndroid Build Coastguard Worker         .k(4)
2372*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
2373*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2374*4bdc9457SAndroid Build Coastguard Worker     }
2375*4bdc9457SAndroid Build Coastguard Worker   }
2376*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,k_eq_4_subtile_n)2377*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, k_eq_4_subtile_n) {
2378*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
2379*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2380*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
2381*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2382*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2383*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
2384*4bdc9457SAndroid Build Coastguard Worker         .m(5)
2385*4bdc9457SAndroid Build Coastguard Worker         .n(n)
2386*4bdc9457SAndroid Build Coastguard Worker         .k(4)
2387*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
2388*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2389*4bdc9457SAndroid Build Coastguard Worker     }
2390*4bdc9457SAndroid Build Coastguard Worker   }
2391*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,k_lt_4)2392*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, k_lt_4) {
2393*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
2394*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2395*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
2396*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2397*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2398*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
2399*4bdc9457SAndroid Build Coastguard Worker         .m(5)
2400*4bdc9457SAndroid Build Coastguard Worker         .n(8)
2401*4bdc9457SAndroid Build Coastguard Worker         .k(k)
2402*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2403*4bdc9457SAndroid Build Coastguard Worker     }
2404*4bdc9457SAndroid Build Coastguard Worker   }
2405*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,k_lt_4_subtile)2406*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, k_lt_4_subtile) {
2407*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
2408*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
2409*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
2410*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2411*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
2412*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2413*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2414*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
2415*4bdc9457SAndroid Build Coastguard Worker             .m(m)
2416*4bdc9457SAndroid Build Coastguard Worker             .n(n)
2417*4bdc9457SAndroid Build Coastguard Worker             .k(k)
2418*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
2419*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2420*4bdc9457SAndroid Build Coastguard Worker         }
2421*4bdc9457SAndroid Build Coastguard Worker       }
2422*4bdc9457SAndroid Build Coastguard Worker     }
2423*4bdc9457SAndroid Build Coastguard Worker   }
2424*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,k_gt_4)2425*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, k_gt_4) {
2426*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
2427*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2428*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
2429*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2430*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2431*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
2432*4bdc9457SAndroid Build Coastguard Worker         .m(5)
2433*4bdc9457SAndroid Build Coastguard Worker         .n(8)
2434*4bdc9457SAndroid Build Coastguard Worker         .k(k)
2435*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2436*4bdc9457SAndroid Build Coastguard Worker     }
2437*4bdc9457SAndroid Build Coastguard Worker   }
2438*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,k_gt_4_subtile)2439*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, k_gt_4_subtile) {
2440*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
2441*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
2442*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
2443*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2444*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
2445*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2446*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2447*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
2448*4bdc9457SAndroid Build Coastguard Worker             .m(m)
2449*4bdc9457SAndroid Build Coastguard Worker             .n(n)
2450*4bdc9457SAndroid Build Coastguard Worker             .k(k)
2451*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
2452*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2453*4bdc9457SAndroid Build Coastguard Worker         }
2454*4bdc9457SAndroid Build Coastguard Worker       }
2455*4bdc9457SAndroid Build Coastguard Worker     }
2456*4bdc9457SAndroid Build Coastguard Worker   }
2457*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,k_div_4)2458*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, k_div_4) {
2459*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
2460*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2461*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
2462*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2463*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2464*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
2465*4bdc9457SAndroid Build Coastguard Worker         .m(5)
2466*4bdc9457SAndroid Build Coastguard Worker         .n(8)
2467*4bdc9457SAndroid Build Coastguard Worker         .k(k)
2468*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2469*4bdc9457SAndroid Build Coastguard Worker     }
2470*4bdc9457SAndroid Build Coastguard Worker   }
2471*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,k_div_4_subtile)2472*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, k_div_4_subtile) {
2473*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
2474*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
2475*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
2476*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2477*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
2478*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2479*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2480*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
2481*4bdc9457SAndroid Build Coastguard Worker             .m(m)
2482*4bdc9457SAndroid Build Coastguard Worker             .n(n)
2483*4bdc9457SAndroid Build Coastguard Worker             .k(k)
2484*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
2485*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2486*4bdc9457SAndroid Build Coastguard Worker         }
2487*4bdc9457SAndroid Build Coastguard Worker       }
2488*4bdc9457SAndroid Build Coastguard Worker     }
2489*4bdc9457SAndroid Build Coastguard Worker   }
2490*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,n_gt_8)2491*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, n_gt_8) {
2492*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
2493*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
2494*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2495*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
2496*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2497*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2498*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
2499*4bdc9457SAndroid Build Coastguard Worker           .m(5)
2500*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2501*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2502*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2503*4bdc9457SAndroid Build Coastguard Worker       }
2504*4bdc9457SAndroid Build Coastguard Worker     }
2505*4bdc9457SAndroid Build Coastguard Worker   }
2506*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,n_gt_8_strided_cn)2507*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, n_gt_8_strided_cn) {
2508*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
2509*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
2510*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2511*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
2512*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2513*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2514*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
2515*4bdc9457SAndroid Build Coastguard Worker           .m(5)
2516*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2517*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2518*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
2519*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2520*4bdc9457SAndroid Build Coastguard Worker       }
2521*4bdc9457SAndroid Build Coastguard Worker     }
2522*4bdc9457SAndroid Build Coastguard Worker   }
2523*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,n_gt_8_subtile)2524*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, n_gt_8_subtile) {
2525*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
2526*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
2527*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
2528*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2529*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
2530*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2531*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2532*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
2533*4bdc9457SAndroid Build Coastguard Worker             .m(m)
2534*4bdc9457SAndroid Build Coastguard Worker             .n(n)
2535*4bdc9457SAndroid Build Coastguard Worker             .k(k)
2536*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
2537*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2538*4bdc9457SAndroid Build Coastguard Worker         }
2539*4bdc9457SAndroid Build Coastguard Worker       }
2540*4bdc9457SAndroid Build Coastguard Worker     }
2541*4bdc9457SAndroid Build Coastguard Worker   }
2542*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,n_div_8)2543*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, n_div_8) {
2544*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
2545*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
2546*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2547*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
2548*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2549*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2550*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
2551*4bdc9457SAndroid Build Coastguard Worker           .m(5)
2552*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2553*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2554*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2555*4bdc9457SAndroid Build Coastguard Worker       }
2556*4bdc9457SAndroid Build Coastguard Worker     }
2557*4bdc9457SAndroid Build Coastguard Worker   }
2558*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,n_div_8_strided_cn)2559*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, n_div_8_strided_cn) {
2560*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
2561*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
2562*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2563*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
2564*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2565*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2566*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
2567*4bdc9457SAndroid Build Coastguard Worker           .m(5)
2568*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2569*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2570*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
2571*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2572*4bdc9457SAndroid Build Coastguard Worker       }
2573*4bdc9457SAndroid Build Coastguard Worker     }
2574*4bdc9457SAndroid Build Coastguard Worker   }
2575*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,n_div_8_subtile)2576*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, n_div_8_subtile) {
2577*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
2578*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
2579*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
2580*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2581*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
2582*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2583*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2584*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
2585*4bdc9457SAndroid Build Coastguard Worker             .m(m)
2586*4bdc9457SAndroid Build Coastguard Worker             .n(n)
2587*4bdc9457SAndroid Build Coastguard Worker             .k(k)
2588*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
2589*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2590*4bdc9457SAndroid Build Coastguard Worker         }
2591*4bdc9457SAndroid Build Coastguard Worker       }
2592*4bdc9457SAndroid Build Coastguard Worker     }
2593*4bdc9457SAndroid Build Coastguard Worker   }
2594*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,small_kernel)2595*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, small_kernel) {
2596*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
2597*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2598*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
2599*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2600*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2601*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
2602*4bdc9457SAndroid Build Coastguard Worker         .m(5)
2603*4bdc9457SAndroid Build Coastguard Worker         .n(8)
2604*4bdc9457SAndroid Build Coastguard Worker         .k(k)
2605*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
2606*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2607*4bdc9457SAndroid Build Coastguard Worker     }
2608*4bdc9457SAndroid Build Coastguard Worker   }
2609*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,small_kernel_subtile)2610*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, small_kernel_subtile) {
2611*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
2612*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
2613*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
2614*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2615*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
2616*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2617*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2618*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
2619*4bdc9457SAndroid Build Coastguard Worker             .m(m)
2620*4bdc9457SAndroid Build Coastguard Worker             .n(n)
2621*4bdc9457SAndroid Build Coastguard Worker             .k(k)
2622*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
2623*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
2624*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2625*4bdc9457SAndroid Build Coastguard Worker         }
2626*4bdc9457SAndroid Build Coastguard Worker       }
2627*4bdc9457SAndroid Build Coastguard Worker     }
2628*4bdc9457SAndroid Build Coastguard Worker   }
2629*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,n_gt_8_small_kernel)2630*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, n_gt_8_small_kernel) {
2631*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
2632*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
2633*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2634*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
2635*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2636*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2637*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
2638*4bdc9457SAndroid Build Coastguard Worker           .m(5)
2639*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2640*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2641*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
2642*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2643*4bdc9457SAndroid Build Coastguard Worker       }
2644*4bdc9457SAndroid Build Coastguard Worker     }
2645*4bdc9457SAndroid Build Coastguard Worker   }
2646*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,n_div_8_small_kernel)2647*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, n_div_8_small_kernel) {
2648*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
2649*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
2650*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2651*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
2652*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2653*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2654*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
2655*4bdc9457SAndroid Build Coastguard Worker           .m(5)
2656*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2657*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2658*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
2659*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2660*4bdc9457SAndroid Build Coastguard Worker       }
2661*4bdc9457SAndroid Build Coastguard Worker     }
2662*4bdc9457SAndroid Build Coastguard Worker   }
2663*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,strided_cm_subtile)2664*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, strided_cm_subtile) {
2665*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
2666*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
2667*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
2668*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2669*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
2670*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2671*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2672*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
2673*4bdc9457SAndroid Build Coastguard Worker             .m(m)
2674*4bdc9457SAndroid Build Coastguard Worker             .n(n)
2675*4bdc9457SAndroid Build Coastguard Worker             .k(k)
2676*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(11)
2677*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
2678*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2679*4bdc9457SAndroid Build Coastguard Worker         }
2680*4bdc9457SAndroid Build Coastguard Worker       }
2681*4bdc9457SAndroid Build Coastguard Worker     }
2682*4bdc9457SAndroid Build Coastguard Worker   }
2683*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,a_offset)2684*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, a_offset) {
2685*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
2686*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2687*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
2688*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2689*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2690*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
2691*4bdc9457SAndroid Build Coastguard Worker         .m(5)
2692*4bdc9457SAndroid Build Coastguard Worker         .n(8)
2693*4bdc9457SAndroid Build Coastguard Worker         .k(k)
2694*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
2695*4bdc9457SAndroid Build Coastguard Worker         .a_offset(103)
2696*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2697*4bdc9457SAndroid Build Coastguard Worker     }
2698*4bdc9457SAndroid Build Coastguard Worker   }
2699*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,zero)2700*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, zero) {
2701*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
2702*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 5; mz++) {
2703*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2704*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
2705*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2706*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2707*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
2708*4bdc9457SAndroid Build Coastguard Worker           .m(5)
2709*4bdc9457SAndroid Build Coastguard Worker           .n(8)
2710*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2711*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
2712*4bdc9457SAndroid Build Coastguard Worker           .a_offset(103)
2713*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
2714*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2715*4bdc9457SAndroid Build Coastguard Worker       }
2716*4bdc9457SAndroid Build Coastguard Worker     }
2717*4bdc9457SAndroid Build Coastguard Worker   }
2718*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT,strided_cm)2719*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMSIMD_SPLAT, strided_cm) {
2720*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
2721*4bdc9457SAndroid Build Coastguard Worker       .mr(5)
2722*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
2723*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
2724*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
2725*4bdc9457SAndroid Build Coastguard Worker       .m(5)
2726*4bdc9457SAndroid Build Coastguard Worker       .n(8)
2727*4bdc9457SAndroid Build Coastguard Worker       .k(4)
2728*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(11)
2729*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmsimd_splat);
2730*4bdc9457SAndroid Build Coastguard Worker   }
2731*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
2732*4bdc9457SAndroid Build Coastguard Worker 
2733*4bdc9457SAndroid Build Coastguard Worker 
2734*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,k_eq_4)2735*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, k_eq_4) {
2736*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
2737*4bdc9457SAndroid Build Coastguard Worker       .mr(6)
2738*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
2739*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
2740*4bdc9457SAndroid Build Coastguard Worker       .sr(4)
2741*4bdc9457SAndroid Build Coastguard Worker       .m(6)
2742*4bdc9457SAndroid Build Coastguard Worker       .n(8)
2743*4bdc9457SAndroid Build Coastguard Worker       .k(4)
2744*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
2745*4bdc9457SAndroid Build Coastguard Worker   }
2746*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,strided_cn)2747*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, strided_cn) {
2748*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
2749*4bdc9457SAndroid Build Coastguard Worker       .mr(6)
2750*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
2751*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
2752*4bdc9457SAndroid Build Coastguard Worker       .sr(4)
2753*4bdc9457SAndroid Build Coastguard Worker       .m(6)
2754*4bdc9457SAndroid Build Coastguard Worker       .n(8)
2755*4bdc9457SAndroid Build Coastguard Worker       .k(4)
2756*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(11)
2757*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
2758*4bdc9457SAndroid Build Coastguard Worker   }
2759*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,k_eq_4_subtile)2760*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, k_eq_4_subtile) {
2761*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
2762*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 6; m++) {
2763*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2764*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
2765*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2766*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2767*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
2768*4bdc9457SAndroid Build Coastguard Worker           .m(m)
2769*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2770*4bdc9457SAndroid Build Coastguard Worker           .k(4)
2771*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
2772*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
2773*4bdc9457SAndroid Build Coastguard Worker       }
2774*4bdc9457SAndroid Build Coastguard Worker     }
2775*4bdc9457SAndroid Build Coastguard Worker   }
2776*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,k_eq_4_subtile_m)2777*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, k_eq_4_subtile_m) {
2778*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 6; m++) {
2779*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2780*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
2781*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2782*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2783*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
2784*4bdc9457SAndroid Build Coastguard Worker         .m(m)
2785*4bdc9457SAndroid Build Coastguard Worker         .n(8)
2786*4bdc9457SAndroid Build Coastguard Worker         .k(4)
2787*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
2788*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
2789*4bdc9457SAndroid Build Coastguard Worker     }
2790*4bdc9457SAndroid Build Coastguard Worker   }
2791*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,k_eq_4_subtile_n)2792*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, k_eq_4_subtile_n) {
2793*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
2794*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2795*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
2796*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2797*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2798*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
2799*4bdc9457SAndroid Build Coastguard Worker         .m(6)
2800*4bdc9457SAndroid Build Coastguard Worker         .n(n)
2801*4bdc9457SAndroid Build Coastguard Worker         .k(4)
2802*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
2803*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
2804*4bdc9457SAndroid Build Coastguard Worker     }
2805*4bdc9457SAndroid Build Coastguard Worker   }
2806*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,k_lt_4)2807*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, k_lt_4) {
2808*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
2809*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2810*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
2811*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2812*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2813*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
2814*4bdc9457SAndroid Build Coastguard Worker         .m(6)
2815*4bdc9457SAndroid Build Coastguard Worker         .n(8)
2816*4bdc9457SAndroid Build Coastguard Worker         .k(k)
2817*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
2818*4bdc9457SAndroid Build Coastguard Worker     }
2819*4bdc9457SAndroid Build Coastguard Worker   }
2820*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,k_lt_4_subtile)2821*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, k_lt_4_subtile) {
2822*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
2823*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
2824*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
2825*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2826*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
2827*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2828*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2829*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
2830*4bdc9457SAndroid Build Coastguard Worker             .m(m)
2831*4bdc9457SAndroid Build Coastguard Worker             .n(n)
2832*4bdc9457SAndroid Build Coastguard Worker             .k(k)
2833*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
2834*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
2835*4bdc9457SAndroid Build Coastguard Worker         }
2836*4bdc9457SAndroid Build Coastguard Worker       }
2837*4bdc9457SAndroid Build Coastguard Worker     }
2838*4bdc9457SAndroid Build Coastguard Worker   }
2839*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,k_gt_4)2840*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, k_gt_4) {
2841*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
2842*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2843*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
2844*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2845*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2846*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
2847*4bdc9457SAndroid Build Coastguard Worker         .m(6)
2848*4bdc9457SAndroid Build Coastguard Worker         .n(8)
2849*4bdc9457SAndroid Build Coastguard Worker         .k(k)
2850*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
2851*4bdc9457SAndroid Build Coastguard Worker     }
2852*4bdc9457SAndroid Build Coastguard Worker   }
2853*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,k_gt_4_subtile)2854*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, k_gt_4_subtile) {
2855*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
2856*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
2857*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
2858*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2859*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
2860*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2861*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2862*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
2863*4bdc9457SAndroid Build Coastguard Worker             .m(m)
2864*4bdc9457SAndroid Build Coastguard Worker             .n(n)
2865*4bdc9457SAndroid Build Coastguard Worker             .k(k)
2866*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
2867*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
2868*4bdc9457SAndroid Build Coastguard Worker         }
2869*4bdc9457SAndroid Build Coastguard Worker       }
2870*4bdc9457SAndroid Build Coastguard Worker     }
2871*4bdc9457SAndroid Build Coastguard Worker   }
2872*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,k_div_4)2873*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, k_div_4) {
2874*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
2875*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
2876*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
2877*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
2878*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
2879*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
2880*4bdc9457SAndroid Build Coastguard Worker         .m(6)
2881*4bdc9457SAndroid Build Coastguard Worker         .n(8)
2882*4bdc9457SAndroid Build Coastguard Worker         .k(k)
2883*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
2884*4bdc9457SAndroid Build Coastguard Worker     }
2885*4bdc9457SAndroid Build Coastguard Worker   }
2886*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,k_div_4_subtile)2887*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, k_div_4_subtile) {
2888*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
2889*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
2890*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
2891*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2892*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
2893*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2894*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2895*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
2896*4bdc9457SAndroid Build Coastguard Worker             .m(m)
2897*4bdc9457SAndroid Build Coastguard Worker             .n(n)
2898*4bdc9457SAndroid Build Coastguard Worker             .k(k)
2899*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
2900*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
2901*4bdc9457SAndroid Build Coastguard Worker         }
2902*4bdc9457SAndroid Build Coastguard Worker       }
2903*4bdc9457SAndroid Build Coastguard Worker     }
2904*4bdc9457SAndroid Build Coastguard Worker   }
2905*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,n_gt_8)2906*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, n_gt_8) {
2907*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
2908*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
2909*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2910*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
2911*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2912*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2913*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
2914*4bdc9457SAndroid Build Coastguard Worker           .m(6)
2915*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2916*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2917*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
2918*4bdc9457SAndroid Build Coastguard Worker       }
2919*4bdc9457SAndroid Build Coastguard Worker     }
2920*4bdc9457SAndroid Build Coastguard Worker   }
2921*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,n_gt_8_strided_cn)2922*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, n_gt_8_strided_cn) {
2923*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
2924*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
2925*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2926*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
2927*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2928*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2929*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
2930*4bdc9457SAndroid Build Coastguard Worker           .m(6)
2931*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2932*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2933*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
2934*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
2935*4bdc9457SAndroid Build Coastguard Worker       }
2936*4bdc9457SAndroid Build Coastguard Worker     }
2937*4bdc9457SAndroid Build Coastguard Worker   }
2938*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,n_gt_8_subtile)2939*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, n_gt_8_subtile) {
2940*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
2941*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
2942*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
2943*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2944*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
2945*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2946*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2947*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
2948*4bdc9457SAndroid Build Coastguard Worker             .m(m)
2949*4bdc9457SAndroid Build Coastguard Worker             .n(n)
2950*4bdc9457SAndroid Build Coastguard Worker             .k(k)
2951*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
2952*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
2953*4bdc9457SAndroid Build Coastguard Worker         }
2954*4bdc9457SAndroid Build Coastguard Worker       }
2955*4bdc9457SAndroid Build Coastguard Worker     }
2956*4bdc9457SAndroid Build Coastguard Worker   }
2957*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,n_div_8)2958*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, n_div_8) {
2959*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
2960*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
2961*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2962*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
2963*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2964*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2965*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
2966*4bdc9457SAndroid Build Coastguard Worker           .m(6)
2967*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2968*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2969*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
2970*4bdc9457SAndroid Build Coastguard Worker       }
2971*4bdc9457SAndroid Build Coastguard Worker     }
2972*4bdc9457SAndroid Build Coastguard Worker   }
2973*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,n_div_8_strided_cn)2974*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, n_div_8_strided_cn) {
2975*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
2976*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
2977*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
2978*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
2979*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
2980*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
2981*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
2982*4bdc9457SAndroid Build Coastguard Worker           .m(6)
2983*4bdc9457SAndroid Build Coastguard Worker           .n(n)
2984*4bdc9457SAndroid Build Coastguard Worker           .k(k)
2985*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
2986*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
2987*4bdc9457SAndroid Build Coastguard Worker       }
2988*4bdc9457SAndroid Build Coastguard Worker     }
2989*4bdc9457SAndroid Build Coastguard Worker   }
2990*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,n_div_8_subtile)2991*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, n_div_8_subtile) {
2992*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
2993*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
2994*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
2995*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
2996*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
2997*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
2998*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
2999*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
3000*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3001*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3002*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3003*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3004*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
3005*4bdc9457SAndroid Build Coastguard Worker         }
3006*4bdc9457SAndroid Build Coastguard Worker       }
3007*4bdc9457SAndroid Build Coastguard Worker     }
3008*4bdc9457SAndroid Build Coastguard Worker   }
3009*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,small_kernel)3010*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, small_kernel) {
3011*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
3012*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
3013*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
3014*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
3015*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
3016*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
3017*4bdc9457SAndroid Build Coastguard Worker         .m(6)
3018*4bdc9457SAndroid Build Coastguard Worker         .n(8)
3019*4bdc9457SAndroid Build Coastguard Worker         .k(k)
3020*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
3021*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
3022*4bdc9457SAndroid Build Coastguard Worker     }
3023*4bdc9457SAndroid Build Coastguard Worker   }
3024*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,small_kernel_subtile)3025*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, small_kernel_subtile) {
3026*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
3027*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
3028*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
3029*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
3030*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
3031*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
3032*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
3033*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
3034*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3035*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3036*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3037*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
3038*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3039*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
3040*4bdc9457SAndroid Build Coastguard Worker         }
3041*4bdc9457SAndroid Build Coastguard Worker       }
3042*4bdc9457SAndroid Build Coastguard Worker     }
3043*4bdc9457SAndroid Build Coastguard Worker   }
3044*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,n_gt_8_small_kernel)3045*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, n_gt_8_small_kernel) {
3046*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
3047*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3048*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3049*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
3050*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3051*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3052*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
3053*4bdc9457SAndroid Build Coastguard Worker           .m(6)
3054*4bdc9457SAndroid Build Coastguard Worker           .n(n)
3055*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3056*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
3057*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
3058*4bdc9457SAndroid Build Coastguard Worker       }
3059*4bdc9457SAndroid Build Coastguard Worker     }
3060*4bdc9457SAndroid Build Coastguard Worker   }
3061*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,n_div_8_small_kernel)3062*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, n_div_8_small_kernel) {
3063*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
3064*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3065*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3066*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
3067*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3068*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3069*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
3070*4bdc9457SAndroid Build Coastguard Worker           .m(6)
3071*4bdc9457SAndroid Build Coastguard Worker           .n(n)
3072*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3073*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
3074*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
3075*4bdc9457SAndroid Build Coastguard Worker       }
3076*4bdc9457SAndroid Build Coastguard Worker     }
3077*4bdc9457SAndroid Build Coastguard Worker   }
3078*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,strided_cm_subtile)3079*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, strided_cm_subtile) {
3080*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
3081*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
3082*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
3083*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
3084*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
3085*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
3086*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
3087*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
3088*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3089*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3090*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3091*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(11)
3092*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3093*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
3094*4bdc9457SAndroid Build Coastguard Worker         }
3095*4bdc9457SAndroid Build Coastguard Worker       }
3096*4bdc9457SAndroid Build Coastguard Worker     }
3097*4bdc9457SAndroid Build Coastguard Worker   }
3098*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,a_offset)3099*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, a_offset) {
3100*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
3101*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
3102*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
3103*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
3104*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
3105*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
3106*4bdc9457SAndroid Build Coastguard Worker         .m(6)
3107*4bdc9457SAndroid Build Coastguard Worker         .n(8)
3108*4bdc9457SAndroid Build Coastguard Worker         .k(k)
3109*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
3110*4bdc9457SAndroid Build Coastguard Worker         .a_offset(127)
3111*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
3112*4bdc9457SAndroid Build Coastguard Worker     }
3113*4bdc9457SAndroid Build Coastguard Worker   }
3114*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,zero)3115*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, zero) {
3116*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
3117*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 6; mz++) {
3118*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3119*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
3120*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3121*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3122*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
3123*4bdc9457SAndroid Build Coastguard Worker           .m(6)
3124*4bdc9457SAndroid Build Coastguard Worker           .n(8)
3125*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3126*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
3127*4bdc9457SAndroid Build Coastguard Worker           .a_offset(127)
3128*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
3129*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
3130*4bdc9457SAndroid Build Coastguard Worker       }
3131*4bdc9457SAndroid Build Coastguard Worker     }
3132*4bdc9457SAndroid Build Coastguard Worker   }
3133*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD,strided_cm)3134*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMSIMD, strided_cm) {
3135*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
3136*4bdc9457SAndroid Build Coastguard Worker       .mr(6)
3137*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
3138*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
3139*4bdc9457SAndroid Build Coastguard Worker       .sr(4)
3140*4bdc9457SAndroid Build Coastguard Worker       .m(6)
3141*4bdc9457SAndroid Build Coastguard Worker       .n(8)
3142*4bdc9457SAndroid Build Coastguard Worker       .k(4)
3143*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(11)
3144*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmsimd);
3145*4bdc9457SAndroid Build Coastguard Worker   }
3146*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
3147*4bdc9457SAndroid Build Coastguard Worker 
3148*4bdc9457SAndroid Build Coastguard Worker 
3149*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4)3150*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4) {
3151*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
3152*4bdc9457SAndroid Build Coastguard Worker       .mr(1)
3153*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
3154*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
3155*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
3156*4bdc9457SAndroid Build Coastguard Worker       .m(1)
3157*4bdc9457SAndroid Build Coastguard Worker       .n(8)
3158*4bdc9457SAndroid Build Coastguard Worker       .k(4)
3159*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3160*4bdc9457SAndroid Build Coastguard Worker   }
3161*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,strided_cn)3162*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cn) {
3163*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
3164*4bdc9457SAndroid Build Coastguard Worker       .mr(1)
3165*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
3166*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
3167*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
3168*4bdc9457SAndroid Build Coastguard Worker       .m(1)
3169*4bdc9457SAndroid Build Coastguard Worker       .n(8)
3170*4bdc9457SAndroid Build Coastguard Worker       .k(4)
3171*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(11)
3172*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3173*4bdc9457SAndroid Build Coastguard Worker   }
3174*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4_subtile)3175*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile) {
3176*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
3177*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 1; m++) {
3178*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3179*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
3180*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3181*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3182*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
3183*4bdc9457SAndroid Build Coastguard Worker           .m(m)
3184*4bdc9457SAndroid Build Coastguard Worker           .n(n)
3185*4bdc9457SAndroid Build Coastguard Worker           .k(4)
3186*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
3187*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3188*4bdc9457SAndroid Build Coastguard Worker       }
3189*4bdc9457SAndroid Build Coastguard Worker     }
3190*4bdc9457SAndroid Build Coastguard Worker   }
3191*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4_subtile_m)3192*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_m) {
3193*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 1; m++) {
3194*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
3195*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
3196*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
3197*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
3198*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
3199*4bdc9457SAndroid Build Coastguard Worker         .m(m)
3200*4bdc9457SAndroid Build Coastguard Worker         .n(8)
3201*4bdc9457SAndroid Build Coastguard Worker         .k(4)
3202*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
3203*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3204*4bdc9457SAndroid Build Coastguard Worker     }
3205*4bdc9457SAndroid Build Coastguard Worker   }
3206*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4_subtile_n)3207*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_n) {
3208*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
3209*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
3210*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
3211*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
3212*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
3213*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
3214*4bdc9457SAndroid Build Coastguard Worker         .m(1)
3215*4bdc9457SAndroid Build Coastguard Worker         .n(n)
3216*4bdc9457SAndroid Build Coastguard Worker         .k(4)
3217*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
3218*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3219*4bdc9457SAndroid Build Coastguard Worker     }
3220*4bdc9457SAndroid Build Coastguard Worker   }
3221*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,k_lt_4)3222*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4) {
3223*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
3224*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
3225*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
3226*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
3227*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
3228*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
3229*4bdc9457SAndroid Build Coastguard Worker         .m(1)
3230*4bdc9457SAndroid Build Coastguard Worker         .n(8)
3231*4bdc9457SAndroid Build Coastguard Worker         .k(k)
3232*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3233*4bdc9457SAndroid Build Coastguard Worker     }
3234*4bdc9457SAndroid Build Coastguard Worker   }
3235*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,k_lt_4_subtile)3236*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4_subtile) {
3237*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
3238*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
3239*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
3240*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
3241*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
3242*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
3243*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
3244*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
3245*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3246*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3247*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3248*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3249*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3250*4bdc9457SAndroid Build Coastguard Worker         }
3251*4bdc9457SAndroid Build Coastguard Worker       }
3252*4bdc9457SAndroid Build Coastguard Worker     }
3253*4bdc9457SAndroid Build Coastguard Worker   }
3254*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,k_gt_4)3255*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4) {
3256*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
3257*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
3258*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
3259*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
3260*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
3261*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
3262*4bdc9457SAndroid Build Coastguard Worker         .m(1)
3263*4bdc9457SAndroid Build Coastguard Worker         .n(8)
3264*4bdc9457SAndroid Build Coastguard Worker         .k(k)
3265*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3266*4bdc9457SAndroid Build Coastguard Worker     }
3267*4bdc9457SAndroid Build Coastguard Worker   }
3268*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,k_gt_4_subtile)3269*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4_subtile) {
3270*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
3271*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
3272*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
3273*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
3274*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
3275*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
3276*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
3277*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
3278*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3279*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3280*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3281*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3282*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3283*4bdc9457SAndroid Build Coastguard Worker         }
3284*4bdc9457SAndroid Build Coastguard Worker       }
3285*4bdc9457SAndroid Build Coastguard Worker     }
3286*4bdc9457SAndroid Build Coastguard Worker   }
3287*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,k_div_4)3288*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4) {
3289*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
3290*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
3291*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
3292*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
3293*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
3294*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
3295*4bdc9457SAndroid Build Coastguard Worker         .m(1)
3296*4bdc9457SAndroid Build Coastguard Worker         .n(8)
3297*4bdc9457SAndroid Build Coastguard Worker         .k(k)
3298*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3299*4bdc9457SAndroid Build Coastguard Worker     }
3300*4bdc9457SAndroid Build Coastguard Worker   }
3301*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,k_div_4_subtile)3302*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4_subtile) {
3303*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
3304*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
3305*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
3306*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
3307*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
3308*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
3309*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
3310*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
3311*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3312*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3313*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3314*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3315*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3316*4bdc9457SAndroid Build Coastguard Worker         }
3317*4bdc9457SAndroid Build Coastguard Worker       }
3318*4bdc9457SAndroid Build Coastguard Worker     }
3319*4bdc9457SAndroid Build Coastguard Worker   }
3320*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8)3321*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8) {
3322*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
3323*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3324*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3325*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
3326*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3327*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3328*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
3329*4bdc9457SAndroid Build Coastguard Worker           .m(1)
3330*4bdc9457SAndroid Build Coastguard Worker           .n(n)
3331*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3332*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3333*4bdc9457SAndroid Build Coastguard Worker       }
3334*4bdc9457SAndroid Build Coastguard Worker     }
3335*4bdc9457SAndroid Build Coastguard Worker   }
3336*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8_strided_cn)3337*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_strided_cn) {
3338*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
3339*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3340*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3341*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
3342*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3343*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3344*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
3345*4bdc9457SAndroid Build Coastguard Worker           .m(1)
3346*4bdc9457SAndroid Build Coastguard Worker           .n(n)
3347*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3348*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
3349*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3350*4bdc9457SAndroid Build Coastguard Worker       }
3351*4bdc9457SAndroid Build Coastguard Worker     }
3352*4bdc9457SAndroid Build Coastguard Worker   }
3353*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8_subtile)3354*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_subtile) {
3355*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
3356*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3357*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
3358*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
3359*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
3360*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
3361*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
3362*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
3363*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3364*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3365*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3366*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3367*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3368*4bdc9457SAndroid Build Coastguard Worker         }
3369*4bdc9457SAndroid Build Coastguard Worker       }
3370*4bdc9457SAndroid Build Coastguard Worker     }
3371*4bdc9457SAndroid Build Coastguard Worker   }
3372*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8)3373*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8) {
3374*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
3375*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3376*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3377*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
3378*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3379*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3380*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
3381*4bdc9457SAndroid Build Coastguard Worker           .m(1)
3382*4bdc9457SAndroid Build Coastguard Worker           .n(n)
3383*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3384*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3385*4bdc9457SAndroid Build Coastguard Worker       }
3386*4bdc9457SAndroid Build Coastguard Worker     }
3387*4bdc9457SAndroid Build Coastguard Worker   }
3388*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8_strided_cn)3389*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_strided_cn) {
3390*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
3391*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3392*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3393*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
3394*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3395*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3396*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
3397*4bdc9457SAndroid Build Coastguard Worker           .m(1)
3398*4bdc9457SAndroid Build Coastguard Worker           .n(n)
3399*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3400*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
3401*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3402*4bdc9457SAndroid Build Coastguard Worker       }
3403*4bdc9457SAndroid Build Coastguard Worker     }
3404*4bdc9457SAndroid Build Coastguard Worker   }
3405*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8_subtile)3406*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_subtile) {
3407*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
3408*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3409*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
3410*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
3411*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
3412*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
3413*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
3414*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
3415*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3416*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3417*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3418*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3419*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3420*4bdc9457SAndroid Build Coastguard Worker         }
3421*4bdc9457SAndroid Build Coastguard Worker       }
3422*4bdc9457SAndroid Build Coastguard Worker     }
3423*4bdc9457SAndroid Build Coastguard Worker   }
3424*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,small_kernel)3425*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, small_kernel) {
3426*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
3427*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
3428*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
3429*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
3430*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
3431*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
3432*4bdc9457SAndroid Build Coastguard Worker         .m(1)
3433*4bdc9457SAndroid Build Coastguard Worker         .n(8)
3434*4bdc9457SAndroid Build Coastguard Worker         .k(k)
3435*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
3436*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3437*4bdc9457SAndroid Build Coastguard Worker     }
3438*4bdc9457SAndroid Build Coastguard Worker   }
3439*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,small_kernel_subtile)3440*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, small_kernel_subtile) {
3441*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
3442*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
3443*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
3444*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
3445*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
3446*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
3447*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
3448*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
3449*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3450*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3451*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3452*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
3453*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3454*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3455*4bdc9457SAndroid Build Coastguard Worker         }
3456*4bdc9457SAndroid Build Coastguard Worker       }
3457*4bdc9457SAndroid Build Coastguard Worker     }
3458*4bdc9457SAndroid Build Coastguard Worker   }
3459*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8_small_kernel)3460*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_small_kernel) {
3461*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
3462*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3463*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3464*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
3465*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3466*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3467*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
3468*4bdc9457SAndroid Build Coastguard Worker           .m(1)
3469*4bdc9457SAndroid Build Coastguard Worker           .n(n)
3470*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3471*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
3472*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3473*4bdc9457SAndroid Build Coastguard Worker       }
3474*4bdc9457SAndroid Build Coastguard Worker     }
3475*4bdc9457SAndroid Build Coastguard Worker   }
3476*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8_small_kernel)3477*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_small_kernel) {
3478*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
3479*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3480*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3481*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
3482*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3483*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3484*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
3485*4bdc9457SAndroid Build Coastguard Worker           .m(1)
3486*4bdc9457SAndroid Build Coastguard Worker           .n(n)
3487*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3488*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
3489*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3490*4bdc9457SAndroid Build Coastguard Worker       }
3491*4bdc9457SAndroid Build Coastguard Worker     }
3492*4bdc9457SAndroid Build Coastguard Worker   }
3493*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,strided_cm_subtile)3494*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm_subtile) {
3495*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
3496*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
3497*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
3498*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
3499*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
3500*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
3501*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
3502*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
3503*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3504*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3505*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3506*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(11)
3507*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3508*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3509*4bdc9457SAndroid Build Coastguard Worker         }
3510*4bdc9457SAndroid Build Coastguard Worker       }
3511*4bdc9457SAndroid Build Coastguard Worker     }
3512*4bdc9457SAndroid Build Coastguard Worker   }
3513*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,a_offset)3514*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, a_offset) {
3515*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
3516*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
3517*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
3518*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
3519*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
3520*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
3521*4bdc9457SAndroid Build Coastguard Worker         .m(1)
3522*4bdc9457SAndroid Build Coastguard Worker         .n(8)
3523*4bdc9457SAndroid Build Coastguard Worker         .k(k)
3524*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
3525*4bdc9457SAndroid Build Coastguard Worker         .a_offset(23)
3526*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3527*4bdc9457SAndroid Build Coastguard Worker     }
3528*4bdc9457SAndroid Build Coastguard Worker   }
3529*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,zero)3530*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, zero) {
3531*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
3532*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 1; mz++) {
3533*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3534*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
3535*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3536*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3537*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
3538*4bdc9457SAndroid Build Coastguard Worker           .m(1)
3539*4bdc9457SAndroid Build Coastguard Worker           .n(8)
3540*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3541*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
3542*4bdc9457SAndroid Build Coastguard Worker           .a_offset(23)
3543*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
3544*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3545*4bdc9457SAndroid Build Coastguard Worker       }
3546*4bdc9457SAndroid Build Coastguard Worker     }
3547*4bdc9457SAndroid Build Coastguard Worker   }
3548*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT,strided_cm)3549*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm) {
3550*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
3551*4bdc9457SAndroid Build Coastguard Worker       .mr(1)
3552*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
3553*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
3554*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
3555*4bdc9457SAndroid Build Coastguard Worker       .m(1)
3556*4bdc9457SAndroid Build Coastguard Worker       .n(8)
3557*4bdc9457SAndroid Build Coastguard Worker       .k(4)
3558*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(11)
3559*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
3560*4bdc9457SAndroid Build Coastguard Worker   }
3561*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMRELAXEDSIMD
3562*4bdc9457SAndroid Build Coastguard Worker 
3563*4bdc9457SAndroid Build Coastguard Worker 
3564*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_eq_4)3565*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_eq_4) {
3566*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
3567*4bdc9457SAndroid Build Coastguard Worker       .mr(1)
3568*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
3569*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
3570*4bdc9457SAndroid Build Coastguard Worker       .sr(4)
3571*4bdc9457SAndroid Build Coastguard Worker       .m(1)
3572*4bdc9457SAndroid Build Coastguard Worker       .n(8)
3573*4bdc9457SAndroid Build Coastguard Worker       .k(4)
3574*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3575*4bdc9457SAndroid Build Coastguard Worker   }
3576*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,strided_cn)3577*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, strided_cn) {
3578*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
3579*4bdc9457SAndroid Build Coastguard Worker       .mr(1)
3580*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
3581*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
3582*4bdc9457SAndroid Build Coastguard Worker       .sr(4)
3583*4bdc9457SAndroid Build Coastguard Worker       .m(1)
3584*4bdc9457SAndroid Build Coastguard Worker       .n(8)
3585*4bdc9457SAndroid Build Coastguard Worker       .k(4)
3586*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(11)
3587*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3588*4bdc9457SAndroid Build Coastguard Worker   }
3589*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile)3590*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile) {
3591*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
3592*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 1; m++) {
3593*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3594*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
3595*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3596*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3597*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
3598*4bdc9457SAndroid Build Coastguard Worker           .m(m)
3599*4bdc9457SAndroid Build Coastguard Worker           .n(n)
3600*4bdc9457SAndroid Build Coastguard Worker           .k(4)
3601*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
3602*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3603*4bdc9457SAndroid Build Coastguard Worker       }
3604*4bdc9457SAndroid Build Coastguard Worker     }
3605*4bdc9457SAndroid Build Coastguard Worker   }
3606*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile_m)3607*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_m) {
3608*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 1; m++) {
3609*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
3610*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
3611*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
3612*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
3613*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
3614*4bdc9457SAndroid Build Coastguard Worker         .m(m)
3615*4bdc9457SAndroid Build Coastguard Worker         .n(8)
3616*4bdc9457SAndroid Build Coastguard Worker         .k(4)
3617*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
3618*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3619*4bdc9457SAndroid Build Coastguard Worker     }
3620*4bdc9457SAndroid Build Coastguard Worker   }
3621*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile_n)3622*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_n) {
3623*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
3624*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
3625*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
3626*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
3627*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
3628*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
3629*4bdc9457SAndroid Build Coastguard Worker         .m(1)
3630*4bdc9457SAndroid Build Coastguard Worker         .n(n)
3631*4bdc9457SAndroid Build Coastguard Worker         .k(4)
3632*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
3633*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3634*4bdc9457SAndroid Build Coastguard Worker     }
3635*4bdc9457SAndroid Build Coastguard Worker   }
3636*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_lt_4)3637*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_lt_4) {
3638*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
3639*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
3640*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
3641*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
3642*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
3643*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
3644*4bdc9457SAndroid Build Coastguard Worker         .m(1)
3645*4bdc9457SAndroid Build Coastguard Worker         .n(8)
3646*4bdc9457SAndroid Build Coastguard Worker         .k(k)
3647*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3648*4bdc9457SAndroid Build Coastguard Worker     }
3649*4bdc9457SAndroid Build Coastguard Worker   }
3650*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_lt_4_subtile)3651*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_subtile) {
3652*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
3653*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
3654*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
3655*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
3656*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
3657*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
3658*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
3659*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
3660*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3661*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3662*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3663*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3664*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3665*4bdc9457SAndroid Build Coastguard Worker         }
3666*4bdc9457SAndroid Build Coastguard Worker       }
3667*4bdc9457SAndroid Build Coastguard Worker     }
3668*4bdc9457SAndroid Build Coastguard Worker   }
3669*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_gt_4)3670*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_gt_4) {
3671*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
3672*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
3673*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
3674*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
3675*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
3676*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
3677*4bdc9457SAndroid Build Coastguard Worker         .m(1)
3678*4bdc9457SAndroid Build Coastguard Worker         .n(8)
3679*4bdc9457SAndroid Build Coastguard Worker         .k(k)
3680*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3681*4bdc9457SAndroid Build Coastguard Worker     }
3682*4bdc9457SAndroid Build Coastguard Worker   }
3683*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_gt_4_subtile)3684*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_subtile) {
3685*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
3686*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
3687*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
3688*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
3689*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
3690*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
3691*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
3692*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
3693*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3694*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3695*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3696*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3697*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3698*4bdc9457SAndroid Build Coastguard Worker         }
3699*4bdc9457SAndroid Build Coastguard Worker       }
3700*4bdc9457SAndroid Build Coastguard Worker     }
3701*4bdc9457SAndroid Build Coastguard Worker   }
3702*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_div_4)3703*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_div_4) {
3704*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
3705*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
3706*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
3707*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
3708*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
3709*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
3710*4bdc9457SAndroid Build Coastguard Worker         .m(1)
3711*4bdc9457SAndroid Build Coastguard Worker         .n(8)
3712*4bdc9457SAndroid Build Coastguard Worker         .k(k)
3713*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3714*4bdc9457SAndroid Build Coastguard Worker     }
3715*4bdc9457SAndroid Build Coastguard Worker   }
3716*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_div_4_subtile)3717*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_div_4_subtile) {
3718*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
3719*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
3720*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
3721*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
3722*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
3723*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
3724*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
3725*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
3726*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3727*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3728*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3729*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3730*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3731*4bdc9457SAndroid Build Coastguard Worker         }
3732*4bdc9457SAndroid Build Coastguard Worker       }
3733*4bdc9457SAndroid Build Coastguard Worker     }
3734*4bdc9457SAndroid Build Coastguard Worker   }
3735*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,n_gt_8)3736*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, n_gt_8) {
3737*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
3738*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3739*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3740*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
3741*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3742*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3743*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
3744*4bdc9457SAndroid Build Coastguard Worker           .m(1)
3745*4bdc9457SAndroid Build Coastguard Worker           .n(n)
3746*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3747*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3748*4bdc9457SAndroid Build Coastguard Worker       }
3749*4bdc9457SAndroid Build Coastguard Worker     }
3750*4bdc9457SAndroid Build Coastguard Worker   }
3751*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_strided_cn)3752*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_cn) {
3753*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
3754*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3755*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3756*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
3757*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3758*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3759*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
3760*4bdc9457SAndroid Build Coastguard Worker           .m(1)
3761*4bdc9457SAndroid Build Coastguard Worker           .n(n)
3762*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3763*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
3764*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3765*4bdc9457SAndroid Build Coastguard Worker       }
3766*4bdc9457SAndroid Build Coastguard Worker     }
3767*4bdc9457SAndroid Build Coastguard Worker   }
3768*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_subtile)3769*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_subtile) {
3770*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
3771*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3772*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
3773*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
3774*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
3775*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
3776*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
3777*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
3778*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3779*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3780*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3781*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3782*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3783*4bdc9457SAndroid Build Coastguard Worker         }
3784*4bdc9457SAndroid Build Coastguard Worker       }
3785*4bdc9457SAndroid Build Coastguard Worker     }
3786*4bdc9457SAndroid Build Coastguard Worker   }
3787*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,n_div_8)3788*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, n_div_8) {
3789*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
3790*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3791*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3792*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
3793*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3794*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3795*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
3796*4bdc9457SAndroid Build Coastguard Worker           .m(1)
3797*4bdc9457SAndroid Build Coastguard Worker           .n(n)
3798*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3799*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3800*4bdc9457SAndroid Build Coastguard Worker       }
3801*4bdc9457SAndroid Build Coastguard Worker     }
3802*4bdc9457SAndroid Build Coastguard Worker   }
3803*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,n_div_8_strided_cn)3804*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_cn) {
3805*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
3806*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3807*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3808*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
3809*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3810*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3811*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
3812*4bdc9457SAndroid Build Coastguard Worker           .m(1)
3813*4bdc9457SAndroid Build Coastguard Worker           .n(n)
3814*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3815*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
3816*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3817*4bdc9457SAndroid Build Coastguard Worker       }
3818*4bdc9457SAndroid Build Coastguard Worker     }
3819*4bdc9457SAndroid Build Coastguard Worker   }
3820*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,n_div_8_subtile)3821*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, n_div_8_subtile) {
3822*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
3823*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3824*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
3825*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
3826*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
3827*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
3828*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
3829*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
3830*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3831*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3832*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3833*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3834*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3835*4bdc9457SAndroid Build Coastguard Worker         }
3836*4bdc9457SAndroid Build Coastguard Worker       }
3837*4bdc9457SAndroid Build Coastguard Worker     }
3838*4bdc9457SAndroid Build Coastguard Worker   }
3839*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,small_kernel)3840*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, small_kernel) {
3841*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
3842*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
3843*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
3844*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
3845*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
3846*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
3847*4bdc9457SAndroid Build Coastguard Worker         .m(1)
3848*4bdc9457SAndroid Build Coastguard Worker         .n(8)
3849*4bdc9457SAndroid Build Coastguard Worker         .k(k)
3850*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
3851*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3852*4bdc9457SAndroid Build Coastguard Worker     }
3853*4bdc9457SAndroid Build Coastguard Worker   }
3854*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,small_kernel_subtile)3855*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, small_kernel_subtile) {
3856*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
3857*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
3858*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
3859*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
3860*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
3861*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
3862*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
3863*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
3864*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3865*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3866*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3867*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
3868*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3869*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3870*4bdc9457SAndroid Build Coastguard Worker         }
3871*4bdc9457SAndroid Build Coastguard Worker       }
3872*4bdc9457SAndroid Build Coastguard Worker     }
3873*4bdc9457SAndroid Build Coastguard Worker   }
3874*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_small_kernel)3875*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_small_kernel) {
3876*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
3877*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3878*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3879*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
3880*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3881*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3882*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
3883*4bdc9457SAndroid Build Coastguard Worker           .m(1)
3884*4bdc9457SAndroid Build Coastguard Worker           .n(n)
3885*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3886*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
3887*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3888*4bdc9457SAndroid Build Coastguard Worker       }
3889*4bdc9457SAndroid Build Coastguard Worker     }
3890*4bdc9457SAndroid Build Coastguard Worker   }
3891*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,n_div_8_small_kernel)3892*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, n_div_8_small_kernel) {
3893*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
3894*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
3895*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3896*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
3897*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3898*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3899*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
3900*4bdc9457SAndroid Build Coastguard Worker           .m(1)
3901*4bdc9457SAndroid Build Coastguard Worker           .n(n)
3902*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3903*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
3904*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3905*4bdc9457SAndroid Build Coastguard Worker       }
3906*4bdc9457SAndroid Build Coastguard Worker     }
3907*4bdc9457SAndroid Build Coastguard Worker   }
3908*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,strided_cm_subtile)3909*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, strided_cm_subtile) {
3910*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
3911*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
3912*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
3913*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
3914*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
3915*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
3916*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
3917*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
3918*4bdc9457SAndroid Build Coastguard Worker             .m(m)
3919*4bdc9457SAndroid Build Coastguard Worker             .n(n)
3920*4bdc9457SAndroid Build Coastguard Worker             .k(k)
3921*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(11)
3922*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
3923*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3924*4bdc9457SAndroid Build Coastguard Worker         }
3925*4bdc9457SAndroid Build Coastguard Worker       }
3926*4bdc9457SAndroid Build Coastguard Worker     }
3927*4bdc9457SAndroid Build Coastguard Worker   }
3928*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,a_offset)3929*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, a_offset) {
3930*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
3931*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
3932*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
3933*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
3934*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
3935*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
3936*4bdc9457SAndroid Build Coastguard Worker         .m(1)
3937*4bdc9457SAndroid Build Coastguard Worker         .n(8)
3938*4bdc9457SAndroid Build Coastguard Worker         .k(k)
3939*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
3940*4bdc9457SAndroid Build Coastguard Worker         .a_offset(23)
3941*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3942*4bdc9457SAndroid Build Coastguard Worker     }
3943*4bdc9457SAndroid Build Coastguard Worker   }
3944*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,zero)3945*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, zero) {
3946*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
3947*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 1; mz++) {
3948*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
3949*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
3950*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
3951*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
3952*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
3953*4bdc9457SAndroid Build Coastguard Worker           .m(1)
3954*4bdc9457SAndroid Build Coastguard Worker           .n(8)
3955*4bdc9457SAndroid Build Coastguard Worker           .k(k)
3956*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
3957*4bdc9457SAndroid Build Coastguard Worker           .a_offset(23)
3958*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
3959*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3960*4bdc9457SAndroid Build Coastguard Worker       }
3961*4bdc9457SAndroid Build Coastguard Worker     }
3962*4bdc9457SAndroid Build Coastguard Worker   }
3963*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,strided_cm)3964*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, strided_cm) {
3965*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
3966*4bdc9457SAndroid Build Coastguard Worker       .mr(1)
3967*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
3968*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
3969*4bdc9457SAndroid Build Coastguard Worker       .sr(4)
3970*4bdc9457SAndroid Build Coastguard Worker       .m(1)
3971*4bdc9457SAndroid Build Coastguard Worker       .n(8)
3972*4bdc9457SAndroid Build Coastguard Worker       .k(4)
3973*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(11)
3974*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3975*4bdc9457SAndroid Build Coastguard Worker   }
3976*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMRELAXEDSIMD
3977*4bdc9457SAndroid Build Coastguard Worker 
3978*4bdc9457SAndroid Build Coastguard Worker 
3979*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4)3980*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4) {
3981*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
3982*4bdc9457SAndroid Build Coastguard Worker       .mr(3)
3983*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
3984*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
3985*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
3986*4bdc9457SAndroid Build Coastguard Worker       .m(3)
3987*4bdc9457SAndroid Build Coastguard Worker       .n(8)
3988*4bdc9457SAndroid Build Coastguard Worker       .k(4)
3989*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
3990*4bdc9457SAndroid Build Coastguard Worker   }
3991*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,strided_cn)3992*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cn) {
3993*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
3994*4bdc9457SAndroid Build Coastguard Worker       .mr(3)
3995*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
3996*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
3997*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
3998*4bdc9457SAndroid Build Coastguard Worker       .m(3)
3999*4bdc9457SAndroid Build Coastguard Worker       .n(8)
4000*4bdc9457SAndroid Build Coastguard Worker       .k(4)
4001*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(11)
4002*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4003*4bdc9457SAndroid Build Coastguard Worker   }
4004*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4_subtile)4005*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile) {
4006*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
4007*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 3; m++) {
4008*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4009*4bdc9457SAndroid Build Coastguard Worker           .mr(3)
4010*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
4011*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
4012*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4013*4bdc9457SAndroid Build Coastguard Worker           .m(m)
4014*4bdc9457SAndroid Build Coastguard Worker           .n(n)
4015*4bdc9457SAndroid Build Coastguard Worker           .k(4)
4016*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
4017*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4018*4bdc9457SAndroid Build Coastguard Worker       }
4019*4bdc9457SAndroid Build Coastguard Worker     }
4020*4bdc9457SAndroid Build Coastguard Worker   }
4021*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4_subtile_m)4022*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_m) {
4023*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 3; m++) {
4024*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4025*4bdc9457SAndroid Build Coastguard Worker         .mr(3)
4026*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
4027*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
4028*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4029*4bdc9457SAndroid Build Coastguard Worker         .m(m)
4030*4bdc9457SAndroid Build Coastguard Worker         .n(8)
4031*4bdc9457SAndroid Build Coastguard Worker         .k(4)
4032*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
4033*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4034*4bdc9457SAndroid Build Coastguard Worker     }
4035*4bdc9457SAndroid Build Coastguard Worker   }
4036*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4_subtile_n)4037*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_n) {
4038*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
4039*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4040*4bdc9457SAndroid Build Coastguard Worker         .mr(3)
4041*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
4042*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
4043*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4044*4bdc9457SAndroid Build Coastguard Worker         .m(3)
4045*4bdc9457SAndroid Build Coastguard Worker         .n(n)
4046*4bdc9457SAndroid Build Coastguard Worker         .k(4)
4047*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
4048*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4049*4bdc9457SAndroid Build Coastguard Worker     }
4050*4bdc9457SAndroid Build Coastguard Worker   }
4051*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,k_lt_4)4052*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4) {
4053*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
4054*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4055*4bdc9457SAndroid Build Coastguard Worker         .mr(3)
4056*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
4057*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
4058*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4059*4bdc9457SAndroid Build Coastguard Worker         .m(3)
4060*4bdc9457SAndroid Build Coastguard Worker         .n(8)
4061*4bdc9457SAndroid Build Coastguard Worker         .k(k)
4062*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4063*4bdc9457SAndroid Build Coastguard Worker     }
4064*4bdc9457SAndroid Build Coastguard Worker   }
4065*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,k_lt_4_subtile)4066*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4_subtile) {
4067*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
4068*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
4069*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 3; m++) {
4070*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4071*4bdc9457SAndroid Build Coastguard Worker             .mr(3)
4072*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
4073*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
4074*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4075*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4076*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4077*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4078*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4079*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4080*4bdc9457SAndroid Build Coastguard Worker         }
4081*4bdc9457SAndroid Build Coastguard Worker       }
4082*4bdc9457SAndroid Build Coastguard Worker     }
4083*4bdc9457SAndroid Build Coastguard Worker   }
4084*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,k_gt_4)4085*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4) {
4086*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
4087*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4088*4bdc9457SAndroid Build Coastguard Worker         .mr(3)
4089*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
4090*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
4091*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4092*4bdc9457SAndroid Build Coastguard Worker         .m(3)
4093*4bdc9457SAndroid Build Coastguard Worker         .n(8)
4094*4bdc9457SAndroid Build Coastguard Worker         .k(k)
4095*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4096*4bdc9457SAndroid Build Coastguard Worker     }
4097*4bdc9457SAndroid Build Coastguard Worker   }
4098*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,k_gt_4_subtile)4099*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4_subtile) {
4100*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
4101*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
4102*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 3; m++) {
4103*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4104*4bdc9457SAndroid Build Coastguard Worker             .mr(3)
4105*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
4106*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
4107*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4108*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4109*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4110*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4111*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4112*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4113*4bdc9457SAndroid Build Coastguard Worker         }
4114*4bdc9457SAndroid Build Coastguard Worker       }
4115*4bdc9457SAndroid Build Coastguard Worker     }
4116*4bdc9457SAndroid Build Coastguard Worker   }
4117*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,k_div_4)4118*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4) {
4119*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
4120*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4121*4bdc9457SAndroid Build Coastguard Worker         .mr(3)
4122*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
4123*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
4124*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4125*4bdc9457SAndroid Build Coastguard Worker         .m(3)
4126*4bdc9457SAndroid Build Coastguard Worker         .n(8)
4127*4bdc9457SAndroid Build Coastguard Worker         .k(k)
4128*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4129*4bdc9457SAndroid Build Coastguard Worker     }
4130*4bdc9457SAndroid Build Coastguard Worker   }
4131*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,k_div_4_subtile)4132*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4_subtile) {
4133*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
4134*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
4135*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 3; m++) {
4136*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4137*4bdc9457SAndroid Build Coastguard Worker             .mr(3)
4138*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
4139*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
4140*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4141*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4142*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4143*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4144*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4145*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4146*4bdc9457SAndroid Build Coastguard Worker         }
4147*4bdc9457SAndroid Build Coastguard Worker       }
4148*4bdc9457SAndroid Build Coastguard Worker     }
4149*4bdc9457SAndroid Build Coastguard Worker   }
4150*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8)4151*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8) {
4152*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
4153*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4154*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4155*4bdc9457SAndroid Build Coastguard Worker           .mr(3)
4156*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
4157*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
4158*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4159*4bdc9457SAndroid Build Coastguard Worker           .m(3)
4160*4bdc9457SAndroid Build Coastguard Worker           .n(n)
4161*4bdc9457SAndroid Build Coastguard Worker           .k(k)
4162*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4163*4bdc9457SAndroid Build Coastguard Worker       }
4164*4bdc9457SAndroid Build Coastguard Worker     }
4165*4bdc9457SAndroid Build Coastguard Worker   }
4166*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8_strided_cn)4167*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_strided_cn) {
4168*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
4169*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4170*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4171*4bdc9457SAndroid Build Coastguard Worker           .mr(3)
4172*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
4173*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
4174*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4175*4bdc9457SAndroid Build Coastguard Worker           .m(3)
4176*4bdc9457SAndroid Build Coastguard Worker           .n(n)
4177*4bdc9457SAndroid Build Coastguard Worker           .k(k)
4178*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
4179*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4180*4bdc9457SAndroid Build Coastguard Worker       }
4181*4bdc9457SAndroid Build Coastguard Worker     }
4182*4bdc9457SAndroid Build Coastguard Worker   }
4183*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8_subtile)4184*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_subtile) {
4185*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
4186*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4187*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 3; m++) {
4188*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4189*4bdc9457SAndroid Build Coastguard Worker             .mr(3)
4190*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
4191*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
4192*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4193*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4194*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4195*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4196*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4197*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4198*4bdc9457SAndroid Build Coastguard Worker         }
4199*4bdc9457SAndroid Build Coastguard Worker       }
4200*4bdc9457SAndroid Build Coastguard Worker     }
4201*4bdc9457SAndroid Build Coastguard Worker   }
4202*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8)4203*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8) {
4204*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
4205*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4206*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4207*4bdc9457SAndroid Build Coastguard Worker           .mr(3)
4208*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
4209*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
4210*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4211*4bdc9457SAndroid Build Coastguard Worker           .m(3)
4212*4bdc9457SAndroid Build Coastguard Worker           .n(n)
4213*4bdc9457SAndroid Build Coastguard Worker           .k(k)
4214*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4215*4bdc9457SAndroid Build Coastguard Worker       }
4216*4bdc9457SAndroid Build Coastguard Worker     }
4217*4bdc9457SAndroid Build Coastguard Worker   }
4218*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8_strided_cn)4219*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_strided_cn) {
4220*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
4221*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4222*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4223*4bdc9457SAndroid Build Coastguard Worker           .mr(3)
4224*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
4225*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
4226*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4227*4bdc9457SAndroid Build Coastguard Worker           .m(3)
4228*4bdc9457SAndroid Build Coastguard Worker           .n(n)
4229*4bdc9457SAndroid Build Coastguard Worker           .k(k)
4230*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
4231*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4232*4bdc9457SAndroid Build Coastguard Worker       }
4233*4bdc9457SAndroid Build Coastguard Worker     }
4234*4bdc9457SAndroid Build Coastguard Worker   }
4235*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8_subtile)4236*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_subtile) {
4237*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
4238*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4239*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 3; m++) {
4240*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4241*4bdc9457SAndroid Build Coastguard Worker             .mr(3)
4242*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
4243*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
4244*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4245*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4246*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4247*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4248*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4249*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4250*4bdc9457SAndroid Build Coastguard Worker         }
4251*4bdc9457SAndroid Build Coastguard Worker       }
4252*4bdc9457SAndroid Build Coastguard Worker     }
4253*4bdc9457SAndroid Build Coastguard Worker   }
4254*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,small_kernel)4255*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, small_kernel) {
4256*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
4257*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4258*4bdc9457SAndroid Build Coastguard Worker         .mr(3)
4259*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
4260*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
4261*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4262*4bdc9457SAndroid Build Coastguard Worker         .m(3)
4263*4bdc9457SAndroid Build Coastguard Worker         .n(8)
4264*4bdc9457SAndroid Build Coastguard Worker         .k(k)
4265*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
4266*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4267*4bdc9457SAndroid Build Coastguard Worker     }
4268*4bdc9457SAndroid Build Coastguard Worker   }
4269*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,small_kernel_subtile)4270*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, small_kernel_subtile) {
4271*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
4272*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
4273*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 3; m++) {
4274*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4275*4bdc9457SAndroid Build Coastguard Worker             .mr(3)
4276*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
4277*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
4278*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4279*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4280*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4281*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4282*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
4283*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4284*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4285*4bdc9457SAndroid Build Coastguard Worker         }
4286*4bdc9457SAndroid Build Coastguard Worker       }
4287*4bdc9457SAndroid Build Coastguard Worker     }
4288*4bdc9457SAndroid Build Coastguard Worker   }
4289*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8_small_kernel)4290*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_small_kernel) {
4291*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
4292*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4293*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4294*4bdc9457SAndroid Build Coastguard Worker           .mr(3)
4295*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
4296*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
4297*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4298*4bdc9457SAndroid Build Coastguard Worker           .m(3)
4299*4bdc9457SAndroid Build Coastguard Worker           .n(n)
4300*4bdc9457SAndroid Build Coastguard Worker           .k(k)
4301*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
4302*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4303*4bdc9457SAndroid Build Coastguard Worker       }
4304*4bdc9457SAndroid Build Coastguard Worker     }
4305*4bdc9457SAndroid Build Coastguard Worker   }
4306*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8_small_kernel)4307*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_small_kernel) {
4308*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
4309*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4310*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4311*4bdc9457SAndroid Build Coastguard Worker           .mr(3)
4312*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
4313*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
4314*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4315*4bdc9457SAndroid Build Coastguard Worker           .m(3)
4316*4bdc9457SAndroid Build Coastguard Worker           .n(n)
4317*4bdc9457SAndroid Build Coastguard Worker           .k(k)
4318*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
4319*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4320*4bdc9457SAndroid Build Coastguard Worker       }
4321*4bdc9457SAndroid Build Coastguard Worker     }
4322*4bdc9457SAndroid Build Coastguard Worker   }
4323*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,strided_cm_subtile)4324*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm_subtile) {
4325*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
4326*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
4327*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 3; m++) {
4328*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4329*4bdc9457SAndroid Build Coastguard Worker             .mr(3)
4330*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
4331*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
4332*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4333*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4334*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4335*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4336*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(11)
4337*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4338*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4339*4bdc9457SAndroid Build Coastguard Worker         }
4340*4bdc9457SAndroid Build Coastguard Worker       }
4341*4bdc9457SAndroid Build Coastguard Worker     }
4342*4bdc9457SAndroid Build Coastguard Worker   }
4343*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,a_offset)4344*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, a_offset) {
4345*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
4346*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4347*4bdc9457SAndroid Build Coastguard Worker         .mr(3)
4348*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
4349*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
4350*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4351*4bdc9457SAndroid Build Coastguard Worker         .m(3)
4352*4bdc9457SAndroid Build Coastguard Worker         .n(8)
4353*4bdc9457SAndroid Build Coastguard Worker         .k(k)
4354*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
4355*4bdc9457SAndroid Build Coastguard Worker         .a_offset(67)
4356*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4357*4bdc9457SAndroid Build Coastguard Worker     }
4358*4bdc9457SAndroid Build Coastguard Worker   }
4359*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,zero)4360*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, zero) {
4361*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
4362*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 3; mz++) {
4363*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4364*4bdc9457SAndroid Build Coastguard Worker           .mr(3)
4365*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
4366*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
4367*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4368*4bdc9457SAndroid Build Coastguard Worker           .m(3)
4369*4bdc9457SAndroid Build Coastguard Worker           .n(8)
4370*4bdc9457SAndroid Build Coastguard Worker           .k(k)
4371*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
4372*4bdc9457SAndroid Build Coastguard Worker           .a_offset(67)
4373*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
4374*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4375*4bdc9457SAndroid Build Coastguard Worker       }
4376*4bdc9457SAndroid Build Coastguard Worker     }
4377*4bdc9457SAndroid Build Coastguard Worker   }
4378*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT,strided_cm)4379*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm) {
4380*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
4381*4bdc9457SAndroid Build Coastguard Worker       .mr(3)
4382*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
4383*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
4384*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
4385*4bdc9457SAndroid Build Coastguard Worker       .m(3)
4386*4bdc9457SAndroid Build Coastguard Worker       .n(8)
4387*4bdc9457SAndroid Build Coastguard Worker       .k(4)
4388*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(11)
4389*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
4390*4bdc9457SAndroid Build Coastguard Worker   }
4391*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMRELAXEDSIMD
4392*4bdc9457SAndroid Build Coastguard Worker 
4393*4bdc9457SAndroid Build Coastguard Worker 
4394*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_eq_4)4395*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_eq_4) {
4396*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
4397*4bdc9457SAndroid Build Coastguard Worker       .mr(4)
4398*4bdc9457SAndroid Build Coastguard Worker       .nr(2)
4399*4bdc9457SAndroid Build Coastguard Worker       .kr(4)
4400*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
4401*4bdc9457SAndroid Build Coastguard Worker       .m(4)
4402*4bdc9457SAndroid Build Coastguard Worker       .n(2)
4403*4bdc9457SAndroid Build Coastguard Worker       .k(4)
4404*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4405*4bdc9457SAndroid Build Coastguard Worker   }
4406*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,strided_cn)4407*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, strided_cn) {
4408*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
4409*4bdc9457SAndroid Build Coastguard Worker       .mr(4)
4410*4bdc9457SAndroid Build Coastguard Worker       .nr(2)
4411*4bdc9457SAndroid Build Coastguard Worker       .kr(4)
4412*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
4413*4bdc9457SAndroid Build Coastguard Worker       .m(4)
4414*4bdc9457SAndroid Build Coastguard Worker       .n(2)
4415*4bdc9457SAndroid Build Coastguard Worker       .k(4)
4416*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(5)
4417*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4418*4bdc9457SAndroid Build Coastguard Worker   }
4419*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile)4420*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile) {
4421*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 2; n++) {
4422*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 4; m++) {
4423*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4424*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
4425*4bdc9457SAndroid Build Coastguard Worker           .nr(2)
4426*4bdc9457SAndroid Build Coastguard Worker           .kr(4)
4427*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4428*4bdc9457SAndroid Build Coastguard Worker           .m(m)
4429*4bdc9457SAndroid Build Coastguard Worker           .n(n)
4430*4bdc9457SAndroid Build Coastguard Worker           .k(4)
4431*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
4432*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4433*4bdc9457SAndroid Build Coastguard Worker       }
4434*4bdc9457SAndroid Build Coastguard Worker     }
4435*4bdc9457SAndroid Build Coastguard Worker   }
4436*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile_m)4437*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_m) {
4438*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 4; m++) {
4439*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4440*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
4441*4bdc9457SAndroid Build Coastguard Worker         .nr(2)
4442*4bdc9457SAndroid Build Coastguard Worker         .kr(4)
4443*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4444*4bdc9457SAndroid Build Coastguard Worker         .m(m)
4445*4bdc9457SAndroid Build Coastguard Worker         .n(2)
4446*4bdc9457SAndroid Build Coastguard Worker         .k(4)
4447*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
4448*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4449*4bdc9457SAndroid Build Coastguard Worker     }
4450*4bdc9457SAndroid Build Coastguard Worker   }
4451*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile_n)4452*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_n) {
4453*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 2; n++) {
4454*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4455*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
4456*4bdc9457SAndroid Build Coastguard Worker         .nr(2)
4457*4bdc9457SAndroid Build Coastguard Worker         .kr(4)
4458*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4459*4bdc9457SAndroid Build Coastguard Worker         .m(4)
4460*4bdc9457SAndroid Build Coastguard Worker         .n(n)
4461*4bdc9457SAndroid Build Coastguard Worker         .k(4)
4462*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
4463*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4464*4bdc9457SAndroid Build Coastguard Worker     }
4465*4bdc9457SAndroid Build Coastguard Worker   }
4466*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_lt_4)4467*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_lt_4) {
4468*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
4469*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4470*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
4471*4bdc9457SAndroid Build Coastguard Worker         .nr(2)
4472*4bdc9457SAndroid Build Coastguard Worker         .kr(4)
4473*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4474*4bdc9457SAndroid Build Coastguard Worker         .m(4)
4475*4bdc9457SAndroid Build Coastguard Worker         .n(2)
4476*4bdc9457SAndroid Build Coastguard Worker         .k(k)
4477*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4478*4bdc9457SAndroid Build Coastguard Worker     }
4479*4bdc9457SAndroid Build Coastguard Worker   }
4480*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_lt_4_subtile)4481*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_lt_4_subtile) {
4482*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
4483*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 2; n++) {
4484*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
4485*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4486*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
4487*4bdc9457SAndroid Build Coastguard Worker             .nr(2)
4488*4bdc9457SAndroid Build Coastguard Worker             .kr(4)
4489*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4490*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4491*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4492*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4493*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4494*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4495*4bdc9457SAndroid Build Coastguard Worker         }
4496*4bdc9457SAndroid Build Coastguard Worker       }
4497*4bdc9457SAndroid Build Coastguard Worker     }
4498*4bdc9457SAndroid Build Coastguard Worker   }
4499*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_gt_4)4500*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_gt_4) {
4501*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
4502*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4503*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
4504*4bdc9457SAndroid Build Coastguard Worker         .nr(2)
4505*4bdc9457SAndroid Build Coastguard Worker         .kr(4)
4506*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4507*4bdc9457SAndroid Build Coastguard Worker         .m(4)
4508*4bdc9457SAndroid Build Coastguard Worker         .n(2)
4509*4bdc9457SAndroid Build Coastguard Worker         .k(k)
4510*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4511*4bdc9457SAndroid Build Coastguard Worker     }
4512*4bdc9457SAndroid Build Coastguard Worker   }
4513*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_gt_4_subtile)4514*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_gt_4_subtile) {
4515*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
4516*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 2; n++) {
4517*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
4518*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4519*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
4520*4bdc9457SAndroid Build Coastguard Worker             .nr(2)
4521*4bdc9457SAndroid Build Coastguard Worker             .kr(4)
4522*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4523*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4524*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4525*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4526*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4527*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4528*4bdc9457SAndroid Build Coastguard Worker         }
4529*4bdc9457SAndroid Build Coastguard Worker       }
4530*4bdc9457SAndroid Build Coastguard Worker     }
4531*4bdc9457SAndroid Build Coastguard Worker   }
4532*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_div_4)4533*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_div_4) {
4534*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
4535*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4536*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
4537*4bdc9457SAndroid Build Coastguard Worker         .nr(2)
4538*4bdc9457SAndroid Build Coastguard Worker         .kr(4)
4539*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4540*4bdc9457SAndroid Build Coastguard Worker         .m(4)
4541*4bdc9457SAndroid Build Coastguard Worker         .n(2)
4542*4bdc9457SAndroid Build Coastguard Worker         .k(k)
4543*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4544*4bdc9457SAndroid Build Coastguard Worker     }
4545*4bdc9457SAndroid Build Coastguard Worker   }
4546*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_div_4_subtile)4547*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_div_4_subtile) {
4548*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
4549*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 2; n++) {
4550*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
4551*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4552*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
4553*4bdc9457SAndroid Build Coastguard Worker             .nr(2)
4554*4bdc9457SAndroid Build Coastguard Worker             .kr(4)
4555*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4556*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4557*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4558*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4559*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4560*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4561*4bdc9457SAndroid Build Coastguard Worker         }
4562*4bdc9457SAndroid Build Coastguard Worker       }
4563*4bdc9457SAndroid Build Coastguard Worker     }
4564*4bdc9457SAndroid Build Coastguard Worker   }
4565*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,n_gt_2)4566*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, n_gt_2) {
4567*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 3; n < 4; n++) {
4568*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4569*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4570*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
4571*4bdc9457SAndroid Build Coastguard Worker           .nr(2)
4572*4bdc9457SAndroid Build Coastguard Worker           .kr(4)
4573*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4574*4bdc9457SAndroid Build Coastguard Worker           .m(4)
4575*4bdc9457SAndroid Build Coastguard Worker           .n(n)
4576*4bdc9457SAndroid Build Coastguard Worker           .k(k)
4577*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4578*4bdc9457SAndroid Build Coastguard Worker       }
4579*4bdc9457SAndroid Build Coastguard Worker     }
4580*4bdc9457SAndroid Build Coastguard Worker   }
4581*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,n_gt_2_strided_cn)4582*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, n_gt_2_strided_cn) {
4583*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 3; n < 4; n++) {
4584*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4585*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4586*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
4587*4bdc9457SAndroid Build Coastguard Worker           .nr(2)
4588*4bdc9457SAndroid Build Coastguard Worker           .kr(4)
4589*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4590*4bdc9457SAndroid Build Coastguard Worker           .m(4)
4591*4bdc9457SAndroid Build Coastguard Worker           .n(n)
4592*4bdc9457SAndroid Build Coastguard Worker           .k(k)
4593*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(5)
4594*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4595*4bdc9457SAndroid Build Coastguard Worker       }
4596*4bdc9457SAndroid Build Coastguard Worker     }
4597*4bdc9457SAndroid Build Coastguard Worker   }
4598*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,n_gt_2_subtile)4599*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, n_gt_2_subtile) {
4600*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 3; n < 4; n++) {
4601*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4602*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
4603*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4604*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
4605*4bdc9457SAndroid Build Coastguard Worker             .nr(2)
4606*4bdc9457SAndroid Build Coastguard Worker             .kr(4)
4607*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4608*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4609*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4610*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4611*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4612*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4613*4bdc9457SAndroid Build Coastguard Worker         }
4614*4bdc9457SAndroid Build Coastguard Worker       }
4615*4bdc9457SAndroid Build Coastguard Worker     }
4616*4bdc9457SAndroid Build Coastguard Worker   }
4617*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,n_div_2)4618*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, n_div_2) {
4619*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 4; n <= 6; n += 2) {
4620*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4621*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4622*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
4623*4bdc9457SAndroid Build Coastguard Worker           .nr(2)
4624*4bdc9457SAndroid Build Coastguard Worker           .kr(4)
4625*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4626*4bdc9457SAndroid Build Coastguard Worker           .m(4)
4627*4bdc9457SAndroid Build Coastguard Worker           .n(n)
4628*4bdc9457SAndroid Build Coastguard Worker           .k(k)
4629*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4630*4bdc9457SAndroid Build Coastguard Worker       }
4631*4bdc9457SAndroid Build Coastguard Worker     }
4632*4bdc9457SAndroid Build Coastguard Worker   }
4633*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,n_div_2_strided_cn)4634*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, n_div_2_strided_cn) {
4635*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 4; n <= 6; n += 2) {
4636*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4637*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4638*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
4639*4bdc9457SAndroid Build Coastguard Worker           .nr(2)
4640*4bdc9457SAndroid Build Coastguard Worker           .kr(4)
4641*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4642*4bdc9457SAndroid Build Coastguard Worker           .m(4)
4643*4bdc9457SAndroid Build Coastguard Worker           .n(n)
4644*4bdc9457SAndroid Build Coastguard Worker           .k(k)
4645*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(5)
4646*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4647*4bdc9457SAndroid Build Coastguard Worker       }
4648*4bdc9457SAndroid Build Coastguard Worker     }
4649*4bdc9457SAndroid Build Coastguard Worker   }
4650*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,n_div_2_subtile)4651*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, n_div_2_subtile) {
4652*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 4; n <= 6; n += 2) {
4653*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4654*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
4655*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4656*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
4657*4bdc9457SAndroid Build Coastguard Worker             .nr(2)
4658*4bdc9457SAndroid Build Coastguard Worker             .kr(4)
4659*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4660*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4661*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4662*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4663*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4664*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4665*4bdc9457SAndroid Build Coastguard Worker         }
4666*4bdc9457SAndroid Build Coastguard Worker       }
4667*4bdc9457SAndroid Build Coastguard Worker     }
4668*4bdc9457SAndroid Build Coastguard Worker   }
4669*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,small_kernel)4670*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, small_kernel) {
4671*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
4672*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4673*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
4674*4bdc9457SAndroid Build Coastguard Worker         .nr(2)
4675*4bdc9457SAndroid Build Coastguard Worker         .kr(4)
4676*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4677*4bdc9457SAndroid Build Coastguard Worker         .m(4)
4678*4bdc9457SAndroid Build Coastguard Worker         .n(2)
4679*4bdc9457SAndroid Build Coastguard Worker         .k(k)
4680*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
4681*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4682*4bdc9457SAndroid Build Coastguard Worker     }
4683*4bdc9457SAndroid Build Coastguard Worker   }
4684*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,small_kernel_subtile)4685*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, small_kernel_subtile) {
4686*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
4687*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 2; n++) {
4688*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
4689*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4690*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
4691*4bdc9457SAndroid Build Coastguard Worker             .nr(2)
4692*4bdc9457SAndroid Build Coastguard Worker             .kr(4)
4693*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4694*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4695*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4696*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4697*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
4698*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4699*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4700*4bdc9457SAndroid Build Coastguard Worker         }
4701*4bdc9457SAndroid Build Coastguard Worker       }
4702*4bdc9457SAndroid Build Coastguard Worker     }
4703*4bdc9457SAndroid Build Coastguard Worker   }
4704*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,n_gt_2_small_kernel)4705*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, n_gt_2_small_kernel) {
4706*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 3; n < 4; n++) {
4707*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4708*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4709*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
4710*4bdc9457SAndroid Build Coastguard Worker           .nr(2)
4711*4bdc9457SAndroid Build Coastguard Worker           .kr(4)
4712*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4713*4bdc9457SAndroid Build Coastguard Worker           .m(4)
4714*4bdc9457SAndroid Build Coastguard Worker           .n(n)
4715*4bdc9457SAndroid Build Coastguard Worker           .k(k)
4716*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
4717*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4718*4bdc9457SAndroid Build Coastguard Worker       }
4719*4bdc9457SAndroid Build Coastguard Worker     }
4720*4bdc9457SAndroid Build Coastguard Worker   }
4721*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,n_div_2_small_kernel)4722*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, n_div_2_small_kernel) {
4723*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 4; n <= 6; n += 2) {
4724*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4725*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4726*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
4727*4bdc9457SAndroid Build Coastguard Worker           .nr(2)
4728*4bdc9457SAndroid Build Coastguard Worker           .kr(4)
4729*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4730*4bdc9457SAndroid Build Coastguard Worker           .m(4)
4731*4bdc9457SAndroid Build Coastguard Worker           .n(n)
4732*4bdc9457SAndroid Build Coastguard Worker           .k(k)
4733*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
4734*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4735*4bdc9457SAndroid Build Coastguard Worker       }
4736*4bdc9457SAndroid Build Coastguard Worker     }
4737*4bdc9457SAndroid Build Coastguard Worker   }
4738*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,strided_cm_subtile)4739*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, strided_cm_subtile) {
4740*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
4741*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 2; n++) {
4742*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
4743*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4744*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
4745*4bdc9457SAndroid Build Coastguard Worker             .nr(2)
4746*4bdc9457SAndroid Build Coastguard Worker             .kr(4)
4747*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4748*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4749*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4750*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4751*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(5)
4752*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4753*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4754*4bdc9457SAndroid Build Coastguard Worker         }
4755*4bdc9457SAndroid Build Coastguard Worker       }
4756*4bdc9457SAndroid Build Coastguard Worker     }
4757*4bdc9457SAndroid Build Coastguard Worker   }
4758*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,a_offset)4759*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, a_offset) {
4760*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
4761*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4762*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
4763*4bdc9457SAndroid Build Coastguard Worker         .nr(2)
4764*4bdc9457SAndroid Build Coastguard Worker         .kr(4)
4765*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4766*4bdc9457SAndroid Build Coastguard Worker         .m(4)
4767*4bdc9457SAndroid Build Coastguard Worker         .n(2)
4768*4bdc9457SAndroid Build Coastguard Worker         .k(k)
4769*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
4770*4bdc9457SAndroid Build Coastguard Worker         .a_offset(83)
4771*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4772*4bdc9457SAndroid Build Coastguard Worker     }
4773*4bdc9457SAndroid Build Coastguard Worker   }
4774*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,zero)4775*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, zero) {
4776*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
4777*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 4; mz++) {
4778*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4779*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
4780*4bdc9457SAndroid Build Coastguard Worker           .nr(2)
4781*4bdc9457SAndroid Build Coastguard Worker           .kr(4)
4782*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4783*4bdc9457SAndroid Build Coastguard Worker           .m(4)
4784*4bdc9457SAndroid Build Coastguard Worker           .n(2)
4785*4bdc9457SAndroid Build Coastguard Worker           .k(k)
4786*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
4787*4bdc9457SAndroid Build Coastguard Worker           .a_offset(83)
4788*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
4789*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4790*4bdc9457SAndroid Build Coastguard Worker       }
4791*4bdc9457SAndroid Build Coastguard Worker     }
4792*4bdc9457SAndroid Build Coastguard Worker   }
4793*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,strided_cm)4794*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, strided_cm) {
4795*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
4796*4bdc9457SAndroid Build Coastguard Worker       .mr(4)
4797*4bdc9457SAndroid Build Coastguard Worker       .nr(2)
4798*4bdc9457SAndroid Build Coastguard Worker       .kr(4)
4799*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
4800*4bdc9457SAndroid Build Coastguard Worker       .m(4)
4801*4bdc9457SAndroid Build Coastguard Worker       .n(2)
4802*4bdc9457SAndroid Build Coastguard Worker       .k(4)
4803*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(5)
4804*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4805*4bdc9457SAndroid Build Coastguard Worker   }
4806*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMRELAXEDSIMD
4807*4bdc9457SAndroid Build Coastguard Worker 
4808*4bdc9457SAndroid Build Coastguard Worker 
4809*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4)4810*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4) {
4811*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
4812*4bdc9457SAndroid Build Coastguard Worker       .mr(4)
4813*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
4814*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
4815*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
4816*4bdc9457SAndroid Build Coastguard Worker       .m(4)
4817*4bdc9457SAndroid Build Coastguard Worker       .n(8)
4818*4bdc9457SAndroid Build Coastguard Worker       .k(4)
4819*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
4820*4bdc9457SAndroid Build Coastguard Worker   }
4821*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,strided_cn)4822*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cn) {
4823*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
4824*4bdc9457SAndroid Build Coastguard Worker       .mr(4)
4825*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
4826*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
4827*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
4828*4bdc9457SAndroid Build Coastguard Worker       .m(4)
4829*4bdc9457SAndroid Build Coastguard Worker       .n(8)
4830*4bdc9457SAndroid Build Coastguard Worker       .k(4)
4831*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(11)
4832*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
4833*4bdc9457SAndroid Build Coastguard Worker   }
4834*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4_subtile)4835*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile) {
4836*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
4837*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 4; m++) {
4838*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4839*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
4840*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
4841*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
4842*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4843*4bdc9457SAndroid Build Coastguard Worker           .m(m)
4844*4bdc9457SAndroid Build Coastguard Worker           .n(n)
4845*4bdc9457SAndroid Build Coastguard Worker           .k(4)
4846*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
4847*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
4848*4bdc9457SAndroid Build Coastguard Worker       }
4849*4bdc9457SAndroid Build Coastguard Worker     }
4850*4bdc9457SAndroid Build Coastguard Worker   }
4851*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4_subtile_m)4852*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_m) {
4853*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 4; m++) {
4854*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4855*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
4856*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
4857*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
4858*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4859*4bdc9457SAndroid Build Coastguard Worker         .m(m)
4860*4bdc9457SAndroid Build Coastguard Worker         .n(8)
4861*4bdc9457SAndroid Build Coastguard Worker         .k(4)
4862*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
4863*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
4864*4bdc9457SAndroid Build Coastguard Worker     }
4865*4bdc9457SAndroid Build Coastguard Worker   }
4866*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4_subtile_n)4867*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_n) {
4868*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
4869*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4870*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
4871*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
4872*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
4873*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4874*4bdc9457SAndroid Build Coastguard Worker         .m(4)
4875*4bdc9457SAndroid Build Coastguard Worker         .n(n)
4876*4bdc9457SAndroid Build Coastguard Worker         .k(4)
4877*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
4878*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
4879*4bdc9457SAndroid Build Coastguard Worker     }
4880*4bdc9457SAndroid Build Coastguard Worker   }
4881*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,k_lt_4)4882*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4) {
4883*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
4884*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4885*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
4886*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
4887*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
4888*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4889*4bdc9457SAndroid Build Coastguard Worker         .m(4)
4890*4bdc9457SAndroid Build Coastguard Worker         .n(8)
4891*4bdc9457SAndroid Build Coastguard Worker         .k(k)
4892*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
4893*4bdc9457SAndroid Build Coastguard Worker     }
4894*4bdc9457SAndroid Build Coastguard Worker   }
4895*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,k_lt_4_subtile)4896*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4_subtile) {
4897*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
4898*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
4899*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
4900*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4901*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
4902*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
4903*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
4904*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4905*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4906*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4907*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4908*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4909*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
4910*4bdc9457SAndroid Build Coastguard Worker         }
4911*4bdc9457SAndroid Build Coastguard Worker       }
4912*4bdc9457SAndroid Build Coastguard Worker     }
4913*4bdc9457SAndroid Build Coastguard Worker   }
4914*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,k_gt_4)4915*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4) {
4916*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
4917*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4918*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
4919*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
4920*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
4921*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4922*4bdc9457SAndroid Build Coastguard Worker         .m(4)
4923*4bdc9457SAndroid Build Coastguard Worker         .n(8)
4924*4bdc9457SAndroid Build Coastguard Worker         .k(k)
4925*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
4926*4bdc9457SAndroid Build Coastguard Worker     }
4927*4bdc9457SAndroid Build Coastguard Worker   }
4928*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,k_gt_4_subtile)4929*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4_subtile) {
4930*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
4931*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
4932*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
4933*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4934*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
4935*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
4936*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
4937*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4938*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4939*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4940*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4941*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4942*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
4943*4bdc9457SAndroid Build Coastguard Worker         }
4944*4bdc9457SAndroid Build Coastguard Worker       }
4945*4bdc9457SAndroid Build Coastguard Worker     }
4946*4bdc9457SAndroid Build Coastguard Worker   }
4947*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,k_div_4)4948*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4) {
4949*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
4950*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
4951*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
4952*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
4953*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
4954*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
4955*4bdc9457SAndroid Build Coastguard Worker         .m(4)
4956*4bdc9457SAndroid Build Coastguard Worker         .n(8)
4957*4bdc9457SAndroid Build Coastguard Worker         .k(k)
4958*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
4959*4bdc9457SAndroid Build Coastguard Worker     }
4960*4bdc9457SAndroid Build Coastguard Worker   }
4961*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,k_div_4_subtile)4962*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4_subtile) {
4963*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
4964*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
4965*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
4966*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
4967*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
4968*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
4969*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
4970*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
4971*4bdc9457SAndroid Build Coastguard Worker             .m(m)
4972*4bdc9457SAndroid Build Coastguard Worker             .n(n)
4973*4bdc9457SAndroid Build Coastguard Worker             .k(k)
4974*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
4975*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
4976*4bdc9457SAndroid Build Coastguard Worker         }
4977*4bdc9457SAndroid Build Coastguard Worker       }
4978*4bdc9457SAndroid Build Coastguard Worker     }
4979*4bdc9457SAndroid Build Coastguard Worker   }
4980*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8)4981*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8) {
4982*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
4983*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
4984*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
4985*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
4986*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
4987*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
4988*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
4989*4bdc9457SAndroid Build Coastguard Worker           .m(4)
4990*4bdc9457SAndroid Build Coastguard Worker           .n(n)
4991*4bdc9457SAndroid Build Coastguard Worker           .k(k)
4992*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
4993*4bdc9457SAndroid Build Coastguard Worker       }
4994*4bdc9457SAndroid Build Coastguard Worker     }
4995*4bdc9457SAndroid Build Coastguard Worker   }
4996*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8_strided_cn)4997*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_strided_cn) {
4998*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
4999*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5000*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5001*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
5002*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5003*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5004*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
5005*4bdc9457SAndroid Build Coastguard Worker           .m(4)
5006*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5007*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5008*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
5009*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
5010*4bdc9457SAndroid Build Coastguard Worker       }
5011*4bdc9457SAndroid Build Coastguard Worker     }
5012*4bdc9457SAndroid Build Coastguard Worker   }
5013*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8_subtile)5014*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_subtile) {
5015*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
5016*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5017*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
5018*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5019*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
5020*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5021*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5022*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
5023*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5024*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5025*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5026*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5027*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
5028*4bdc9457SAndroid Build Coastguard Worker         }
5029*4bdc9457SAndroid Build Coastguard Worker       }
5030*4bdc9457SAndroid Build Coastguard Worker     }
5031*4bdc9457SAndroid Build Coastguard Worker   }
5032*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8)5033*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8) {
5034*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
5035*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5036*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5037*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
5038*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5039*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5040*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
5041*4bdc9457SAndroid Build Coastguard Worker           .m(4)
5042*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5043*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5044*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
5045*4bdc9457SAndroid Build Coastguard Worker       }
5046*4bdc9457SAndroid Build Coastguard Worker     }
5047*4bdc9457SAndroid Build Coastguard Worker   }
5048*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8_strided_cn)5049*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_strided_cn) {
5050*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
5051*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5052*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5053*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
5054*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5055*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5056*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
5057*4bdc9457SAndroid Build Coastguard Worker           .m(4)
5058*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5059*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5060*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
5061*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
5062*4bdc9457SAndroid Build Coastguard Worker       }
5063*4bdc9457SAndroid Build Coastguard Worker     }
5064*4bdc9457SAndroid Build Coastguard Worker   }
5065*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8_subtile)5066*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_subtile) {
5067*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
5068*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5069*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
5070*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5071*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
5072*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5073*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5074*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
5075*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5076*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5077*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5078*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5079*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
5080*4bdc9457SAndroid Build Coastguard Worker         }
5081*4bdc9457SAndroid Build Coastguard Worker       }
5082*4bdc9457SAndroid Build Coastguard Worker     }
5083*4bdc9457SAndroid Build Coastguard Worker   }
5084*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,small_kernel)5085*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, small_kernel) {
5086*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
5087*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
5088*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
5089*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
5090*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
5091*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
5092*4bdc9457SAndroid Build Coastguard Worker         .m(4)
5093*4bdc9457SAndroid Build Coastguard Worker         .n(8)
5094*4bdc9457SAndroid Build Coastguard Worker         .k(k)
5095*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
5096*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
5097*4bdc9457SAndroid Build Coastguard Worker     }
5098*4bdc9457SAndroid Build Coastguard Worker   }
5099*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,small_kernel_subtile)5100*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, small_kernel_subtile) {
5101*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
5102*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
5103*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
5104*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5105*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
5106*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5107*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5108*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
5109*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5110*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5111*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5112*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
5113*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5114*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
5115*4bdc9457SAndroid Build Coastguard Worker         }
5116*4bdc9457SAndroid Build Coastguard Worker       }
5117*4bdc9457SAndroid Build Coastguard Worker     }
5118*4bdc9457SAndroid Build Coastguard Worker   }
5119*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8_small_kernel)5120*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_small_kernel) {
5121*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
5122*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5123*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5124*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
5125*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5126*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5127*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
5128*4bdc9457SAndroid Build Coastguard Worker           .m(4)
5129*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5130*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5131*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
5132*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
5133*4bdc9457SAndroid Build Coastguard Worker       }
5134*4bdc9457SAndroid Build Coastguard Worker     }
5135*4bdc9457SAndroid Build Coastguard Worker   }
5136*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8_small_kernel)5137*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_small_kernel) {
5138*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
5139*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5140*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5141*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
5142*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5143*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5144*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
5145*4bdc9457SAndroid Build Coastguard Worker           .m(4)
5146*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5147*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5148*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
5149*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
5150*4bdc9457SAndroid Build Coastguard Worker       }
5151*4bdc9457SAndroid Build Coastguard Worker     }
5152*4bdc9457SAndroid Build Coastguard Worker   }
5153*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,strided_cm_subtile)5154*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm_subtile) {
5155*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
5156*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
5157*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 4; m++) {
5158*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5159*4bdc9457SAndroid Build Coastguard Worker             .mr(4)
5160*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5161*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5162*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
5163*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5164*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5165*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5166*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(11)
5167*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5168*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
5169*4bdc9457SAndroid Build Coastguard Worker         }
5170*4bdc9457SAndroid Build Coastguard Worker       }
5171*4bdc9457SAndroid Build Coastguard Worker     }
5172*4bdc9457SAndroid Build Coastguard Worker   }
5173*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,a_offset)5174*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, a_offset) {
5175*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
5176*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
5177*4bdc9457SAndroid Build Coastguard Worker         .mr(4)
5178*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
5179*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
5180*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
5181*4bdc9457SAndroid Build Coastguard Worker         .m(4)
5182*4bdc9457SAndroid Build Coastguard Worker         .n(8)
5183*4bdc9457SAndroid Build Coastguard Worker         .k(k)
5184*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
5185*4bdc9457SAndroid Build Coastguard Worker         .a_offset(83)
5186*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
5187*4bdc9457SAndroid Build Coastguard Worker     }
5188*4bdc9457SAndroid Build Coastguard Worker   }
5189*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,zero)5190*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, zero) {
5191*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
5192*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 4; mz++) {
5193*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5194*4bdc9457SAndroid Build Coastguard Worker           .mr(4)
5195*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5196*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5197*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
5198*4bdc9457SAndroid Build Coastguard Worker           .m(4)
5199*4bdc9457SAndroid Build Coastguard Worker           .n(8)
5200*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5201*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
5202*4bdc9457SAndroid Build Coastguard Worker           .a_offset(83)
5203*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
5204*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
5205*4bdc9457SAndroid Build Coastguard Worker       }
5206*4bdc9457SAndroid Build Coastguard Worker     }
5207*4bdc9457SAndroid Build Coastguard Worker   }
5208*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT,strided_cm)5209*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm) {
5210*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
5211*4bdc9457SAndroid Build Coastguard Worker       .mr(4)
5212*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
5213*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
5214*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
5215*4bdc9457SAndroid Build Coastguard Worker       .m(4)
5216*4bdc9457SAndroid Build Coastguard Worker       .n(8)
5217*4bdc9457SAndroid Build Coastguard Worker       .k(4)
5218*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(11)
5219*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
5220*4bdc9457SAndroid Build Coastguard Worker   }
5221*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMRELAXEDSIMD
5222*4bdc9457SAndroid Build Coastguard Worker 
5223*4bdc9457SAndroid Build Coastguard Worker 
5224*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4)5225*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4) {
5226*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
5227*4bdc9457SAndroid Build Coastguard Worker       .mr(5)
5228*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
5229*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
5230*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
5231*4bdc9457SAndroid Build Coastguard Worker       .m(5)
5232*4bdc9457SAndroid Build Coastguard Worker       .n(8)
5233*4bdc9457SAndroid Build Coastguard Worker       .k(4)
5234*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5235*4bdc9457SAndroid Build Coastguard Worker   }
5236*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,strided_cn)5237*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cn) {
5238*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
5239*4bdc9457SAndroid Build Coastguard Worker       .mr(5)
5240*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
5241*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
5242*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
5243*4bdc9457SAndroid Build Coastguard Worker       .m(5)
5244*4bdc9457SAndroid Build Coastguard Worker       .n(8)
5245*4bdc9457SAndroid Build Coastguard Worker       .k(4)
5246*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(11)
5247*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5248*4bdc9457SAndroid Build Coastguard Worker   }
5249*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4_subtile)5250*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile) {
5251*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
5252*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 5; m++) {
5253*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5254*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
5255*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5256*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5257*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
5258*4bdc9457SAndroid Build Coastguard Worker           .m(m)
5259*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5260*4bdc9457SAndroid Build Coastguard Worker           .k(4)
5261*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
5262*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5263*4bdc9457SAndroid Build Coastguard Worker       }
5264*4bdc9457SAndroid Build Coastguard Worker     }
5265*4bdc9457SAndroid Build Coastguard Worker   }
5266*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4_subtile_m)5267*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_m) {
5268*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 5; m++) {
5269*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
5270*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
5271*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
5272*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
5273*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
5274*4bdc9457SAndroid Build Coastguard Worker         .m(m)
5275*4bdc9457SAndroid Build Coastguard Worker         .n(8)
5276*4bdc9457SAndroid Build Coastguard Worker         .k(4)
5277*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
5278*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5279*4bdc9457SAndroid Build Coastguard Worker     }
5280*4bdc9457SAndroid Build Coastguard Worker   }
5281*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4_subtile_n)5282*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_n) {
5283*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
5284*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
5285*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
5286*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
5287*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
5288*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
5289*4bdc9457SAndroid Build Coastguard Worker         .m(5)
5290*4bdc9457SAndroid Build Coastguard Worker         .n(n)
5291*4bdc9457SAndroid Build Coastguard Worker         .k(4)
5292*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
5293*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5294*4bdc9457SAndroid Build Coastguard Worker     }
5295*4bdc9457SAndroid Build Coastguard Worker   }
5296*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,k_lt_4)5297*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4) {
5298*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
5299*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
5300*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
5301*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
5302*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
5303*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
5304*4bdc9457SAndroid Build Coastguard Worker         .m(5)
5305*4bdc9457SAndroid Build Coastguard Worker         .n(8)
5306*4bdc9457SAndroid Build Coastguard Worker         .k(k)
5307*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5308*4bdc9457SAndroid Build Coastguard Worker     }
5309*4bdc9457SAndroid Build Coastguard Worker   }
5310*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,k_lt_4_subtile)5311*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4_subtile) {
5312*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
5313*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
5314*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
5315*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5316*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
5317*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5318*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5319*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
5320*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5321*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5322*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5323*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5324*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5325*4bdc9457SAndroid Build Coastguard Worker         }
5326*4bdc9457SAndroid Build Coastguard Worker       }
5327*4bdc9457SAndroid Build Coastguard Worker     }
5328*4bdc9457SAndroid Build Coastguard Worker   }
5329*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,k_gt_4)5330*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4) {
5331*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
5332*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
5333*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
5334*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
5335*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
5336*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
5337*4bdc9457SAndroid Build Coastguard Worker         .m(5)
5338*4bdc9457SAndroid Build Coastguard Worker         .n(8)
5339*4bdc9457SAndroid Build Coastguard Worker         .k(k)
5340*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5341*4bdc9457SAndroid Build Coastguard Worker     }
5342*4bdc9457SAndroid Build Coastguard Worker   }
5343*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,k_gt_4_subtile)5344*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4_subtile) {
5345*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
5346*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
5347*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
5348*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5349*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
5350*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5351*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5352*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
5353*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5354*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5355*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5356*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5357*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5358*4bdc9457SAndroid Build Coastguard Worker         }
5359*4bdc9457SAndroid Build Coastguard Worker       }
5360*4bdc9457SAndroid Build Coastguard Worker     }
5361*4bdc9457SAndroid Build Coastguard Worker   }
5362*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,k_div_4)5363*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4) {
5364*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
5365*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
5366*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
5367*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
5368*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
5369*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
5370*4bdc9457SAndroid Build Coastguard Worker         .m(5)
5371*4bdc9457SAndroid Build Coastguard Worker         .n(8)
5372*4bdc9457SAndroid Build Coastguard Worker         .k(k)
5373*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5374*4bdc9457SAndroid Build Coastguard Worker     }
5375*4bdc9457SAndroid Build Coastguard Worker   }
5376*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,k_div_4_subtile)5377*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4_subtile) {
5378*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
5379*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
5380*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
5381*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5382*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
5383*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5384*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5385*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
5386*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5387*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5388*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5389*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5390*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5391*4bdc9457SAndroid Build Coastguard Worker         }
5392*4bdc9457SAndroid Build Coastguard Worker       }
5393*4bdc9457SAndroid Build Coastguard Worker     }
5394*4bdc9457SAndroid Build Coastguard Worker   }
5395*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8)5396*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8) {
5397*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
5398*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5399*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5400*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
5401*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5402*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5403*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
5404*4bdc9457SAndroid Build Coastguard Worker           .m(5)
5405*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5406*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5407*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5408*4bdc9457SAndroid Build Coastguard Worker       }
5409*4bdc9457SAndroid Build Coastguard Worker     }
5410*4bdc9457SAndroid Build Coastguard Worker   }
5411*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8_strided_cn)5412*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_strided_cn) {
5413*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
5414*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5415*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5416*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
5417*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5418*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5419*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
5420*4bdc9457SAndroid Build Coastguard Worker           .m(5)
5421*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5422*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5423*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
5424*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5425*4bdc9457SAndroid Build Coastguard Worker       }
5426*4bdc9457SAndroid Build Coastguard Worker     }
5427*4bdc9457SAndroid Build Coastguard Worker   }
5428*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8_subtile)5429*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_subtile) {
5430*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
5431*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5432*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
5433*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5434*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
5435*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5436*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5437*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
5438*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5439*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5440*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5441*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5442*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5443*4bdc9457SAndroid Build Coastguard Worker         }
5444*4bdc9457SAndroid Build Coastguard Worker       }
5445*4bdc9457SAndroid Build Coastguard Worker     }
5446*4bdc9457SAndroid Build Coastguard Worker   }
5447*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8)5448*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8) {
5449*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
5450*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5451*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5452*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
5453*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5454*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5455*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
5456*4bdc9457SAndroid Build Coastguard Worker           .m(5)
5457*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5458*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5459*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5460*4bdc9457SAndroid Build Coastguard Worker       }
5461*4bdc9457SAndroid Build Coastguard Worker     }
5462*4bdc9457SAndroid Build Coastguard Worker   }
5463*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8_strided_cn)5464*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_strided_cn) {
5465*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
5466*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5467*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5468*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
5469*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5470*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5471*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
5472*4bdc9457SAndroid Build Coastguard Worker           .m(5)
5473*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5474*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5475*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
5476*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5477*4bdc9457SAndroid Build Coastguard Worker       }
5478*4bdc9457SAndroid Build Coastguard Worker     }
5479*4bdc9457SAndroid Build Coastguard Worker   }
5480*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8_subtile)5481*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_subtile) {
5482*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
5483*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5484*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
5485*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5486*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
5487*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5488*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5489*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
5490*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5491*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5492*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5493*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5494*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5495*4bdc9457SAndroid Build Coastguard Worker         }
5496*4bdc9457SAndroid Build Coastguard Worker       }
5497*4bdc9457SAndroid Build Coastguard Worker     }
5498*4bdc9457SAndroid Build Coastguard Worker   }
5499*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,small_kernel)5500*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, small_kernel) {
5501*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
5502*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
5503*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
5504*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
5505*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
5506*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
5507*4bdc9457SAndroid Build Coastguard Worker         .m(5)
5508*4bdc9457SAndroid Build Coastguard Worker         .n(8)
5509*4bdc9457SAndroid Build Coastguard Worker         .k(k)
5510*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
5511*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5512*4bdc9457SAndroid Build Coastguard Worker     }
5513*4bdc9457SAndroid Build Coastguard Worker   }
5514*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,small_kernel_subtile)5515*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, small_kernel_subtile) {
5516*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
5517*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
5518*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
5519*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5520*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
5521*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5522*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5523*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
5524*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5525*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5526*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5527*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
5528*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5529*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5530*4bdc9457SAndroid Build Coastguard Worker         }
5531*4bdc9457SAndroid Build Coastguard Worker       }
5532*4bdc9457SAndroid Build Coastguard Worker     }
5533*4bdc9457SAndroid Build Coastguard Worker   }
5534*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8_small_kernel)5535*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_small_kernel) {
5536*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
5537*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5538*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5539*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
5540*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5541*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5542*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
5543*4bdc9457SAndroid Build Coastguard Worker           .m(5)
5544*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5545*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5546*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
5547*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5548*4bdc9457SAndroid Build Coastguard Worker       }
5549*4bdc9457SAndroid Build Coastguard Worker     }
5550*4bdc9457SAndroid Build Coastguard Worker   }
5551*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8_small_kernel)5552*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_small_kernel) {
5553*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
5554*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5555*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5556*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
5557*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5558*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5559*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
5560*4bdc9457SAndroid Build Coastguard Worker           .m(5)
5561*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5562*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5563*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
5564*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5565*4bdc9457SAndroid Build Coastguard Worker       }
5566*4bdc9457SAndroid Build Coastguard Worker     }
5567*4bdc9457SAndroid Build Coastguard Worker   }
5568*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,strided_cm_subtile)5569*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm_subtile) {
5570*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
5571*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
5572*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
5573*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5574*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
5575*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5576*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5577*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
5578*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5579*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5580*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5581*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(11)
5582*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5583*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5584*4bdc9457SAndroid Build Coastguard Worker         }
5585*4bdc9457SAndroid Build Coastguard Worker       }
5586*4bdc9457SAndroid Build Coastguard Worker     }
5587*4bdc9457SAndroid Build Coastguard Worker   }
5588*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,a_offset)5589*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, a_offset) {
5590*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
5591*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
5592*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
5593*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
5594*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
5595*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
5596*4bdc9457SAndroid Build Coastguard Worker         .m(5)
5597*4bdc9457SAndroid Build Coastguard Worker         .n(8)
5598*4bdc9457SAndroid Build Coastguard Worker         .k(k)
5599*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
5600*4bdc9457SAndroid Build Coastguard Worker         .a_offset(103)
5601*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5602*4bdc9457SAndroid Build Coastguard Worker     }
5603*4bdc9457SAndroid Build Coastguard Worker   }
5604*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,zero)5605*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, zero) {
5606*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
5607*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 5; mz++) {
5608*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5609*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
5610*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5611*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5612*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
5613*4bdc9457SAndroid Build Coastguard Worker           .m(5)
5614*4bdc9457SAndroid Build Coastguard Worker           .n(8)
5615*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5616*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
5617*4bdc9457SAndroid Build Coastguard Worker           .a_offset(103)
5618*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
5619*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5620*4bdc9457SAndroid Build Coastguard Worker       }
5621*4bdc9457SAndroid Build Coastguard Worker     }
5622*4bdc9457SAndroid Build Coastguard Worker   }
5623*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT,strided_cm)5624*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm) {
5625*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
5626*4bdc9457SAndroid Build Coastguard Worker       .mr(5)
5627*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
5628*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
5629*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
5630*4bdc9457SAndroid Build Coastguard Worker       .m(5)
5631*4bdc9457SAndroid Build Coastguard Worker       .n(8)
5632*4bdc9457SAndroid Build Coastguard Worker       .k(4)
5633*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(11)
5634*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
5635*4bdc9457SAndroid Build Coastguard Worker   }
5636*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMRELAXEDSIMD
5637*4bdc9457SAndroid Build Coastguard Worker 
5638*4bdc9457SAndroid Build Coastguard Worker 
5639*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_eq_4)5640*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_eq_4) {
5641*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
5642*4bdc9457SAndroid Build Coastguard Worker       .mr(5)
5643*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
5644*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
5645*4bdc9457SAndroid Build Coastguard Worker       .sr(4)
5646*4bdc9457SAndroid Build Coastguard Worker       .m(5)
5647*4bdc9457SAndroid Build Coastguard Worker       .n(8)
5648*4bdc9457SAndroid Build Coastguard Worker       .k(4)
5649*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5650*4bdc9457SAndroid Build Coastguard Worker   }
5651*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,strided_cn)5652*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, strided_cn) {
5653*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
5654*4bdc9457SAndroid Build Coastguard Worker       .mr(5)
5655*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
5656*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
5657*4bdc9457SAndroid Build Coastguard Worker       .sr(4)
5658*4bdc9457SAndroid Build Coastguard Worker       .m(5)
5659*4bdc9457SAndroid Build Coastguard Worker       .n(8)
5660*4bdc9457SAndroid Build Coastguard Worker       .k(4)
5661*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(11)
5662*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5663*4bdc9457SAndroid Build Coastguard Worker   }
5664*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile)5665*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile) {
5666*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
5667*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 5; m++) {
5668*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5669*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
5670*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5671*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5672*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
5673*4bdc9457SAndroid Build Coastguard Worker           .m(m)
5674*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5675*4bdc9457SAndroid Build Coastguard Worker           .k(4)
5676*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
5677*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5678*4bdc9457SAndroid Build Coastguard Worker       }
5679*4bdc9457SAndroid Build Coastguard Worker     }
5680*4bdc9457SAndroid Build Coastguard Worker   }
5681*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile_m)5682*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_m) {
5683*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 5; m++) {
5684*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
5685*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
5686*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
5687*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
5688*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
5689*4bdc9457SAndroid Build Coastguard Worker         .m(m)
5690*4bdc9457SAndroid Build Coastguard Worker         .n(8)
5691*4bdc9457SAndroid Build Coastguard Worker         .k(4)
5692*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
5693*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5694*4bdc9457SAndroid Build Coastguard Worker     }
5695*4bdc9457SAndroid Build Coastguard Worker   }
5696*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile_n)5697*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_n) {
5698*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
5699*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
5700*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
5701*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
5702*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
5703*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
5704*4bdc9457SAndroid Build Coastguard Worker         .m(5)
5705*4bdc9457SAndroid Build Coastguard Worker         .n(n)
5706*4bdc9457SAndroid Build Coastguard Worker         .k(4)
5707*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
5708*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5709*4bdc9457SAndroid Build Coastguard Worker     }
5710*4bdc9457SAndroid Build Coastguard Worker   }
5711*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_lt_4)5712*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_lt_4) {
5713*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
5714*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
5715*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
5716*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
5717*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
5718*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
5719*4bdc9457SAndroid Build Coastguard Worker         .m(5)
5720*4bdc9457SAndroid Build Coastguard Worker         .n(8)
5721*4bdc9457SAndroid Build Coastguard Worker         .k(k)
5722*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5723*4bdc9457SAndroid Build Coastguard Worker     }
5724*4bdc9457SAndroid Build Coastguard Worker   }
5725*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_lt_4_subtile)5726*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_subtile) {
5727*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
5728*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
5729*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
5730*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5731*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
5732*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5733*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5734*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
5735*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5736*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5737*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5738*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5739*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5740*4bdc9457SAndroid Build Coastguard Worker         }
5741*4bdc9457SAndroid Build Coastguard Worker       }
5742*4bdc9457SAndroid Build Coastguard Worker     }
5743*4bdc9457SAndroid Build Coastguard Worker   }
5744*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_gt_4)5745*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_gt_4) {
5746*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
5747*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
5748*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
5749*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
5750*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
5751*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
5752*4bdc9457SAndroid Build Coastguard Worker         .m(5)
5753*4bdc9457SAndroid Build Coastguard Worker         .n(8)
5754*4bdc9457SAndroid Build Coastguard Worker         .k(k)
5755*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5756*4bdc9457SAndroid Build Coastguard Worker     }
5757*4bdc9457SAndroid Build Coastguard Worker   }
5758*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_gt_4_subtile)5759*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_subtile) {
5760*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
5761*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
5762*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
5763*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5764*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
5765*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5766*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5767*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
5768*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5769*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5770*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5771*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5772*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5773*4bdc9457SAndroid Build Coastguard Worker         }
5774*4bdc9457SAndroid Build Coastguard Worker       }
5775*4bdc9457SAndroid Build Coastguard Worker     }
5776*4bdc9457SAndroid Build Coastguard Worker   }
5777*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_div_4)5778*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_div_4) {
5779*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
5780*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
5781*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
5782*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
5783*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
5784*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
5785*4bdc9457SAndroid Build Coastguard Worker         .m(5)
5786*4bdc9457SAndroid Build Coastguard Worker         .n(8)
5787*4bdc9457SAndroid Build Coastguard Worker         .k(k)
5788*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5789*4bdc9457SAndroid Build Coastguard Worker     }
5790*4bdc9457SAndroid Build Coastguard Worker   }
5791*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_div_4_subtile)5792*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_div_4_subtile) {
5793*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
5794*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
5795*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
5796*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5797*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
5798*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5799*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5800*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
5801*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5802*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5803*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5804*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5805*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5806*4bdc9457SAndroid Build Coastguard Worker         }
5807*4bdc9457SAndroid Build Coastguard Worker       }
5808*4bdc9457SAndroid Build Coastguard Worker     }
5809*4bdc9457SAndroid Build Coastguard Worker   }
5810*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,n_gt_8)5811*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, n_gt_8) {
5812*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
5813*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5814*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5815*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
5816*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5817*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5818*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
5819*4bdc9457SAndroid Build Coastguard Worker           .m(5)
5820*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5821*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5822*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5823*4bdc9457SAndroid Build Coastguard Worker       }
5824*4bdc9457SAndroid Build Coastguard Worker     }
5825*4bdc9457SAndroid Build Coastguard Worker   }
5826*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_strided_cn)5827*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_cn) {
5828*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
5829*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5830*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5831*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
5832*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5833*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5834*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
5835*4bdc9457SAndroid Build Coastguard Worker           .m(5)
5836*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5837*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5838*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
5839*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5840*4bdc9457SAndroid Build Coastguard Worker       }
5841*4bdc9457SAndroid Build Coastguard Worker     }
5842*4bdc9457SAndroid Build Coastguard Worker   }
5843*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_subtile)5844*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_subtile) {
5845*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
5846*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5847*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
5848*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5849*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
5850*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5851*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5852*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
5853*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5854*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5855*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5856*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5857*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5858*4bdc9457SAndroid Build Coastguard Worker         }
5859*4bdc9457SAndroid Build Coastguard Worker       }
5860*4bdc9457SAndroid Build Coastguard Worker     }
5861*4bdc9457SAndroid Build Coastguard Worker   }
5862*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,n_div_8)5863*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, n_div_8) {
5864*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
5865*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5866*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5867*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
5868*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5869*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5870*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
5871*4bdc9457SAndroid Build Coastguard Worker           .m(5)
5872*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5873*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5874*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5875*4bdc9457SAndroid Build Coastguard Worker       }
5876*4bdc9457SAndroid Build Coastguard Worker     }
5877*4bdc9457SAndroid Build Coastguard Worker   }
5878*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,n_div_8_strided_cn)5879*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_cn) {
5880*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
5881*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5882*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5883*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
5884*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5885*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5886*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
5887*4bdc9457SAndroid Build Coastguard Worker           .m(5)
5888*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5889*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5890*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
5891*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5892*4bdc9457SAndroid Build Coastguard Worker       }
5893*4bdc9457SAndroid Build Coastguard Worker     }
5894*4bdc9457SAndroid Build Coastguard Worker   }
5895*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,n_div_8_subtile)5896*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, n_div_8_subtile) {
5897*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
5898*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5899*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
5900*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5901*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
5902*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5903*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5904*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
5905*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5906*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5907*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5908*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5909*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5910*4bdc9457SAndroid Build Coastguard Worker         }
5911*4bdc9457SAndroid Build Coastguard Worker       }
5912*4bdc9457SAndroid Build Coastguard Worker     }
5913*4bdc9457SAndroid Build Coastguard Worker   }
5914*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,small_kernel)5915*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, small_kernel) {
5916*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
5917*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
5918*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
5919*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
5920*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
5921*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
5922*4bdc9457SAndroid Build Coastguard Worker         .m(5)
5923*4bdc9457SAndroid Build Coastguard Worker         .n(8)
5924*4bdc9457SAndroid Build Coastguard Worker         .k(k)
5925*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
5926*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5927*4bdc9457SAndroid Build Coastguard Worker     }
5928*4bdc9457SAndroid Build Coastguard Worker   }
5929*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,small_kernel_subtile)5930*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, small_kernel_subtile) {
5931*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
5932*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
5933*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
5934*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5935*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
5936*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5937*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5938*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
5939*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5940*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5941*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5942*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
5943*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5944*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5945*4bdc9457SAndroid Build Coastguard Worker         }
5946*4bdc9457SAndroid Build Coastguard Worker       }
5947*4bdc9457SAndroid Build Coastguard Worker     }
5948*4bdc9457SAndroid Build Coastguard Worker   }
5949*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_small_kernel)5950*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_small_kernel) {
5951*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
5952*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5953*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5954*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
5955*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5956*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5957*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
5958*4bdc9457SAndroid Build Coastguard Worker           .m(5)
5959*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5960*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5961*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
5962*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5963*4bdc9457SAndroid Build Coastguard Worker       }
5964*4bdc9457SAndroid Build Coastguard Worker     }
5965*4bdc9457SAndroid Build Coastguard Worker   }
5966*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,n_div_8_small_kernel)5967*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, n_div_8_small_kernel) {
5968*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
5969*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
5970*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
5971*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
5972*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
5973*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
5974*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
5975*4bdc9457SAndroid Build Coastguard Worker           .m(5)
5976*4bdc9457SAndroid Build Coastguard Worker           .n(n)
5977*4bdc9457SAndroid Build Coastguard Worker           .k(k)
5978*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
5979*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5980*4bdc9457SAndroid Build Coastguard Worker       }
5981*4bdc9457SAndroid Build Coastguard Worker     }
5982*4bdc9457SAndroid Build Coastguard Worker   }
5983*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,strided_cm_subtile)5984*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, strided_cm_subtile) {
5985*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
5986*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
5987*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 5; m++) {
5988*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
5989*4bdc9457SAndroid Build Coastguard Worker             .mr(5)
5990*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
5991*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
5992*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
5993*4bdc9457SAndroid Build Coastguard Worker             .m(m)
5994*4bdc9457SAndroid Build Coastguard Worker             .n(n)
5995*4bdc9457SAndroid Build Coastguard Worker             .k(k)
5996*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(11)
5997*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
5998*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5999*4bdc9457SAndroid Build Coastguard Worker         }
6000*4bdc9457SAndroid Build Coastguard Worker       }
6001*4bdc9457SAndroid Build Coastguard Worker     }
6002*4bdc9457SAndroid Build Coastguard Worker   }
6003*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,a_offset)6004*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, a_offset) {
6005*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
6006*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6007*4bdc9457SAndroid Build Coastguard Worker         .mr(5)
6008*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
6009*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6010*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
6011*4bdc9457SAndroid Build Coastguard Worker         .m(5)
6012*4bdc9457SAndroid Build Coastguard Worker         .n(8)
6013*4bdc9457SAndroid Build Coastguard Worker         .k(k)
6014*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
6015*4bdc9457SAndroid Build Coastguard Worker         .a_offset(103)
6016*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
6017*4bdc9457SAndroid Build Coastguard Worker     }
6018*4bdc9457SAndroid Build Coastguard Worker   }
6019*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,zero)6020*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, zero) {
6021*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
6022*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 5; mz++) {
6023*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6024*4bdc9457SAndroid Build Coastguard Worker           .mr(5)
6025*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6026*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6027*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
6028*4bdc9457SAndroid Build Coastguard Worker           .m(5)
6029*4bdc9457SAndroid Build Coastguard Worker           .n(8)
6030*4bdc9457SAndroid Build Coastguard Worker           .k(k)
6031*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
6032*4bdc9457SAndroid Build Coastguard Worker           .a_offset(103)
6033*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
6034*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
6035*4bdc9457SAndroid Build Coastguard Worker       }
6036*4bdc9457SAndroid Build Coastguard Worker     }
6037*4bdc9457SAndroid Build Coastguard Worker   }
6038*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,strided_cm)6039*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, strided_cm) {
6040*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
6041*4bdc9457SAndroid Build Coastguard Worker       .mr(5)
6042*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
6043*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
6044*4bdc9457SAndroid Build Coastguard Worker       .sr(4)
6045*4bdc9457SAndroid Build Coastguard Worker       .m(5)
6046*4bdc9457SAndroid Build Coastguard Worker       .n(8)
6047*4bdc9457SAndroid Build Coastguard Worker       .k(4)
6048*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(11)
6049*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
6050*4bdc9457SAndroid Build Coastguard Worker   }
6051*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMRELAXEDSIMD
6052*4bdc9457SAndroid Build Coastguard Worker 
6053*4bdc9457SAndroid Build Coastguard Worker 
6054*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4)6055*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4) {
6056*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
6057*4bdc9457SAndroid Build Coastguard Worker       .mr(6)
6058*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
6059*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
6060*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
6061*4bdc9457SAndroid Build Coastguard Worker       .m(6)
6062*4bdc9457SAndroid Build Coastguard Worker       .n(8)
6063*4bdc9457SAndroid Build Coastguard Worker       .k(4)
6064*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6065*4bdc9457SAndroid Build Coastguard Worker   }
6066*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,strided_cn)6067*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cn) {
6068*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
6069*4bdc9457SAndroid Build Coastguard Worker       .mr(6)
6070*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
6071*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
6072*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
6073*4bdc9457SAndroid Build Coastguard Worker       .m(6)
6074*4bdc9457SAndroid Build Coastguard Worker       .n(8)
6075*4bdc9457SAndroid Build Coastguard Worker       .k(4)
6076*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(11)
6077*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6078*4bdc9457SAndroid Build Coastguard Worker   }
6079*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4_subtile)6080*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile) {
6081*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
6082*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 6; m++) {
6083*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6084*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
6085*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6086*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6087*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
6088*4bdc9457SAndroid Build Coastguard Worker           .m(m)
6089*4bdc9457SAndroid Build Coastguard Worker           .n(n)
6090*4bdc9457SAndroid Build Coastguard Worker           .k(4)
6091*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
6092*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6093*4bdc9457SAndroid Build Coastguard Worker       }
6094*4bdc9457SAndroid Build Coastguard Worker     }
6095*4bdc9457SAndroid Build Coastguard Worker   }
6096*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4_subtile_m)6097*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_m) {
6098*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 6; m++) {
6099*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6100*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
6101*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
6102*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6103*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
6104*4bdc9457SAndroid Build Coastguard Worker         .m(m)
6105*4bdc9457SAndroid Build Coastguard Worker         .n(8)
6106*4bdc9457SAndroid Build Coastguard Worker         .k(4)
6107*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
6108*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6109*4bdc9457SAndroid Build Coastguard Worker     }
6110*4bdc9457SAndroid Build Coastguard Worker   }
6111*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,k_eq_4_subtile_n)6112*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_n) {
6113*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
6114*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6115*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
6116*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
6117*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6118*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
6119*4bdc9457SAndroid Build Coastguard Worker         .m(6)
6120*4bdc9457SAndroid Build Coastguard Worker         .n(n)
6121*4bdc9457SAndroid Build Coastguard Worker         .k(4)
6122*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
6123*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6124*4bdc9457SAndroid Build Coastguard Worker     }
6125*4bdc9457SAndroid Build Coastguard Worker   }
6126*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,k_lt_4)6127*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4) {
6128*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
6129*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6130*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
6131*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
6132*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6133*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
6134*4bdc9457SAndroid Build Coastguard Worker         .m(6)
6135*4bdc9457SAndroid Build Coastguard Worker         .n(8)
6136*4bdc9457SAndroid Build Coastguard Worker         .k(k)
6137*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6138*4bdc9457SAndroid Build Coastguard Worker     }
6139*4bdc9457SAndroid Build Coastguard Worker   }
6140*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,k_lt_4_subtile)6141*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4_subtile) {
6142*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
6143*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
6144*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
6145*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
6146*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
6147*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
6148*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
6149*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
6150*4bdc9457SAndroid Build Coastguard Worker             .m(m)
6151*4bdc9457SAndroid Build Coastguard Worker             .n(n)
6152*4bdc9457SAndroid Build Coastguard Worker             .k(k)
6153*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
6154*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6155*4bdc9457SAndroid Build Coastguard Worker         }
6156*4bdc9457SAndroid Build Coastguard Worker       }
6157*4bdc9457SAndroid Build Coastguard Worker     }
6158*4bdc9457SAndroid Build Coastguard Worker   }
6159*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,k_gt_4)6160*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4) {
6161*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
6162*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6163*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
6164*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
6165*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6166*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
6167*4bdc9457SAndroid Build Coastguard Worker         .m(6)
6168*4bdc9457SAndroid Build Coastguard Worker         .n(8)
6169*4bdc9457SAndroid Build Coastguard Worker         .k(k)
6170*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6171*4bdc9457SAndroid Build Coastguard Worker     }
6172*4bdc9457SAndroid Build Coastguard Worker   }
6173*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,k_gt_4_subtile)6174*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4_subtile) {
6175*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
6176*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
6177*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
6178*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
6179*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
6180*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
6181*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
6182*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
6183*4bdc9457SAndroid Build Coastguard Worker             .m(m)
6184*4bdc9457SAndroid Build Coastguard Worker             .n(n)
6185*4bdc9457SAndroid Build Coastguard Worker             .k(k)
6186*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
6187*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6188*4bdc9457SAndroid Build Coastguard Worker         }
6189*4bdc9457SAndroid Build Coastguard Worker       }
6190*4bdc9457SAndroid Build Coastguard Worker     }
6191*4bdc9457SAndroid Build Coastguard Worker   }
6192*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,k_div_4)6193*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4) {
6194*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
6195*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6196*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
6197*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
6198*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6199*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
6200*4bdc9457SAndroid Build Coastguard Worker         .m(6)
6201*4bdc9457SAndroid Build Coastguard Worker         .n(8)
6202*4bdc9457SAndroid Build Coastguard Worker         .k(k)
6203*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6204*4bdc9457SAndroid Build Coastguard Worker     }
6205*4bdc9457SAndroid Build Coastguard Worker   }
6206*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,k_div_4_subtile)6207*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4_subtile) {
6208*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
6209*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
6210*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
6211*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
6212*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
6213*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
6214*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
6215*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
6216*4bdc9457SAndroid Build Coastguard Worker             .m(m)
6217*4bdc9457SAndroid Build Coastguard Worker             .n(n)
6218*4bdc9457SAndroid Build Coastguard Worker             .k(k)
6219*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
6220*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6221*4bdc9457SAndroid Build Coastguard Worker         }
6222*4bdc9457SAndroid Build Coastguard Worker       }
6223*4bdc9457SAndroid Build Coastguard Worker     }
6224*4bdc9457SAndroid Build Coastguard Worker   }
6225*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8)6226*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8) {
6227*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
6228*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
6229*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6230*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
6231*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6232*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6233*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
6234*4bdc9457SAndroid Build Coastguard Worker           .m(6)
6235*4bdc9457SAndroid Build Coastguard Worker           .n(n)
6236*4bdc9457SAndroid Build Coastguard Worker           .k(k)
6237*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6238*4bdc9457SAndroid Build Coastguard Worker       }
6239*4bdc9457SAndroid Build Coastguard Worker     }
6240*4bdc9457SAndroid Build Coastguard Worker   }
6241*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8_strided_cn)6242*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_strided_cn) {
6243*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
6244*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
6245*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6246*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
6247*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6248*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6249*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
6250*4bdc9457SAndroid Build Coastguard Worker           .m(6)
6251*4bdc9457SAndroid Build Coastguard Worker           .n(n)
6252*4bdc9457SAndroid Build Coastguard Worker           .k(k)
6253*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
6254*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6255*4bdc9457SAndroid Build Coastguard Worker       }
6256*4bdc9457SAndroid Build Coastguard Worker     }
6257*4bdc9457SAndroid Build Coastguard Worker   }
6258*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8_subtile)6259*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_subtile) {
6260*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
6261*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
6262*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
6263*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
6264*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
6265*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
6266*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
6267*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
6268*4bdc9457SAndroid Build Coastguard Worker             .m(m)
6269*4bdc9457SAndroid Build Coastguard Worker             .n(n)
6270*4bdc9457SAndroid Build Coastguard Worker             .k(k)
6271*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
6272*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6273*4bdc9457SAndroid Build Coastguard Worker         }
6274*4bdc9457SAndroid Build Coastguard Worker       }
6275*4bdc9457SAndroid Build Coastguard Worker     }
6276*4bdc9457SAndroid Build Coastguard Worker   }
6277*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8)6278*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8) {
6279*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
6280*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
6281*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6282*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
6283*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6284*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6285*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
6286*4bdc9457SAndroid Build Coastguard Worker           .m(6)
6287*4bdc9457SAndroid Build Coastguard Worker           .n(n)
6288*4bdc9457SAndroid Build Coastguard Worker           .k(k)
6289*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6290*4bdc9457SAndroid Build Coastguard Worker       }
6291*4bdc9457SAndroid Build Coastguard Worker     }
6292*4bdc9457SAndroid Build Coastguard Worker   }
6293*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8_strided_cn)6294*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_strided_cn) {
6295*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
6296*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
6297*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6298*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
6299*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6300*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6301*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
6302*4bdc9457SAndroid Build Coastguard Worker           .m(6)
6303*4bdc9457SAndroid Build Coastguard Worker           .n(n)
6304*4bdc9457SAndroid Build Coastguard Worker           .k(k)
6305*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
6306*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6307*4bdc9457SAndroid Build Coastguard Worker       }
6308*4bdc9457SAndroid Build Coastguard Worker     }
6309*4bdc9457SAndroid Build Coastguard Worker   }
6310*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8_subtile)6311*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_subtile) {
6312*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
6313*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
6314*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
6315*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
6316*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
6317*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
6318*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
6319*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
6320*4bdc9457SAndroid Build Coastguard Worker             .m(m)
6321*4bdc9457SAndroid Build Coastguard Worker             .n(n)
6322*4bdc9457SAndroid Build Coastguard Worker             .k(k)
6323*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
6324*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6325*4bdc9457SAndroid Build Coastguard Worker         }
6326*4bdc9457SAndroid Build Coastguard Worker       }
6327*4bdc9457SAndroid Build Coastguard Worker     }
6328*4bdc9457SAndroid Build Coastguard Worker   }
6329*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,small_kernel)6330*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, small_kernel) {
6331*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
6332*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6333*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
6334*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
6335*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6336*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
6337*4bdc9457SAndroid Build Coastguard Worker         .m(6)
6338*4bdc9457SAndroid Build Coastguard Worker         .n(8)
6339*4bdc9457SAndroid Build Coastguard Worker         .k(k)
6340*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
6341*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6342*4bdc9457SAndroid Build Coastguard Worker     }
6343*4bdc9457SAndroid Build Coastguard Worker   }
6344*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,small_kernel_subtile)6345*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, small_kernel_subtile) {
6346*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
6347*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
6348*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
6349*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
6350*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
6351*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
6352*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
6353*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
6354*4bdc9457SAndroid Build Coastguard Worker             .m(m)
6355*4bdc9457SAndroid Build Coastguard Worker             .n(n)
6356*4bdc9457SAndroid Build Coastguard Worker             .k(k)
6357*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
6358*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
6359*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6360*4bdc9457SAndroid Build Coastguard Worker         }
6361*4bdc9457SAndroid Build Coastguard Worker       }
6362*4bdc9457SAndroid Build Coastguard Worker     }
6363*4bdc9457SAndroid Build Coastguard Worker   }
6364*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,n_gt_8_small_kernel)6365*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_small_kernel) {
6366*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
6367*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
6368*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6369*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
6370*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6371*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6372*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
6373*4bdc9457SAndroid Build Coastguard Worker           .m(6)
6374*4bdc9457SAndroid Build Coastguard Worker           .n(n)
6375*4bdc9457SAndroid Build Coastguard Worker           .k(k)
6376*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
6377*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6378*4bdc9457SAndroid Build Coastguard Worker       }
6379*4bdc9457SAndroid Build Coastguard Worker     }
6380*4bdc9457SAndroid Build Coastguard Worker   }
6381*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,n_div_8_small_kernel)6382*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_small_kernel) {
6383*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
6384*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
6385*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6386*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
6387*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6388*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6389*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
6390*4bdc9457SAndroid Build Coastguard Worker           .m(6)
6391*4bdc9457SAndroid Build Coastguard Worker           .n(n)
6392*4bdc9457SAndroid Build Coastguard Worker           .k(k)
6393*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
6394*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6395*4bdc9457SAndroid Build Coastguard Worker       }
6396*4bdc9457SAndroid Build Coastguard Worker     }
6397*4bdc9457SAndroid Build Coastguard Worker   }
6398*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,strided_cm_subtile)6399*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm_subtile) {
6400*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
6401*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
6402*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
6403*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
6404*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
6405*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
6406*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
6407*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
6408*4bdc9457SAndroid Build Coastguard Worker             .m(m)
6409*4bdc9457SAndroid Build Coastguard Worker             .n(n)
6410*4bdc9457SAndroid Build Coastguard Worker             .k(k)
6411*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(11)
6412*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
6413*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6414*4bdc9457SAndroid Build Coastguard Worker         }
6415*4bdc9457SAndroid Build Coastguard Worker       }
6416*4bdc9457SAndroid Build Coastguard Worker     }
6417*4bdc9457SAndroid Build Coastguard Worker   }
6418*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,a_offset)6419*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, a_offset) {
6420*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
6421*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6422*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
6423*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
6424*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6425*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
6426*4bdc9457SAndroid Build Coastguard Worker         .m(6)
6427*4bdc9457SAndroid Build Coastguard Worker         .n(8)
6428*4bdc9457SAndroid Build Coastguard Worker         .k(k)
6429*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
6430*4bdc9457SAndroid Build Coastguard Worker         .a_offset(127)
6431*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6432*4bdc9457SAndroid Build Coastguard Worker     }
6433*4bdc9457SAndroid Build Coastguard Worker   }
6434*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,zero)6435*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, zero) {
6436*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
6437*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 6; mz++) {
6438*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6439*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
6440*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6441*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6442*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
6443*4bdc9457SAndroid Build Coastguard Worker           .m(6)
6444*4bdc9457SAndroid Build Coastguard Worker           .n(8)
6445*4bdc9457SAndroid Build Coastguard Worker           .k(k)
6446*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
6447*4bdc9457SAndroid Build Coastguard Worker           .a_offset(127)
6448*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
6449*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6450*4bdc9457SAndroid Build Coastguard Worker       }
6451*4bdc9457SAndroid Build Coastguard Worker     }
6452*4bdc9457SAndroid Build Coastguard Worker   }
6453*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT,strided_cm)6454*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm) {
6455*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
6456*4bdc9457SAndroid Build Coastguard Worker       .mr(6)
6457*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
6458*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
6459*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
6460*4bdc9457SAndroid Build Coastguard Worker       .m(6)
6461*4bdc9457SAndroid Build Coastguard Worker       .n(8)
6462*4bdc9457SAndroid Build Coastguard Worker       .k(4)
6463*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(11)
6464*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
6465*4bdc9457SAndroid Build Coastguard Worker   }
6466*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMRELAXEDSIMD
6467*4bdc9457SAndroid Build Coastguard Worker 
6468*4bdc9457SAndroid Build Coastguard Worker 
6469*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_eq_4)6470*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_eq_4) {
6471*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
6472*4bdc9457SAndroid Build Coastguard Worker       .mr(6)
6473*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
6474*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
6475*4bdc9457SAndroid Build Coastguard Worker       .sr(4)
6476*4bdc9457SAndroid Build Coastguard Worker       .m(6)
6477*4bdc9457SAndroid Build Coastguard Worker       .n(8)
6478*4bdc9457SAndroid Build Coastguard Worker       .k(4)
6479*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6480*4bdc9457SAndroid Build Coastguard Worker   }
6481*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,strided_cn)6482*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, strided_cn) {
6483*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
6484*4bdc9457SAndroid Build Coastguard Worker       .mr(6)
6485*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
6486*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
6487*4bdc9457SAndroid Build Coastguard Worker       .sr(4)
6488*4bdc9457SAndroid Build Coastguard Worker       .m(6)
6489*4bdc9457SAndroid Build Coastguard Worker       .n(8)
6490*4bdc9457SAndroid Build Coastguard Worker       .k(4)
6491*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(11)
6492*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6493*4bdc9457SAndroid Build Coastguard Worker   }
6494*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile)6495*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile) {
6496*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
6497*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 6; m++) {
6498*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6499*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
6500*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6501*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6502*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
6503*4bdc9457SAndroid Build Coastguard Worker           .m(m)
6504*4bdc9457SAndroid Build Coastguard Worker           .n(n)
6505*4bdc9457SAndroid Build Coastguard Worker           .k(4)
6506*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
6507*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6508*4bdc9457SAndroid Build Coastguard Worker       }
6509*4bdc9457SAndroid Build Coastguard Worker     }
6510*4bdc9457SAndroid Build Coastguard Worker   }
6511*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile_m)6512*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_m) {
6513*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 6; m++) {
6514*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6515*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
6516*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
6517*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6518*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
6519*4bdc9457SAndroid Build Coastguard Worker         .m(m)
6520*4bdc9457SAndroid Build Coastguard Worker         .n(8)
6521*4bdc9457SAndroid Build Coastguard Worker         .k(4)
6522*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
6523*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6524*4bdc9457SAndroid Build Coastguard Worker     }
6525*4bdc9457SAndroid Build Coastguard Worker   }
6526*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile_n)6527*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_n) {
6528*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 8; n++) {
6529*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6530*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
6531*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
6532*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6533*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
6534*4bdc9457SAndroid Build Coastguard Worker         .m(6)
6535*4bdc9457SAndroid Build Coastguard Worker         .n(n)
6536*4bdc9457SAndroid Build Coastguard Worker         .k(4)
6537*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
6538*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6539*4bdc9457SAndroid Build Coastguard Worker     }
6540*4bdc9457SAndroid Build Coastguard Worker   }
6541*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_lt_4)6542*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_lt_4) {
6543*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
6544*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6545*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
6546*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
6547*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6548*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
6549*4bdc9457SAndroid Build Coastguard Worker         .m(6)
6550*4bdc9457SAndroid Build Coastguard Worker         .n(8)
6551*4bdc9457SAndroid Build Coastguard Worker         .k(k)
6552*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6553*4bdc9457SAndroid Build Coastguard Worker     }
6554*4bdc9457SAndroid Build Coastguard Worker   }
6555*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_lt_4_subtile)6556*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_subtile) {
6557*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k < 4; k++) {
6558*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
6559*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
6560*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
6561*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
6562*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
6563*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
6564*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
6565*4bdc9457SAndroid Build Coastguard Worker             .m(m)
6566*4bdc9457SAndroid Build Coastguard Worker             .n(n)
6567*4bdc9457SAndroid Build Coastguard Worker             .k(k)
6568*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
6569*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6570*4bdc9457SAndroid Build Coastguard Worker         }
6571*4bdc9457SAndroid Build Coastguard Worker       }
6572*4bdc9457SAndroid Build Coastguard Worker     }
6573*4bdc9457SAndroid Build Coastguard Worker   }
6574*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_gt_4)6575*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_gt_4) {
6576*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
6577*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6578*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
6579*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
6580*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6581*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
6582*4bdc9457SAndroid Build Coastguard Worker         .m(6)
6583*4bdc9457SAndroid Build Coastguard Worker         .n(8)
6584*4bdc9457SAndroid Build Coastguard Worker         .k(k)
6585*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6586*4bdc9457SAndroid Build Coastguard Worker     }
6587*4bdc9457SAndroid Build Coastguard Worker   }
6588*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_gt_4_subtile)6589*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_subtile) {
6590*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 5; k < 8; k++) {
6591*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
6592*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
6593*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
6594*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
6595*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
6596*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
6597*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
6598*4bdc9457SAndroid Build Coastguard Worker             .m(m)
6599*4bdc9457SAndroid Build Coastguard Worker             .n(n)
6600*4bdc9457SAndroid Build Coastguard Worker             .k(k)
6601*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
6602*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6603*4bdc9457SAndroid Build Coastguard Worker         }
6604*4bdc9457SAndroid Build Coastguard Worker       }
6605*4bdc9457SAndroid Build Coastguard Worker     }
6606*4bdc9457SAndroid Build Coastguard Worker   }
6607*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_div_4)6608*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_div_4) {
6609*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
6610*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6611*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
6612*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
6613*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6614*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
6615*4bdc9457SAndroid Build Coastguard Worker         .m(6)
6616*4bdc9457SAndroid Build Coastguard Worker         .n(8)
6617*4bdc9457SAndroid Build Coastguard Worker         .k(k)
6618*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6619*4bdc9457SAndroid Build Coastguard Worker     }
6620*4bdc9457SAndroid Build Coastguard Worker   }
6621*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_div_4_subtile)6622*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_div_4_subtile) {
6623*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 8; k <= 40; k += 4) {
6624*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
6625*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
6626*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
6627*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
6628*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
6629*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
6630*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
6631*4bdc9457SAndroid Build Coastguard Worker             .m(m)
6632*4bdc9457SAndroid Build Coastguard Worker             .n(n)
6633*4bdc9457SAndroid Build Coastguard Worker             .k(k)
6634*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
6635*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6636*4bdc9457SAndroid Build Coastguard Worker         }
6637*4bdc9457SAndroid Build Coastguard Worker       }
6638*4bdc9457SAndroid Build Coastguard Worker     }
6639*4bdc9457SAndroid Build Coastguard Worker   }
6640*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,n_gt_8)6641*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, n_gt_8) {
6642*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
6643*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
6644*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6645*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
6646*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6647*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6648*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
6649*4bdc9457SAndroid Build Coastguard Worker           .m(6)
6650*4bdc9457SAndroid Build Coastguard Worker           .n(n)
6651*4bdc9457SAndroid Build Coastguard Worker           .k(k)
6652*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6653*4bdc9457SAndroid Build Coastguard Worker       }
6654*4bdc9457SAndroid Build Coastguard Worker     }
6655*4bdc9457SAndroid Build Coastguard Worker   }
6656*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_strided_cn)6657*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_cn) {
6658*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
6659*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
6660*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6661*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
6662*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6663*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6664*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
6665*4bdc9457SAndroid Build Coastguard Worker           .m(6)
6666*4bdc9457SAndroid Build Coastguard Worker           .n(n)
6667*4bdc9457SAndroid Build Coastguard Worker           .k(k)
6668*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
6669*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6670*4bdc9457SAndroid Build Coastguard Worker       }
6671*4bdc9457SAndroid Build Coastguard Worker     }
6672*4bdc9457SAndroid Build Coastguard Worker   }
6673*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_subtile)6674*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_subtile) {
6675*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
6676*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
6677*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
6678*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
6679*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
6680*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
6681*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
6682*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
6683*4bdc9457SAndroid Build Coastguard Worker             .m(m)
6684*4bdc9457SAndroid Build Coastguard Worker             .n(n)
6685*4bdc9457SAndroid Build Coastguard Worker             .k(k)
6686*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
6687*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6688*4bdc9457SAndroid Build Coastguard Worker         }
6689*4bdc9457SAndroid Build Coastguard Worker       }
6690*4bdc9457SAndroid Build Coastguard Worker     }
6691*4bdc9457SAndroid Build Coastguard Worker   }
6692*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,n_div_8)6693*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, n_div_8) {
6694*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
6695*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
6696*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6697*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
6698*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6699*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6700*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
6701*4bdc9457SAndroid Build Coastguard Worker           .m(6)
6702*4bdc9457SAndroid Build Coastguard Worker           .n(n)
6703*4bdc9457SAndroid Build Coastguard Worker           .k(k)
6704*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6705*4bdc9457SAndroid Build Coastguard Worker       }
6706*4bdc9457SAndroid Build Coastguard Worker     }
6707*4bdc9457SAndroid Build Coastguard Worker   }
6708*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,n_div_8_strided_cn)6709*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_cn) {
6710*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
6711*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
6712*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6713*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
6714*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6715*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6716*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
6717*4bdc9457SAndroid Build Coastguard Worker           .m(6)
6718*4bdc9457SAndroid Build Coastguard Worker           .n(n)
6719*4bdc9457SAndroid Build Coastguard Worker           .k(k)
6720*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(11)
6721*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6722*4bdc9457SAndroid Build Coastguard Worker       }
6723*4bdc9457SAndroid Build Coastguard Worker     }
6724*4bdc9457SAndroid Build Coastguard Worker   }
6725*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,n_div_8_subtile)6726*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, n_div_8_subtile) {
6727*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
6728*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
6729*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
6730*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
6731*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
6732*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
6733*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
6734*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
6735*4bdc9457SAndroid Build Coastguard Worker             .m(m)
6736*4bdc9457SAndroid Build Coastguard Worker             .n(n)
6737*4bdc9457SAndroid Build Coastguard Worker             .k(k)
6738*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
6739*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6740*4bdc9457SAndroid Build Coastguard Worker         }
6741*4bdc9457SAndroid Build Coastguard Worker       }
6742*4bdc9457SAndroid Build Coastguard Worker     }
6743*4bdc9457SAndroid Build Coastguard Worker   }
6744*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,small_kernel)6745*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, small_kernel) {
6746*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
6747*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6748*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
6749*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
6750*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6751*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
6752*4bdc9457SAndroid Build Coastguard Worker         .m(6)
6753*4bdc9457SAndroid Build Coastguard Worker         .n(8)
6754*4bdc9457SAndroid Build Coastguard Worker         .k(k)
6755*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
6756*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6757*4bdc9457SAndroid Build Coastguard Worker     }
6758*4bdc9457SAndroid Build Coastguard Worker   }
6759*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,small_kernel_subtile)6760*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, small_kernel_subtile) {
6761*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
6762*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
6763*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
6764*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
6765*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
6766*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
6767*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
6768*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
6769*4bdc9457SAndroid Build Coastguard Worker             .m(m)
6770*4bdc9457SAndroid Build Coastguard Worker             .n(n)
6771*4bdc9457SAndroid Build Coastguard Worker             .k(k)
6772*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
6773*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
6774*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6775*4bdc9457SAndroid Build Coastguard Worker         }
6776*4bdc9457SAndroid Build Coastguard Worker       }
6777*4bdc9457SAndroid Build Coastguard Worker     }
6778*4bdc9457SAndroid Build Coastguard Worker   }
6779*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_small_kernel)6780*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_small_kernel) {
6781*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 9; n < 16; n++) {
6782*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
6783*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6784*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
6785*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6786*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6787*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
6788*4bdc9457SAndroid Build Coastguard Worker           .m(6)
6789*4bdc9457SAndroid Build Coastguard Worker           .n(n)
6790*4bdc9457SAndroid Build Coastguard Worker           .k(k)
6791*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
6792*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6793*4bdc9457SAndroid Build Coastguard Worker       }
6794*4bdc9457SAndroid Build Coastguard Worker     }
6795*4bdc9457SAndroid Build Coastguard Worker   }
6796*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,n_div_8_small_kernel)6797*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, n_div_8_small_kernel) {
6798*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 16; n <= 24; n += 8) {
6799*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 20; k += 5) {
6800*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6801*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
6802*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6803*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6804*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
6805*4bdc9457SAndroid Build Coastguard Worker           .m(6)
6806*4bdc9457SAndroid Build Coastguard Worker           .n(n)
6807*4bdc9457SAndroid Build Coastguard Worker           .k(k)
6808*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
6809*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6810*4bdc9457SAndroid Build Coastguard Worker       }
6811*4bdc9457SAndroid Build Coastguard Worker     }
6812*4bdc9457SAndroid Build Coastguard Worker   }
6813*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,strided_cm_subtile)6814*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, strided_cm_subtile) {
6815*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
6816*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 8; n++) {
6817*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 6; m++) {
6818*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
6819*4bdc9457SAndroid Build Coastguard Worker             .mr(6)
6820*4bdc9457SAndroid Build Coastguard Worker             .nr(8)
6821*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
6822*4bdc9457SAndroid Build Coastguard Worker             .sr(4)
6823*4bdc9457SAndroid Build Coastguard Worker             .m(m)
6824*4bdc9457SAndroid Build Coastguard Worker             .n(n)
6825*4bdc9457SAndroid Build Coastguard Worker             .k(k)
6826*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(11)
6827*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
6828*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6829*4bdc9457SAndroid Build Coastguard Worker         }
6830*4bdc9457SAndroid Build Coastguard Worker       }
6831*4bdc9457SAndroid Build Coastguard Worker     }
6832*4bdc9457SAndroid Build Coastguard Worker   }
6833*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,a_offset)6834*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, a_offset) {
6835*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
6836*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6837*4bdc9457SAndroid Build Coastguard Worker         .mr(6)
6838*4bdc9457SAndroid Build Coastguard Worker         .nr(8)
6839*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6840*4bdc9457SAndroid Build Coastguard Worker         .sr(4)
6841*4bdc9457SAndroid Build Coastguard Worker         .m(6)
6842*4bdc9457SAndroid Build Coastguard Worker         .n(8)
6843*4bdc9457SAndroid Build Coastguard Worker         .k(k)
6844*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
6845*4bdc9457SAndroid Build Coastguard Worker         .a_offset(127)
6846*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6847*4bdc9457SAndroid Build Coastguard Worker     }
6848*4bdc9457SAndroid Build Coastguard Worker   }
6849*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,zero)6850*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, zero) {
6851*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 20; k += 5) {
6852*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 6; mz++) {
6853*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6854*4bdc9457SAndroid Build Coastguard Worker           .mr(6)
6855*4bdc9457SAndroid Build Coastguard Worker           .nr(8)
6856*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6857*4bdc9457SAndroid Build Coastguard Worker           .sr(4)
6858*4bdc9457SAndroid Build Coastguard Worker           .m(6)
6859*4bdc9457SAndroid Build Coastguard Worker           .n(8)
6860*4bdc9457SAndroid Build Coastguard Worker           .k(k)
6861*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
6862*4bdc9457SAndroid Build Coastguard Worker           .a_offset(127)
6863*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
6864*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6865*4bdc9457SAndroid Build Coastguard Worker       }
6866*4bdc9457SAndroid Build Coastguard Worker     }
6867*4bdc9457SAndroid Build Coastguard Worker   }
6868*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,strided_cm)6869*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, strided_cm) {
6870*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
6871*4bdc9457SAndroid Build Coastguard Worker       .mr(6)
6872*4bdc9457SAndroid Build Coastguard Worker       .nr(8)
6873*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
6874*4bdc9457SAndroid Build Coastguard Worker       .sr(4)
6875*4bdc9457SAndroid Build Coastguard Worker       .m(6)
6876*4bdc9457SAndroid Build Coastguard Worker       .n(8)
6877*4bdc9457SAndroid Build Coastguard Worker       .k(4)
6878*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(11)
6879*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6880*4bdc9457SAndroid Build Coastguard Worker   }
6881*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASMRELAXEDSIMD
6882*4bdc9457SAndroid Build Coastguard Worker 
6883*4bdc9457SAndroid Build Coastguard Worker 
6884*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_1X4__WASM,k_eq_1)6885*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, k_eq_1) {
6886*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
6887*4bdc9457SAndroid Build Coastguard Worker       .mr(1)
6888*4bdc9457SAndroid Build Coastguard Worker       .nr(4)
6889*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
6890*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
6891*4bdc9457SAndroid Build Coastguard Worker       .m(1)
6892*4bdc9457SAndroid Build Coastguard Worker       .n(4)
6893*4bdc9457SAndroid Build Coastguard Worker       .k(1)
6894*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
6895*4bdc9457SAndroid Build Coastguard Worker   }
6896*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,strided_cn)6897*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, strided_cn) {
6898*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
6899*4bdc9457SAndroid Build Coastguard Worker       .mr(1)
6900*4bdc9457SAndroid Build Coastguard Worker       .nr(4)
6901*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
6902*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
6903*4bdc9457SAndroid Build Coastguard Worker       .m(1)
6904*4bdc9457SAndroid Build Coastguard Worker       .n(4)
6905*4bdc9457SAndroid Build Coastguard Worker       .k(1)
6906*4bdc9457SAndroid Build Coastguard Worker       .cn_stride(7)
6907*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
6908*4bdc9457SAndroid Build Coastguard Worker   }
6909*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,k_eq_1_subtile)6910*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, k_eq_1_subtile) {
6911*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 4; n++) {
6912*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 1; m++) {
6913*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6914*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
6915*4bdc9457SAndroid Build Coastguard Worker           .nr(4)
6916*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6917*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
6918*4bdc9457SAndroid Build Coastguard Worker           .m(m)
6919*4bdc9457SAndroid Build Coastguard Worker           .n(n)
6920*4bdc9457SAndroid Build Coastguard Worker           .k(1)
6921*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
6922*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
6923*4bdc9457SAndroid Build Coastguard Worker       }
6924*4bdc9457SAndroid Build Coastguard Worker     }
6925*4bdc9457SAndroid Build Coastguard Worker   }
6926*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,k_eq_1_subtile_m)6927*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, k_eq_1_subtile_m) {
6928*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 1; m++) {
6929*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6930*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
6931*4bdc9457SAndroid Build Coastguard Worker         .nr(4)
6932*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6933*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
6934*4bdc9457SAndroid Build Coastguard Worker         .m(m)
6935*4bdc9457SAndroid Build Coastguard Worker         .n(4)
6936*4bdc9457SAndroid Build Coastguard Worker         .k(1)
6937*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
6938*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
6939*4bdc9457SAndroid Build Coastguard Worker     }
6940*4bdc9457SAndroid Build Coastguard Worker   }
6941*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,k_eq_1_subtile_n)6942*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, k_eq_1_subtile_n) {
6943*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 4; n++) {
6944*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6945*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
6946*4bdc9457SAndroid Build Coastguard Worker         .nr(4)
6947*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6948*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
6949*4bdc9457SAndroid Build Coastguard Worker         .m(1)
6950*4bdc9457SAndroid Build Coastguard Worker         .n(n)
6951*4bdc9457SAndroid Build Coastguard Worker         .k(1)
6952*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
6953*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
6954*4bdc9457SAndroid Build Coastguard Worker     }
6955*4bdc9457SAndroid Build Coastguard Worker   }
6956*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,k_gt_1)6957*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, k_gt_1) {
6958*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 2; k < 10; k++) {
6959*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
6960*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
6961*4bdc9457SAndroid Build Coastguard Worker         .nr(4)
6962*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
6963*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
6964*4bdc9457SAndroid Build Coastguard Worker         .m(1)
6965*4bdc9457SAndroid Build Coastguard Worker         .n(4)
6966*4bdc9457SAndroid Build Coastguard Worker         .k(k)
6967*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
6968*4bdc9457SAndroid Build Coastguard Worker     }
6969*4bdc9457SAndroid Build Coastguard Worker   }
6970*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,k_gt_1_subtile)6971*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, k_gt_1_subtile) {
6972*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 2; k < 10; k++) {
6973*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 4; n++) {
6974*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
6975*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
6976*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
6977*4bdc9457SAndroid Build Coastguard Worker             .nr(4)
6978*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
6979*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
6980*4bdc9457SAndroid Build Coastguard Worker             .m(m)
6981*4bdc9457SAndroid Build Coastguard Worker             .n(n)
6982*4bdc9457SAndroid Build Coastguard Worker             .k(k)
6983*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
6984*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
6985*4bdc9457SAndroid Build Coastguard Worker         }
6986*4bdc9457SAndroid Build Coastguard Worker       }
6987*4bdc9457SAndroid Build Coastguard Worker     }
6988*4bdc9457SAndroid Build Coastguard Worker   }
6989*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,n_gt_4)6990*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, n_gt_4) {
6991*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 5; n < 8; n++) {
6992*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
6993*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
6994*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
6995*4bdc9457SAndroid Build Coastguard Worker           .nr(4)
6996*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
6997*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
6998*4bdc9457SAndroid Build Coastguard Worker           .m(1)
6999*4bdc9457SAndroid Build Coastguard Worker           .n(n)
7000*4bdc9457SAndroid Build Coastguard Worker           .k(k)
7001*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
7002*4bdc9457SAndroid Build Coastguard Worker       }
7003*4bdc9457SAndroid Build Coastguard Worker     }
7004*4bdc9457SAndroid Build Coastguard Worker   }
7005*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,n_gt_4_strided_cn)7006*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, n_gt_4_strided_cn) {
7007*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 5; n < 8; n++) {
7008*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
7009*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
7010*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
7011*4bdc9457SAndroid Build Coastguard Worker           .nr(4)
7012*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
7013*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
7014*4bdc9457SAndroid Build Coastguard Worker           .m(1)
7015*4bdc9457SAndroid Build Coastguard Worker           .n(n)
7016*4bdc9457SAndroid Build Coastguard Worker           .k(k)
7017*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(7)
7018*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
7019*4bdc9457SAndroid Build Coastguard Worker       }
7020*4bdc9457SAndroid Build Coastguard Worker     }
7021*4bdc9457SAndroid Build Coastguard Worker   }
7022*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,n_gt_4_subtile)7023*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, n_gt_4_subtile) {
7024*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 5; n < 8; n++) {
7025*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
7026*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
7027*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
7028*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
7029*4bdc9457SAndroid Build Coastguard Worker             .nr(4)
7030*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
7031*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
7032*4bdc9457SAndroid Build Coastguard Worker             .m(m)
7033*4bdc9457SAndroid Build Coastguard Worker             .n(n)
7034*4bdc9457SAndroid Build Coastguard Worker             .k(k)
7035*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
7036*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
7037*4bdc9457SAndroid Build Coastguard Worker         }
7038*4bdc9457SAndroid Build Coastguard Worker       }
7039*4bdc9457SAndroid Build Coastguard Worker     }
7040*4bdc9457SAndroid Build Coastguard Worker   }
7041*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,n_div_4)7042*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, n_div_4) {
7043*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 8; n <= 12; n += 4) {
7044*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
7045*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
7046*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
7047*4bdc9457SAndroid Build Coastguard Worker           .nr(4)
7048*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
7049*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
7050*4bdc9457SAndroid Build Coastguard Worker           .m(1)
7051*4bdc9457SAndroid Build Coastguard Worker           .n(n)
7052*4bdc9457SAndroid Build Coastguard Worker           .k(k)
7053*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
7054*4bdc9457SAndroid Build Coastguard Worker       }
7055*4bdc9457SAndroid Build Coastguard Worker     }
7056*4bdc9457SAndroid Build Coastguard Worker   }
7057*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,n_div_4_strided_cn)7058*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, n_div_4_strided_cn) {
7059*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 8; n <= 12; n += 4) {
7060*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
7061*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
7062*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
7063*4bdc9457SAndroid Build Coastguard Worker           .nr(4)
7064*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
7065*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
7066*4bdc9457SAndroid Build Coastguard Worker           .m(1)
7067*4bdc9457SAndroid Build Coastguard Worker           .n(n)
7068*4bdc9457SAndroid Build Coastguard Worker           .k(k)
7069*4bdc9457SAndroid Build Coastguard Worker           .cn_stride(7)
7070*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
7071*4bdc9457SAndroid Build Coastguard Worker       }
7072*4bdc9457SAndroid Build Coastguard Worker     }
7073*4bdc9457SAndroid Build Coastguard Worker   }
7074*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,n_div_4_subtile)7075*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, n_div_4_subtile) {
7076*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 8; n <= 12; n += 4) {
7077*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
7078*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
7079*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
7080*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
7081*4bdc9457SAndroid Build Coastguard Worker             .nr(4)
7082*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
7083*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
7084*4bdc9457SAndroid Build Coastguard Worker             .m(m)
7085*4bdc9457SAndroid Build Coastguard Worker             .n(n)
7086*4bdc9457SAndroid Build Coastguard Worker             .k(k)
7087*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
7088*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
7089*4bdc9457SAndroid Build Coastguard Worker         }
7090*4bdc9457SAndroid Build Coastguard Worker       }
7091*4bdc9457SAndroid Build Coastguard Worker     }
7092*4bdc9457SAndroid Build Coastguard Worker   }
7093*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,small_kernel)7094*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, small_kernel) {
7095*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
7096*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
7097*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
7098*4bdc9457SAndroid Build Coastguard Worker         .nr(4)
7099*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
7100*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
7101*4bdc9457SAndroid Build Coastguard Worker         .m(1)
7102*4bdc9457SAndroid Build Coastguard Worker         .n(4)
7103*4bdc9457SAndroid Build Coastguard Worker         .k(k)
7104*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
7105*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
7106*4bdc9457SAndroid Build Coastguard Worker     }
7107*4bdc9457SAndroid Build Coastguard Worker   }
7108*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,small_kernel_subtile)7109*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, small_kernel_subtile) {
7110*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
7111*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 4; n++) {
7112*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
7113*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
7114*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
7115*4bdc9457SAndroid Build Coastguard Worker             .nr(4)
7116*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
7117*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
7118*4bdc9457SAndroid Build Coastguard Worker             .m(m)
7119*4bdc9457SAndroid Build Coastguard Worker             .n(n)
7120*4bdc9457SAndroid Build Coastguard Worker             .k(k)
7121*4bdc9457SAndroid Build Coastguard Worker             .ks(3)
7122*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
7123*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
7124*4bdc9457SAndroid Build Coastguard Worker         }
7125*4bdc9457SAndroid Build Coastguard Worker       }
7126*4bdc9457SAndroid Build Coastguard Worker     }
7127*4bdc9457SAndroid Build Coastguard Worker   }
7128*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,n_gt_4_small_kernel)7129*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, n_gt_4_small_kernel) {
7130*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 5; n < 8; n++) {
7131*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
7132*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
7133*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
7134*4bdc9457SAndroid Build Coastguard Worker           .nr(4)
7135*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
7136*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
7137*4bdc9457SAndroid Build Coastguard Worker           .m(1)
7138*4bdc9457SAndroid Build Coastguard Worker           .n(n)
7139*4bdc9457SAndroid Build Coastguard Worker           .k(k)
7140*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
7141*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
7142*4bdc9457SAndroid Build Coastguard Worker       }
7143*4bdc9457SAndroid Build Coastguard Worker     }
7144*4bdc9457SAndroid Build Coastguard Worker   }
7145*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,n_div_4_small_kernel)7146*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, n_div_4_small_kernel) {
7147*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 8; n <= 12; n += 4) {
7148*4bdc9457SAndroid Build Coastguard Worker       for (size_t k = 1; k <= 5; k += 2) {
7149*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
7150*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
7151*4bdc9457SAndroid Build Coastguard Worker           .nr(4)
7152*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
7153*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
7154*4bdc9457SAndroid Build Coastguard Worker           .m(1)
7155*4bdc9457SAndroid Build Coastguard Worker           .n(n)
7156*4bdc9457SAndroid Build Coastguard Worker           .k(k)
7157*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
7158*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
7159*4bdc9457SAndroid Build Coastguard Worker       }
7160*4bdc9457SAndroid Build Coastguard Worker     }
7161*4bdc9457SAndroid Build Coastguard Worker   }
7162*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,strided_cm_subtile)7163*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, strided_cm_subtile) {
7164*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
7165*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t n = 1; n <= 4; n++) {
7166*4bdc9457SAndroid Build Coastguard Worker         for (uint32_t m = 1; m <= 1; m++) {
7167*4bdc9457SAndroid Build Coastguard Worker           GemmMicrokernelTester()
7168*4bdc9457SAndroid Build Coastguard Worker             .mr(1)
7169*4bdc9457SAndroid Build Coastguard Worker             .nr(4)
7170*4bdc9457SAndroid Build Coastguard Worker             .kr(1)
7171*4bdc9457SAndroid Build Coastguard Worker             .sr(1)
7172*4bdc9457SAndroid Build Coastguard Worker             .m(m)
7173*4bdc9457SAndroid Build Coastguard Worker             .n(n)
7174*4bdc9457SAndroid Build Coastguard Worker             .k(k)
7175*4bdc9457SAndroid Build Coastguard Worker             .cm_stride(7)
7176*4bdc9457SAndroid Build Coastguard Worker             .iterations(1)
7177*4bdc9457SAndroid Build Coastguard Worker             .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
7178*4bdc9457SAndroid Build Coastguard Worker         }
7179*4bdc9457SAndroid Build Coastguard Worker       }
7180*4bdc9457SAndroid Build Coastguard Worker     }
7181*4bdc9457SAndroid Build Coastguard Worker   }
7182*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,a_offset)7183*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, a_offset) {
7184*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
7185*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
7186*4bdc9457SAndroid Build Coastguard Worker         .mr(1)
7187*4bdc9457SAndroid Build Coastguard Worker         .nr(4)
7188*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
7189*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
7190*4bdc9457SAndroid Build Coastguard Worker         .m(1)
7191*4bdc9457SAndroid Build Coastguard Worker         .n(4)
7192*4bdc9457SAndroid Build Coastguard Worker         .k(k)
7193*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
7194*4bdc9457SAndroid Build Coastguard Worker         .a_offset(7)
7195*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
7196*4bdc9457SAndroid Build Coastguard Worker     }
7197*4bdc9457SAndroid Build Coastguard Worker   }
7198*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,zero)7199*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, zero) {
7200*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
7201*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t mz = 0; mz < 1; mz++) {
7202*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
7203*4bdc9457SAndroid Build Coastguard Worker           .mr(1)
7204*4bdc9457SAndroid Build Coastguard Worker           .nr(4)
7205*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
7206*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
7207*4bdc9457SAndroid Build Coastguard Worker           .m(1)
7208*4bdc9457SAndroid Build Coastguard Worker           .n(4)
7209*4bdc9457SAndroid Build Coastguard Worker           .k(k)
7210*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
7211*4bdc9457SAndroid Build Coastguard Worker           .a_offset(7)
7212*4bdc9457SAndroid Build Coastguard Worker           .zero_index(mz)
7213*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
7214*4bdc9457SAndroid Build Coastguard Worker       }
7215*4bdc9457SAndroid Build Coastguard Worker     }
7216*4bdc9457SAndroid Build Coastguard Worker   }
7217*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_1X4__WASM,strided_cm)7218*4bdc9457SAndroid Build Coastguard Worker   TEST(F32_IGEMM_RELU_1X4__WASM, strided_cm) {
7219*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
7220*4bdc9457SAndroid Build Coastguard Worker       .mr(1)
7221*4bdc9457SAndroid Build Coastguard Worker       .nr(4)
7222*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
7223*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
7224*4bdc9457SAndroid Build Coastguard Worker       .m(1)
7225*4bdc9457SAndroid Build Coastguard Worker       .n(4)
7226*4bdc9457SAndroid Build Coastguard Worker       .k(1)
7227*4bdc9457SAndroid Build Coastguard Worker       .cm_stride(7)
7228*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_1x4__wasm);
7229*4bdc9457SAndroid Build Coastguard Worker   }
7230*4bdc9457SAndroid Build Coastguard Worker #endif  // XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
7231*4bdc9457SAndroid Build Coastguard Worker 
7232*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,k_eq_1)7233*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, k_eq_1) {
7234*4bdc9457SAndroid Build Coastguard Worker   GemmMicrokernelTester()
7235*4bdc9457SAndroid Build Coastguard Worker     .mr(2)
7236*4bdc9457SAndroid Build Coastguard Worker     .nr(4)
7237*4bdc9457SAndroid Build Coastguard Worker     .kr(1)
7238*4bdc9457SAndroid Build Coastguard Worker     .sr(1)
7239*4bdc9457SAndroid Build Coastguard Worker     .m(2)
7240*4bdc9457SAndroid Build Coastguard Worker     .n(4)
7241*4bdc9457SAndroid Build Coastguard Worker     .k(1)
7242*4bdc9457SAndroid Build Coastguard Worker     .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7243*4bdc9457SAndroid Build Coastguard Worker }
7244*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,strided_cn)7245*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, strided_cn) {
7246*4bdc9457SAndroid Build Coastguard Worker   GemmMicrokernelTester()
7247*4bdc9457SAndroid Build Coastguard Worker     .mr(2)
7248*4bdc9457SAndroid Build Coastguard Worker     .nr(4)
7249*4bdc9457SAndroid Build Coastguard Worker     .kr(1)
7250*4bdc9457SAndroid Build Coastguard Worker     .sr(1)
7251*4bdc9457SAndroid Build Coastguard Worker     .m(2)
7252*4bdc9457SAndroid Build Coastguard Worker     .n(4)
7253*4bdc9457SAndroid Build Coastguard Worker     .k(1)
7254*4bdc9457SAndroid Build Coastguard Worker     .cn_stride(7)
7255*4bdc9457SAndroid Build Coastguard Worker     .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7256*4bdc9457SAndroid Build Coastguard Worker }
7257*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,k_eq_1_subtile)7258*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, k_eq_1_subtile) {
7259*4bdc9457SAndroid Build Coastguard Worker   for (uint32_t n = 1; n <= 4; n++) {
7260*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t m = 1; m <= 2; m++) {
7261*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
7262*4bdc9457SAndroid Build Coastguard Worker         .mr(2)
7263*4bdc9457SAndroid Build Coastguard Worker         .nr(4)
7264*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
7265*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
7266*4bdc9457SAndroid Build Coastguard Worker         .m(m)
7267*4bdc9457SAndroid Build Coastguard Worker         .n(n)
7268*4bdc9457SAndroid Build Coastguard Worker         .k(1)
7269*4bdc9457SAndroid Build Coastguard Worker         .iterations(1)
7270*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7271*4bdc9457SAndroid Build Coastguard Worker     }
7272*4bdc9457SAndroid Build Coastguard Worker   }
7273*4bdc9457SAndroid Build Coastguard Worker }
7274*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,k_eq_1_subtile_m)7275*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, k_eq_1_subtile_m) {
7276*4bdc9457SAndroid Build Coastguard Worker   for (uint32_t m = 1; m <= 2; m++) {
7277*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
7278*4bdc9457SAndroid Build Coastguard Worker       .mr(2)
7279*4bdc9457SAndroid Build Coastguard Worker       .nr(4)
7280*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
7281*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
7282*4bdc9457SAndroid Build Coastguard Worker       .m(m)
7283*4bdc9457SAndroid Build Coastguard Worker       .n(4)
7284*4bdc9457SAndroid Build Coastguard Worker       .k(1)
7285*4bdc9457SAndroid Build Coastguard Worker       .iterations(1)
7286*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7287*4bdc9457SAndroid Build Coastguard Worker   }
7288*4bdc9457SAndroid Build Coastguard Worker }
7289*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,k_eq_1_subtile_n)7290*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, k_eq_1_subtile_n) {
7291*4bdc9457SAndroid Build Coastguard Worker   for (uint32_t n = 1; n <= 4; n++) {
7292*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
7293*4bdc9457SAndroid Build Coastguard Worker       .mr(2)
7294*4bdc9457SAndroid Build Coastguard Worker       .nr(4)
7295*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
7296*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
7297*4bdc9457SAndroid Build Coastguard Worker       .m(2)
7298*4bdc9457SAndroid Build Coastguard Worker       .n(n)
7299*4bdc9457SAndroid Build Coastguard Worker       .k(1)
7300*4bdc9457SAndroid Build Coastguard Worker       .iterations(1)
7301*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7302*4bdc9457SAndroid Build Coastguard Worker   }
7303*4bdc9457SAndroid Build Coastguard Worker }
7304*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,k_gt_1)7305*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, k_gt_1) {
7306*4bdc9457SAndroid Build Coastguard Worker   for (size_t k = 2; k < 10; k++) {
7307*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
7308*4bdc9457SAndroid Build Coastguard Worker       .mr(2)
7309*4bdc9457SAndroid Build Coastguard Worker       .nr(4)
7310*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
7311*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
7312*4bdc9457SAndroid Build Coastguard Worker       .m(2)
7313*4bdc9457SAndroid Build Coastguard Worker       .n(4)
7314*4bdc9457SAndroid Build Coastguard Worker       .k(k)
7315*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7316*4bdc9457SAndroid Build Coastguard Worker   }
7317*4bdc9457SAndroid Build Coastguard Worker }
7318*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,k_gt_1_subtile)7319*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, k_gt_1_subtile) {
7320*4bdc9457SAndroid Build Coastguard Worker   for (size_t k = 2; k < 10; k++) {
7321*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 4; n++) {
7322*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 2; m++) {
7323*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
7324*4bdc9457SAndroid Build Coastguard Worker           .mr(2)
7325*4bdc9457SAndroid Build Coastguard Worker           .nr(4)
7326*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
7327*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
7328*4bdc9457SAndroid Build Coastguard Worker           .m(m)
7329*4bdc9457SAndroid Build Coastguard Worker           .n(n)
7330*4bdc9457SAndroid Build Coastguard Worker           .k(k)
7331*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
7332*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7333*4bdc9457SAndroid Build Coastguard Worker       }
7334*4bdc9457SAndroid Build Coastguard Worker     }
7335*4bdc9457SAndroid Build Coastguard Worker   }
7336*4bdc9457SAndroid Build Coastguard Worker }
7337*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,n_gt_4)7338*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, n_gt_4) {
7339*4bdc9457SAndroid Build Coastguard Worker   for (uint32_t n = 5; n < 8; n++) {
7340*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
7341*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
7342*4bdc9457SAndroid Build Coastguard Worker         .mr(2)
7343*4bdc9457SAndroid Build Coastguard Worker         .nr(4)
7344*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
7345*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
7346*4bdc9457SAndroid Build Coastguard Worker         .m(2)
7347*4bdc9457SAndroid Build Coastguard Worker         .n(n)
7348*4bdc9457SAndroid Build Coastguard Worker         .k(k)
7349*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7350*4bdc9457SAndroid Build Coastguard Worker     }
7351*4bdc9457SAndroid Build Coastguard Worker   }
7352*4bdc9457SAndroid Build Coastguard Worker }
7353*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,n_gt_4_strided_cn)7354*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, n_gt_4_strided_cn) {
7355*4bdc9457SAndroid Build Coastguard Worker   for (uint32_t n = 5; n < 8; n++) {
7356*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
7357*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
7358*4bdc9457SAndroid Build Coastguard Worker         .mr(2)
7359*4bdc9457SAndroid Build Coastguard Worker         .nr(4)
7360*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
7361*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
7362*4bdc9457SAndroid Build Coastguard Worker         .m(2)
7363*4bdc9457SAndroid Build Coastguard Worker         .n(n)
7364*4bdc9457SAndroid Build Coastguard Worker         .k(k)
7365*4bdc9457SAndroid Build Coastguard Worker         .cn_stride(7)
7366*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7367*4bdc9457SAndroid Build Coastguard Worker     }
7368*4bdc9457SAndroid Build Coastguard Worker   }
7369*4bdc9457SAndroid Build Coastguard Worker }
7370*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,n_gt_4_subtile)7371*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, n_gt_4_subtile) {
7372*4bdc9457SAndroid Build Coastguard Worker   for (uint32_t n = 5; n < 8; n++) {
7373*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
7374*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 2; m++) {
7375*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
7376*4bdc9457SAndroid Build Coastguard Worker           .mr(2)
7377*4bdc9457SAndroid Build Coastguard Worker           .nr(4)
7378*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
7379*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
7380*4bdc9457SAndroid Build Coastguard Worker           .m(m)
7381*4bdc9457SAndroid Build Coastguard Worker           .n(n)
7382*4bdc9457SAndroid Build Coastguard Worker           .k(k)
7383*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
7384*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7385*4bdc9457SAndroid Build Coastguard Worker       }
7386*4bdc9457SAndroid Build Coastguard Worker     }
7387*4bdc9457SAndroid Build Coastguard Worker   }
7388*4bdc9457SAndroid Build Coastguard Worker }
7389*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,n_div_4)7390*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, n_div_4) {
7391*4bdc9457SAndroid Build Coastguard Worker   for (uint32_t n = 8; n <= 12; n += 4) {
7392*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
7393*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
7394*4bdc9457SAndroid Build Coastguard Worker         .mr(2)
7395*4bdc9457SAndroid Build Coastguard Worker         .nr(4)
7396*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
7397*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
7398*4bdc9457SAndroid Build Coastguard Worker         .m(2)
7399*4bdc9457SAndroid Build Coastguard Worker         .n(n)
7400*4bdc9457SAndroid Build Coastguard Worker         .k(k)
7401*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7402*4bdc9457SAndroid Build Coastguard Worker     }
7403*4bdc9457SAndroid Build Coastguard Worker   }
7404*4bdc9457SAndroid Build Coastguard Worker }
7405*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,n_div_4_strided_cn)7406*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, n_div_4_strided_cn) {
7407*4bdc9457SAndroid Build Coastguard Worker   for (uint32_t n = 8; n <= 12; n += 4) {
7408*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
7409*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
7410*4bdc9457SAndroid Build Coastguard Worker         .mr(2)
7411*4bdc9457SAndroid Build Coastguard Worker         .nr(4)
7412*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
7413*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
7414*4bdc9457SAndroid Build Coastguard Worker         .m(2)
7415*4bdc9457SAndroid Build Coastguard Worker         .n(n)
7416*4bdc9457SAndroid Build Coastguard Worker         .k(k)
7417*4bdc9457SAndroid Build Coastguard Worker         .cn_stride(7)
7418*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7419*4bdc9457SAndroid Build Coastguard Worker     }
7420*4bdc9457SAndroid Build Coastguard Worker   }
7421*4bdc9457SAndroid Build Coastguard Worker }
7422*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,n_div_4_subtile)7423*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, n_div_4_subtile) {
7424*4bdc9457SAndroid Build Coastguard Worker   for (uint32_t n = 8; n <= 12; n += 4) {
7425*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
7426*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 2; m++) {
7427*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
7428*4bdc9457SAndroid Build Coastguard Worker           .mr(2)
7429*4bdc9457SAndroid Build Coastguard Worker           .nr(4)
7430*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
7431*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
7432*4bdc9457SAndroid Build Coastguard Worker           .m(m)
7433*4bdc9457SAndroid Build Coastguard Worker           .n(n)
7434*4bdc9457SAndroid Build Coastguard Worker           .k(k)
7435*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
7436*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7437*4bdc9457SAndroid Build Coastguard Worker       }
7438*4bdc9457SAndroid Build Coastguard Worker     }
7439*4bdc9457SAndroid Build Coastguard Worker   }
7440*4bdc9457SAndroid Build Coastguard Worker }
7441*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,small_kernel)7442*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, small_kernel) {
7443*4bdc9457SAndroid Build Coastguard Worker   for (size_t k = 1; k <= 5; k += 2) {
7444*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
7445*4bdc9457SAndroid Build Coastguard Worker       .mr(2)
7446*4bdc9457SAndroid Build Coastguard Worker       .nr(4)
7447*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
7448*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
7449*4bdc9457SAndroid Build Coastguard Worker       .m(2)
7450*4bdc9457SAndroid Build Coastguard Worker       .n(4)
7451*4bdc9457SAndroid Build Coastguard Worker       .k(k)
7452*4bdc9457SAndroid Build Coastguard Worker       .ks(3)
7453*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7454*4bdc9457SAndroid Build Coastguard Worker   }
7455*4bdc9457SAndroid Build Coastguard Worker }
7456*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,small_kernel_subtile)7457*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, small_kernel_subtile) {
7458*4bdc9457SAndroid Build Coastguard Worker   for (size_t k = 1; k <= 5; k += 2) {
7459*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 4; n++) {
7460*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 2; m++) {
7461*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
7462*4bdc9457SAndroid Build Coastguard Worker           .mr(2)
7463*4bdc9457SAndroid Build Coastguard Worker           .nr(4)
7464*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
7465*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
7466*4bdc9457SAndroid Build Coastguard Worker           .m(m)
7467*4bdc9457SAndroid Build Coastguard Worker           .n(n)
7468*4bdc9457SAndroid Build Coastguard Worker           .k(k)
7469*4bdc9457SAndroid Build Coastguard Worker           .ks(3)
7470*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
7471*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7472*4bdc9457SAndroid Build Coastguard Worker       }
7473*4bdc9457SAndroid Build Coastguard Worker     }
7474*4bdc9457SAndroid Build Coastguard Worker   }
7475*4bdc9457SAndroid Build Coastguard Worker }
7476*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,n_gt_4_small_kernel)7477*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, n_gt_4_small_kernel) {
7478*4bdc9457SAndroid Build Coastguard Worker   for (uint32_t n = 5; n < 8; n++) {
7479*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
7480*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
7481*4bdc9457SAndroid Build Coastguard Worker         .mr(2)
7482*4bdc9457SAndroid Build Coastguard Worker         .nr(4)
7483*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
7484*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
7485*4bdc9457SAndroid Build Coastguard Worker         .m(2)
7486*4bdc9457SAndroid Build Coastguard Worker         .n(n)
7487*4bdc9457SAndroid Build Coastguard Worker         .k(k)
7488*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
7489*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7490*4bdc9457SAndroid Build Coastguard Worker     }
7491*4bdc9457SAndroid Build Coastguard Worker   }
7492*4bdc9457SAndroid Build Coastguard Worker }
7493*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,n_div_4_small_kernel)7494*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, n_div_4_small_kernel) {
7495*4bdc9457SAndroid Build Coastguard Worker   for (uint32_t n = 8; n <= 12; n += 4) {
7496*4bdc9457SAndroid Build Coastguard Worker     for (size_t k = 1; k <= 5; k += 2) {
7497*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
7498*4bdc9457SAndroid Build Coastguard Worker         .mr(2)
7499*4bdc9457SAndroid Build Coastguard Worker         .nr(4)
7500*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
7501*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
7502*4bdc9457SAndroid Build Coastguard Worker         .m(2)
7503*4bdc9457SAndroid Build Coastguard Worker         .n(n)
7504*4bdc9457SAndroid Build Coastguard Worker         .k(k)
7505*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
7506*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7507*4bdc9457SAndroid Build Coastguard Worker     }
7508*4bdc9457SAndroid Build Coastguard Worker   }
7509*4bdc9457SAndroid Build Coastguard Worker }
7510*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,strided_cm_subtile)7511*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, strided_cm_subtile) {
7512*4bdc9457SAndroid Build Coastguard Worker   for (size_t k = 1; k <= 5; k += 2) {
7513*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t n = 1; n <= 4; n++) {
7514*4bdc9457SAndroid Build Coastguard Worker       for (uint32_t m = 1; m <= 2; m++) {
7515*4bdc9457SAndroid Build Coastguard Worker         GemmMicrokernelTester()
7516*4bdc9457SAndroid Build Coastguard Worker           .mr(2)
7517*4bdc9457SAndroid Build Coastguard Worker           .nr(4)
7518*4bdc9457SAndroid Build Coastguard Worker           .kr(1)
7519*4bdc9457SAndroid Build Coastguard Worker           .sr(1)
7520*4bdc9457SAndroid Build Coastguard Worker           .m(m)
7521*4bdc9457SAndroid Build Coastguard Worker           .n(n)
7522*4bdc9457SAndroid Build Coastguard Worker           .k(k)
7523*4bdc9457SAndroid Build Coastguard Worker           .cm_stride(7)
7524*4bdc9457SAndroid Build Coastguard Worker           .iterations(1)
7525*4bdc9457SAndroid Build Coastguard Worker           .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7526*4bdc9457SAndroid Build Coastguard Worker       }
7527*4bdc9457SAndroid Build Coastguard Worker     }
7528*4bdc9457SAndroid Build Coastguard Worker   }
7529*4bdc9457SAndroid Build Coastguard Worker }
7530*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,a_offset)7531*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, a_offset) {
7532*4bdc9457SAndroid Build Coastguard Worker   for (size_t k = 1; k <= 5; k += 2) {
7533*4bdc9457SAndroid Build Coastguard Worker     GemmMicrokernelTester()
7534*4bdc9457SAndroid Build Coastguard Worker       .mr(2)
7535*4bdc9457SAndroid Build Coastguard Worker       .nr(4)
7536*4bdc9457SAndroid Build Coastguard Worker       .kr(1)
7537*4bdc9457SAndroid Build Coastguard Worker       .sr(1)
7538*4bdc9457SAndroid Build Coastguard Worker       .m(2)
7539*4bdc9457SAndroid Build Coastguard Worker       .n(4)
7540*4bdc9457SAndroid Build Coastguard Worker       .k(k)
7541*4bdc9457SAndroid Build Coastguard Worker       .ks(3)
7542*4bdc9457SAndroid Build Coastguard Worker       .a_offset(13)
7543*4bdc9457SAndroid Build Coastguard Worker       .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7544*4bdc9457SAndroid Build Coastguard Worker   }
7545*4bdc9457SAndroid Build Coastguard Worker }
7546*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,zero)7547*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, zero) {
7548*4bdc9457SAndroid Build Coastguard Worker   for (size_t k = 1; k <= 5; k += 2) {
7549*4bdc9457SAndroid Build Coastguard Worker     for (uint32_t mz = 0; mz < 2; mz++) {
7550*4bdc9457SAndroid Build Coastguard Worker       GemmMicrokernelTester()
7551*4bdc9457SAndroid Build Coastguard Worker         .mr(2)
7552*4bdc9457SAndroid Build Coastguard Worker         .nr(4)
7553*4bdc9457SAndroid Build Coastguard Worker         .kr(1)
7554*4bdc9457SAndroid Build Coastguard Worker         .sr(1)
7555*4bdc9457SAndroid Build Coastguard Worker         .m(2)
7556*4bdc9457SAndroid Build Coastguard Worker         .n(4)
7557*4bdc9457SAndroid Build Coastguard Worker         .k(k)
7558*4bdc9457SAndroid Build Coastguard Worker         .ks(3)
7559*4bdc9457SAndroid Build Coastguard Worker         .a_offset(13)
7560*4bdc9457SAndroid Build Coastguard Worker         .zero_index(mz)
7561*4bdc9457SAndroid Build Coastguard Worker         .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7562*4bdc9457SAndroid Build Coastguard Worker     }
7563*4bdc9457SAndroid Build Coastguard Worker   }
7564*4bdc9457SAndroid Build Coastguard Worker }
7565*4bdc9457SAndroid Build Coastguard Worker 
TEST(F32_IGEMM_RELU_2X4__SCALAR,strided_cm)7566*4bdc9457SAndroid Build Coastguard Worker TEST(F32_IGEMM_RELU_2X4__SCALAR, strided_cm) {
7567*4bdc9457SAndroid Build Coastguard Worker   GemmMicrokernelTester()
7568*4bdc9457SAndroid Build Coastguard Worker     .mr(2)
7569*4bdc9457SAndroid Build Coastguard Worker     .nr(4)
7570*4bdc9457SAndroid Build Coastguard Worker     .kr(1)
7571*4bdc9457SAndroid Build Coastguard Worker     .sr(1)
7572*4bdc9457SAndroid Build Coastguard Worker     .m(2)
7573*4bdc9457SAndroid Build Coastguard Worker     .n(4)
7574*4bdc9457SAndroid Build Coastguard Worker     .k(1)
7575*4bdc9457SAndroid Build Coastguard Worker     .cm_stride(7)
7576*4bdc9457SAndroid Build Coastguard Worker     .Test(xnn_f32_igemm_relu_ukernel_2x4__scalar);
7577*4bdc9457SAndroid Build Coastguard Worker }
7578