// Copyright (c) Facebook, Inc. and its affiliates.
// All rights reserved.
//
// Copyright 2019 Google LLC
//
// This source code is licensed under the BSD-style license found in the
// LICENSE file in the root directory of this source tree.
//
// Auto-generated file. Do not edit!
// Specification: test/f32-igemm-relu.yaml
// Generator: tools/generate-gemm-test.py
12*4bdc9457SAndroid Build Coastguard Worker
13*4bdc9457SAndroid Build Coastguard Worker
14*4bdc9457SAndroid Build Coastguard Worker #include <gtest/gtest.h>
15*4bdc9457SAndroid Build Coastguard Worker
16*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/allocator.h>
17*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/common.h>
18*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/isa-checks.h>
19*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/microparams-init.h>
20*4bdc9457SAndroid Build Coastguard Worker
21*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/gemm.h>
22*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/igemm.h>
23*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/ppmm.h>
24*4bdc9457SAndroid Build Coastguard Worker #include "gemm-microkernel-tester.h"
25*4bdc9457SAndroid Build Coastguard Worker
26*4bdc9457SAndroid Build Coastguard Worker
27*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Runs xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat once with m=1, n=8, k=1.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, k_eq_1) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(1)
    .n(8)
    .k(1)
    .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
}
39*4bdc9457SAndroid Build Coastguard Worker
// Same m=1, n=8, k=1 configuration as the basic case, but with cn_stride set to 11.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(1)
    .n(8)
    .k(1)
    .cn_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
}
52*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 1..8 and m over 1..1 with k=1, one iteration per configuration.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 1; m++) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(1)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
    }
  }
}
69*4bdc9457SAndroid Build Coastguard Worker
// Sweeps m over 1..1 with n=8 and k=1, one iteration per configuration.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_m) {
  for (uint32_t m = 1; m <= 1; m++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(m)
      .n(8)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
  }
}
84*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 1..8 with m=1 and k=1, one iteration per configuration.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(n)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
  }
}
99*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 2..9 with the full m=1, n=8 tile.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, k_gt_1) {
  for (size_t k = 2; k < 10; k++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(8)
      .k(k)
      .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
  }
}
113*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 2..9, n over 1..8 and m over 1..1, one iteration per configuration.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, k_gt_1_subtile) {
  for (size_t k = 2; k < 10; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
      }
    }
  }
}
132*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15 (larger than nr=8) and k over {1, 3, 5} with m=1.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
    }
  }
}
148*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15 and k over {1, 3, 5} with m=1 and cn_stride set to 11.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
    }
  }
}
165*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15, k over {1, 3, 5} and m over 1..1, one iteration per configuration.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
      }
    }
  }
}
184*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over {16, 24} (multiples of nr=8) and k over {1, 3, 5} with m=1.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
    }
  }
}
200*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over {16, 24} and k over {1, 3, 5} with m=1 and cn_stride set to 11.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
    }
  }
}
217*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over {16, 24}, k over {1, 3, 5} and m over 1..1, one iteration per configuration.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
      }
    }
  }
}
236*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over {1, 3, 5} with m=1, n=8 and ks set to 3.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, small_kernel) {
  for (size_t k = 1; k <= 5; k += 2) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(8)
      .k(k)
      .ks(3)
      .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
  }
}
251*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over {1, 3, 5}, n over 1..8 and m over 1..1 with ks set to 3,
// one iteration per configuration.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, small_kernel_subtile) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .ks(3)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
      }
    }
  }
}
271*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15 and k over {1, 3, 5} with m=1 and ks set to 3.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, n_gt_8_small_kernel) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
    }
  }
}
288*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over {16, 24} and k over {1, 3, 5} with m=1 and ks set to 3.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, n_div_8_small_kernel) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
    }
  }
}
305*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over {1, 3, 5}, n over 1..8 and m over 1..1 with cm_stride set to 11,
// one iteration per configuration.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, strided_cm_subtile) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
      }
    }
  }
}
325*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over {1, 3, 5} with m=1, n=8, ks set to 3 and a_offset set to 7.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, a_offset) {
  for (size_t k = 1; k <= 5; k += 2) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(8)
      .k(k)
      .ks(3)
      .a_offset(7)
      .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
  }
}
341*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over {1, 3, 5} and zero_index over 0..0 (one value per row of the mr=1 tile)
// with ks set to 3 and a_offset set to 7.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, zero) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t mz = 0; mz < 1; mz++) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(8)
        .k(k)
        .ks(3)
        .a_offset(7)
        .zero_index(mz)
        .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
    }
  }
}
360*4bdc9457SAndroid Build Coastguard Worker
// Runs the m=1, n=8, k=1 configuration with cm_stride set to 11.
TEST(F32_IGEMM_RELU_1X8__WASMSIMD_LOADSPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(1)
    .n(8)
    .k(1)
    .cm_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat);
}
373*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
374*4bdc9457SAndroid Build Coastguard Worker
375*4bdc9457SAndroid Build Coastguard Worker
376*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Runs xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat once with m=3, n=8, k=4.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, k_eq_4) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(3)
    .n(8)
    .k(4)
    .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
}
388*4bdc9457SAndroid Build Coastguard Worker
// Same m=3, n=8, k=4 configuration as the basic case, but with cn_stride set to 11.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(3)
    .n(8)
    .k(4)
    .cn_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
}
401*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 1..8 and m over 1..3 with k=4, one iteration per configuration.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, k_eq_4_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 3; m++) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(4)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
    }
  }
}
418*4bdc9457SAndroid Build Coastguard Worker
// Sweeps m over 1..3 with n=8 and k=4, one iteration per configuration.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, k_eq_4_subtile_m) {
  for (uint32_t m = 1; m <= 3; m++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(m)
      .n(8)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
  }
}
433*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 1..8 with m=3 and k=4, one iteration per configuration.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, k_eq_4_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(3)
      .n(n)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
  }
}
448*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 1..3 with the full m=3, n=8 tile.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, k_lt_4) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(3)
      .n(8)
      .k(k)
      .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
  }
}
462*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 1..3, n over 1..8 and m over 1..3, one iteration per configuration.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, k_lt_4_subtile) {
  for (size_t k = 1; k < 4; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
      }
    }
  }
}
481*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 5..7 with the full m=3, n=8 tile.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, k_gt_4) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(3)
      .n(8)
      .k(k)
      .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
  }
}
495*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel for k = 5..7,
// sweeping n = 1..8 and m = 1..3, with a single iteration per combination.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, k_gt_4_subtile) {
  for (size_t cur_k = 5; cur_k < 8; ++cur_k) {
    for (uint32_t cur_n = 1; cur_n <= 8; ++cur_n) {
      for (uint32_t cur_m = 1; cur_m <= 3; ++cur_m) {
        GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(cur_m).n(cur_n).k(cur_k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
      }
    }
  }
}
514*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel with m = 3, n = 8
// for k = 8, 12, ..., 40 (step of 4).
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, k_div_4) {
  for (size_t cur_k = 8; cur_k <= 40; cur_k += 4) {
    GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(1)
      .m(3).n(8).k(cur_k)
      .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
  }
}
528*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel for k = 8, 12, ..., 40,
// sweeping n = 1..8 and m = 1..3, with a single iteration per combination.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, k_div_4_subtile) {
  for (size_t cur_k = 8; cur_k <= 40; cur_k += 4) {
    for (uint32_t cur_n = 1; cur_n <= 8; ++cur_n) {
      for (uint32_t cur_m = 1; cur_m <= 3; ++cur_m) {
        GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(cur_m).n(cur_n).k(cur_k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
      }
    }
  }
}
547*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel with m = 3 for
// n = 9..15 and k = 1, 6, 11, 16 (step of 5 up to 20).
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, n_gt_8) {
  for (uint32_t cur_n = 9; cur_n < 16; ++cur_n) {
    for (size_t cur_k = 1; cur_k <= 20; cur_k += 5) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(cur_n).k(cur_k)
        .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
    }
  }
}
563*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel with m = 3 and
// cn_stride = 11 for n = 9..15 and k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, n_gt_8_strided_cn) {
  for (uint32_t cur_n = 9; cur_n < 16; ++cur_n) {
    for (size_t cur_k = 1; cur_k <= 20; cur_k += 5) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(cur_n).k(cur_k)
        .cn_stride(11)
        .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
    }
  }
}
580*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel for n = 9..15,
// k = 1, 6, 11, 16 and m = 1..3, with a single iteration per combination.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, n_gt_8_subtile) {
  for (uint32_t cur_n = 9; cur_n < 16; ++cur_n) {
    for (size_t cur_k = 1; cur_k <= 20; cur_k += 5) {
      for (uint32_t cur_m = 1; cur_m <= 3; ++cur_m) {
        GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(cur_m).n(cur_n).k(cur_k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
      }
    }
  }
}
599*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel with m = 3 for
// n = 16 and 24 (step of 8) and k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, n_div_8) {
  for (uint32_t cur_n = 16; cur_n <= 24; cur_n += 8) {
    for (size_t cur_k = 1; cur_k <= 20; cur_k += 5) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(cur_n).k(cur_k)
        .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
    }
  }
}
615*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel with m = 3 and
// cn_stride = 11 for n = 16 and 24 and k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, n_div_8_strided_cn) {
  for (uint32_t cur_n = 16; cur_n <= 24; cur_n += 8) {
    for (size_t cur_k = 1; cur_k <= 20; cur_k += 5) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(cur_n).k(cur_k)
        .cn_stride(11)
        .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
    }
  }
}
632*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel for n = 16 and 24,
// k = 1, 6, 11, 16 and m = 1..3, with a single iteration per combination.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, n_div_8_subtile) {
  for (uint32_t cur_n = 16; cur_n <= 24; cur_n += 8) {
    for (size_t cur_k = 1; cur_k <= 20; cur_k += 5) {
      for (uint32_t cur_m = 1; cur_m <= 3; ++cur_m) {
        GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(cur_m).n(cur_n).k(cur_k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
      }
    }
  }
}
651*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel with m = 3, n = 8
// and ks = 3 for k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, small_kernel) {
  for (size_t cur_k = 1; cur_k <= 20; cur_k += 5) {
    GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(1)
      .m(3).n(8).k(cur_k)
      .ks(3)
      .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
  }
}
666*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel with ks = 3 for
// k = 1, 6, 11, 16, n = 1..8 and m = 1..3, one iteration per combination.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, small_kernel_subtile) {
  for (size_t cur_k = 1; cur_k <= 20; cur_k += 5) {
    for (uint32_t cur_n = 1; cur_n <= 8; ++cur_n) {
      for (uint32_t cur_m = 1; cur_m <= 3; ++cur_m) {
        GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(cur_m).n(cur_n).k(cur_k)
          .ks(3)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
      }
    }
  }
}
686*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel with m = 3 and
// ks = 3 for n = 9..15 and k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, n_gt_8_small_kernel) {
  for (uint32_t cur_n = 9; cur_n < 16; ++cur_n) {
    for (size_t cur_k = 1; cur_k <= 20; cur_k += 5) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(cur_n).k(cur_k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
    }
  }
}
703*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel with m = 3 and
// ks = 3 for n = 16 and 24 and k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, n_div_8_small_kernel) {
  for (uint32_t cur_n = 16; cur_n <= 24; cur_n += 8) {
    for (size_t cur_k = 1; cur_k <= 20; cur_k += 5) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(cur_n).k(cur_k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
    }
  }
}
720*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel with cm_stride = 11
// for k = 1, 6, 11, 16, n = 1..8 and m = 1..3, one iteration per combination.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, strided_cm_subtile) {
  for (size_t cur_k = 1; cur_k <= 20; cur_k += 5) {
    for (uint32_t cur_n = 1; cur_n <= 8; ++cur_n) {
      for (uint32_t cur_m = 1; cur_m <= 3; ++cur_m) {
        GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(cur_m).n(cur_n).k(cur_k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
      }
    }
  }
}
740*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel with m = 3, n = 8,
// ks = 3 and a_offset = 67 for k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, a_offset) {
  for (size_t cur_k = 1; cur_k <= 20; cur_k += 5) {
    GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(1)
      .m(3).n(8).k(cur_k)
      .ks(3)
      .a_offset(67)
      .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
  }
}
756*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel with m = 3, n = 8,
// ks = 3 and a_offset = 67 for k = 1, 6, 11, 16, passing each value
// 0..2 to zero_index() in turn.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, zero) {
  for (size_t cur_k = 1; cur_k <= 20; cur_k += 5) {
    for (uint32_t cur_mz = 0; cur_mz < 3; ++cur_mz) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(8).k(cur_k)
        .ks(3)
        .a_offset(67)
        .zero_index(cur_mz)
        .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
    }
  }
}
775*4bdc9457SAndroid Build Coastguard Worker
// Single run of the 3x8 wasmsimd "splat" IGEMM+ReLU microkernel with
// m = 3, n = 8, k = 4 and cm_stride = 11.
TEST(F32_IGEMM_RELU_3X8__WASMSIMD_SPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(3).nr(8).kr(1).sr(1)
    .m(3).n(8).k(4)
    .cm_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat);
}
788*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
789*4bdc9457SAndroid Build Coastguard Worker
790*4bdc9457SAndroid Build Coastguard Worker
791*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Single run of the 3x8s4 wasmsimd IGEMM+ReLU microkernel with
// m = 3, n = 8, k = 4.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, k_eq_4) {
  GemmMicrokernelTester()
    .mr(3).nr(8).kr(1).sr(4)
    .m(3).n(8).k(4)
    .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
}
803*4bdc9457SAndroid Build Coastguard Worker
// Single run of the 3x8s4 wasmsimd IGEMM+ReLU microkernel with
// m = 3, n = 8, k = 4 and cn_stride = 11.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, strided_cn) {
  GemmMicrokernelTester()
    .mr(3).nr(8).kr(1).sr(4)
    .m(3).n(8).k(4)
    .cn_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
}
816*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8s4 wasmsimd IGEMM+ReLU microkernel with k = 4 for
// n = 1..8 and m = 1..3, with a single iteration per combination.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, k_eq_4_subtile) {
  for (uint32_t cur_n = 1; cur_n <= 8; ++cur_n) {
    for (uint32_t cur_m = 1; cur_m <= 3; ++cur_m) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(4)
        .m(cur_m).n(cur_n).k(4)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
    }
  }
}
833*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8s4 wasmsimd IGEMM+ReLU microkernel with n = 8, k = 4 for
// m = 1..3, with a single iteration per value.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, k_eq_4_subtile_m) {
  for (uint32_t cur_m = 1; cur_m <= 3; ++cur_m) {
    GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(4)
      .m(cur_m).n(8).k(4)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
  }
}
848*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8s4 wasmsimd IGEMM+ReLU microkernel with m = 3, k = 4 for
// n = 1..8, with a single iteration per value.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, k_eq_4_subtile_n) {
  for (uint32_t cur_n = 1; cur_n <= 8; ++cur_n) {
    GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(4)
      .m(3).n(cur_n).k(4)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
  }
}
863*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8s4 wasmsimd IGEMM+ReLU microkernel with m = 3, n = 8
// for every k in 1..3.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, k_lt_4) {
  for (size_t cur_k = 1; cur_k < 4; ++cur_k) {
    GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(4)
      .m(3).n(8).k(cur_k)
      .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
  }
}
877*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8s4 wasmsimd IGEMM+ReLU microkernel for k = 1..3,
// sweeping n = 1..8 and m = 1..3, with a single iteration per combination.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, k_lt_4_subtile) {
  for (size_t cur_k = 1; cur_k < 4; ++cur_k) {
    for (uint32_t cur_n = 1; cur_n <= 8; ++cur_n) {
      for (uint32_t cur_m = 1; cur_m <= 3; ++cur_m) {
        GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(4)
          .m(cur_m).n(cur_n).k(cur_k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
      }
    }
  }
}
896*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8s4 wasmsimd IGEMM+ReLU microkernel with m = 3, n = 8
// for every k in 5..7.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, k_gt_4) {
  for (size_t cur_k = 5; cur_k < 8; ++cur_k) {
    GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(4)
      .m(3).n(8).k(cur_k)
      .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
  }
}
910*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8s4 wasmsimd IGEMM+ReLU microkernel for k = 5..7,
// sweeping n = 1..8 and m = 1..3, with a single iteration per combination.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, k_gt_4_subtile) {
  for (size_t cur_k = 5; cur_k < 8; ++cur_k) {
    for (uint32_t cur_n = 1; cur_n <= 8; ++cur_n) {
      for (uint32_t cur_m = 1; cur_m <= 3; ++cur_m) {
        GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(4)
          .m(cur_m).n(cur_n).k(cur_k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
      }
    }
  }
}
929*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8s4 wasmsimd IGEMM+ReLU microkernel with m = 3, n = 8
// for k = 8, 12, ..., 40 (step of 4).
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, k_div_4) {
  for (size_t cur_k = 8; cur_k <= 40; cur_k += 4) {
    GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(4)
      .m(3).n(8).k(cur_k)
      .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
  }
}
943*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8s4 wasmsimd IGEMM+ReLU microkernel for k = 8, 12, ..., 40,
// sweeping n = 1..8 and m = 1..3, with a single iteration per combination.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, k_div_4_subtile) {
  for (size_t cur_k = 8; cur_k <= 40; cur_k += 4) {
    for (uint32_t cur_n = 1; cur_n <= 8; ++cur_n) {
      for (uint32_t cur_m = 1; cur_m <= 3; ++cur_m) {
        GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(4)
          .m(cur_m).n(cur_n).k(cur_k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
      }
    }
  }
}
962*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8s4 wasmsimd IGEMM+ReLU microkernel with m = 3 for
// n = 9..15 and k = 1, 6, 11, 16 (step of 5 up to 20).
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, n_gt_8) {
  for (uint32_t cur_n = 9; cur_n < 16; ++cur_n) {
    for (size_t cur_k = 1; cur_k <= 20; cur_k += 5) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(4)
        .m(3).n(cur_n).k(cur_k)
        .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
    }
  }
}
978*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8s4 wasmsimd IGEMM+ReLU microkernel with m = 3 and
// cn_stride = 11 for n = 9..15 and k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, n_gt_8_strided_cn) {
  for (uint32_t cur_n = 9; cur_n < 16; ++cur_n) {
    for (size_t cur_k = 1; cur_k <= 20; cur_k += 5) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(4)
        .m(3).n(cur_n).k(cur_k)
        .cn_stride(11)
        .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
    }
  }
}
995*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 9..15, k in {1, 6, 11, 16} and every m in 1..3, one iteration per case.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
      }
    }
  }
}
1014*4bdc9457SAndroid Build Coastguard Worker
// Full m=3 row tile with n in {16, 24} (multiples of nr=8) and k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
    }
  }
}
1030*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (n in {16, 24}, k in {1, 6, 11, 16}, m=3) with cn_stride set to 11.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
    }
  }
}
1047*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in {16, 24}, k in {1, 6, 11, 16} and every m in 1..3, one iteration per case.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
      }
    }
  }
}
1066*4bdc9457SAndroid Build Coastguard Worker
// Full 3x8 tile with ks set to 3, for k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, small_kernel) {
  for (size_t k = 1; k <= 20; k += 5) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .ks(3)
      .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
  }
}
1081*4bdc9457SAndroid Build Coastguard Worker
// ks set to 3 across every m in 1..3 and n in 1..8, for k in {1, 6, 11, 16}; one iteration per case.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, small_kernel_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .ks(3)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
      }
    }
  }
}
1101*4bdc9457SAndroid Build Coastguard Worker
// ks set to 3 with m=3, n = 9..15 (above nr=8) and k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, n_gt_8_small_kernel) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
    }
  }
}
1118*4bdc9457SAndroid Build Coastguard Worker
// ks set to 3 with m=3, n in {16, 24} (multiples of nr=8) and k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, n_div_8_small_kernel) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
    }
  }
}
1135*4bdc9457SAndroid Build Coastguard Worker
// cm_stride set to 11 across every m in 1..3 and n in 1..8, for k in {1, 6, 11, 16}; one iteration per case.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, strided_cm_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
      }
    }
  }
}
1155*4bdc9457SAndroid Build Coastguard Worker
// Full 3x8 tile with ks set to 3 and a_offset set to 67, for k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, a_offset) {
  for (size_t k = 1; k <= 20; k += 5) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .ks(3)
      .a_offset(67)
      .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
  }
}
1171*4bdc9457SAndroid Build Coastguard Worker
// Same configuration as a_offset (ks=3, a_offset=67), additionally sweeping zero_index over 0..2.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, zero) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t mz = 0; mz < 3; mz++) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(8)
        .k(k)
        .ks(3)
        .a_offset(67)
        .zero_index(mz)
        .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
    }
  }
}
1190*4bdc9457SAndroid Build Coastguard Worker
// Single case: full 3x8 tile, k=4, with cm_stride set to 11.
TEST(F32_IGEMM_RELU_3X8S4__WASMSIMD, strided_cm) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(3)
    .n(8)
    .k(4)
    .cm_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmsimd);
}
1203*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
1204*4bdc9457SAndroid Build Coastguard Worker
1205*4bdc9457SAndroid Build Coastguard Worker
1206*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Single case: full 4x2 tile with k=4 (equal to kr).
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, k_eq_4) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(2)
    .kr(4)
    .sr(1)
    .m(4)
    .n(2)
    .k(4)
    .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
}
1218*4bdc9457SAndroid Build Coastguard Worker
// Single case: full 4x2 tile, k=4, with cn_stride set to 5.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, strided_cn) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(2)
    .kr(4)
    .sr(1)
    .m(4)
    .n(2)
    .k(4)
    .cn_stride(5)
    .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
}
1231*4bdc9457SAndroid Build Coastguard Worker
// k=4 across every m in 1..4 and n in 1..2, one iteration per case.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, k_eq_4_subtile) {
  for (uint32_t n = 1; n <= 2; n++) {
    for (uint32_t m = 1; m <= 4; m++) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(2)
        .kr(4)
        .sr(1)
        .m(m)
        .n(n)
        .k(4)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
    }
  }
}
1248*4bdc9457SAndroid Build Coastguard Worker
// k=4 and n=2 fixed, sweeping m over 1..4; one iteration per case.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, k_eq_4_subtile_m) {
  for (uint32_t m = 1; m <= 4; m++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(2)
      .kr(4)
      .sr(1)
      .m(m)
      .n(2)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
  }
}
1263*4bdc9457SAndroid Build Coastguard Worker
// k=4 and m=4 fixed, sweeping n over 1..2; one iteration per case.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, k_eq_4_subtile_n) {
  for (uint32_t n = 1; n <= 2; n++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(2)
      .kr(4)
      .sr(1)
      .m(4)
      .n(n)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
  }
}
1278*4bdc9457SAndroid Build Coastguard Worker
// Full 4x2 tile with k = 1..3 (below kr=4).
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, k_lt_4) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(2)
      .kr(4)
      .sr(1)
      .m(4)
      .n(2)
      .k(k)
      .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
  }
}
1292*4bdc9457SAndroid Build Coastguard Worker
// k = 1..3 across every m in 1..4 and n in 1..2, one iteration per case.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, k_lt_4_subtile) {
  for (size_t k = 1; k < 4; k++) {
    for (uint32_t n = 1; n <= 2; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(2)
          .kr(4)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
      }
    }
  }
}
1311*4bdc9457SAndroid Build Coastguard Worker
// Full 4x2 tile with k = 5..7 (above kr=4, below 2*kr).
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, k_gt_4) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(2)
      .kr(4)
      .sr(1)
      .m(4)
      .n(2)
      .k(k)
      .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
  }
}
1325*4bdc9457SAndroid Build Coastguard Worker
// k = 5..7 across every m in 1..4 and n in 1..2, one iteration per case.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, k_gt_4_subtile) {
  for (size_t k = 5; k < 8; k++) {
    for (uint32_t n = 1; n <= 2; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(2)
          .kr(4)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
      }
    }
  }
}
1344*4bdc9457SAndroid Build Coastguard Worker
// Full 4x2 tile with k = 8, 12, ..., 40 (multiples of kr=4).
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, k_div_4) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(2)
      .kr(4)
      .sr(1)
      .m(4)
      .n(2)
      .k(k)
      .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
  }
}
1358*4bdc9457SAndroid Build Coastguard Worker
// k = 8, 12, ..., 40 across every m in 1..4 and n in 1..2, one iteration per case.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, k_div_4_subtile) {
  for (size_t k = 8; k <= 40; k += 4) {
    for (uint32_t n = 1; n <= 2; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(2)
          .kr(4)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
      }
    }
  }
}
1377*4bdc9457SAndroid Build Coastguard Worker
// Full m=4 row tile with n = 3 (the only value in [3, 4)) and k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, n_gt_2) {
  for (uint32_t n = 3; n < 4; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(2)
        .kr(4)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
    }
  }
}
1393*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_2 (n = 3, k in {1, 6, 11, 16}, m=4) with cn_stride set to 5.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, n_gt_2_strided_cn) {
  for (uint32_t n = 3; n < 4; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(2)
        .kr(4)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .cn_stride(5)
        .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
    }
  }
}
1410*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 3, k in {1, 6, 11, 16} and every m in 1..4, one iteration per case.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, n_gt_2_subtile) {
  for (uint32_t n = 3; n < 4; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(2)
          .kr(4)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
      }
    }
  }
}
1429*4bdc9457SAndroid Build Coastguard Worker
// Full m=4 row tile with n in {4, 6} (multiples of nr=2) and k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, n_div_2) {
  for (uint32_t n = 4; n <= 6; n += 2) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(2)
        .kr(4)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
    }
  }
}
1445*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_2 (n in {4, 6}, k in {1, 6, 11, 16}, m=4) with cn_stride set to 5.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, n_div_2_strided_cn) {
  for (uint32_t n = 4; n <= 6; n += 2) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(2)
        .kr(4)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .cn_stride(5)
        .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
    }
  }
}
1462*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in {4, 6}, k in {1, 6, 11, 16} and every m in 1..4, one iteration per case.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, n_div_2_subtile) {
  for (uint32_t n = 4; n <= 6; n += 2) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(2)
          .kr(4)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
      }
    }
  }
}
1481*4bdc9457SAndroid Build Coastguard Worker
// Full 4x2 tile with ks set to 3, for k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, small_kernel) {
  for (size_t k = 1; k <= 20; k += 5) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(2)
      .kr(4)
      .sr(1)
      .m(4)
      .n(2)
      .k(k)
      .ks(3)
      .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
  }
}
1496*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=2, kr=4, sr=1) with ks(3) for k in {1, 6, 11, 16}, every n in
// [1, 2] and every m in [1, 4], with one iteration per configuration.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, small_kernel_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 2; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(2)
          .kr(4)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .ks(3)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
      }
    }
  }
}
1516*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=2, kr=4, sr=1) with m=4 and ks(3) for k in {1, 6, 11, 16}.
// The outer loop covers n in [3, 4), i.e. only n = 3.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, n_gt_2_small_kernel) {
  for (uint32_t n = 3; n < 4; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(2)
        .kr(4)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
    }
  }
}
1533*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=2, kr=4, sr=1) with m=4 and ks(3) for n in {4, 6} (multiples of
// nr greater than nr) and k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, n_div_2_small_kernel) {
  for (uint32_t n = 4; n <= 6; n += 2) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(2)
        .kr(4)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
    }
  }
}
1550*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=2, kr=4, sr=1) with cm_stride(5) for k in {1, 6, 11, 16}, every
// n in [1, 2] and every m in [1, 4], with one iteration per configuration.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, strided_cm_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 2; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(2)
          .kr(4)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(5)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
      }
    }
  }
}
1570*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=2, kr=4, sr=1) on a full m=4, n=2 problem with ks(3) and
// a_offset(83), for k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, a_offset) {
  for (size_t k = 1; k <= 20; k += 5) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(2)
      .kr(4)
      .sr(1)
      .m(4)
      .n(2)
      .k(k)
      .ks(3)
      .a_offset(83)
      .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
  }
}
1586*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=2, kr=4, sr=1) on a full m=4, n=2 problem with ks(3) and
// a_offset(83), for k in {1, 6, 11, 16}, passing each mz in [0, 3] to
// zero_index().
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, zero) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t mz = 0; mz < 4; mz++) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(2)
        .kr(4)
        .sr(1)
        .m(4)
        .n(2)
        .k(k)
        .ks(3)
        .a_offset(83)
        .zero_index(mz)
        .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
    }
  }
}
1605*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=2, kr=4, sr=1) on a single m=4, n=2, k=4 problem with
// cm_stride(5).
TEST(F32_IGEMM_RELU_4X2C4__WASMSIMD, strided_cm) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(2)
    .kr(4)
    .sr(1)
    .m(4)
    .n(2)
    .k(4)
    .cm_stride(5)
    .Test(xnn_f32_igemm_relu_ukernel_4x2c4__wasmsimd);
}
1618*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
1619*4bdc9457SAndroid Build Coastguard Worker
1620*4bdc9457SAndroid Build Coastguard Worker
1621*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) on a single m=4, n=8, k=4 problem.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, k_eq_4) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(4)
    .n(8)
    .k(4)
    .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
}
1633*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) on a single m=4, n=8, k=4 problem with
// cn_stride(11).
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, strided_cn) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(4)
    .n(8)
    .k(4)
    .cn_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
}
1646*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) with k=4 for every n in [1, 8] and every m in
// [1, 4], with one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, k_eq_4_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 4; m++) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(m)
        .n(n)
        .k(4)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
    }
  }
}
1663*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) with n=8 and k=4 for every m in [1, 4], with one
// iteration per configuration.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, k_eq_4_subtile_m) {
  for (uint32_t m = 1; m <= 4; m++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(m)
      .n(8)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
  }
}
1678*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) with m=4 and k=4 for every n in [1, 8], with one
// iteration per configuration.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, k_eq_4_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(4)
      .n(n)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
  }
}
1693*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) on a full m=4, n=8 problem for every k in [1, 3].
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, k_lt_4) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(4)
      .n(8)
      .k(k)
      .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
  }
}
1707*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) for every k in [1, 3], every n in [1, 8] and every
// m in [1, 4], with one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, k_lt_4_subtile) {
  for (size_t k = 1; k < 4; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
      }
    }
  }
}
1726*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) on a full m=4, n=8 problem for every k in [5, 7].
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, k_gt_4) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(4)
      .n(8)
      .k(k)
      .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
  }
}
1740*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) for every k in [5, 7], every n in [1, 8] and every
// m in [1, 4], with one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, k_gt_4_subtile) {
  for (size_t k = 5; k < 8; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
      }
    }
  }
}
1759*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) on a full m=4, n=8 problem for k = 8, 12, ..., 40
// (multiples of 4).
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, k_div_4) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(4)
      .n(8)
      .k(k)
      .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
  }
}
1773*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) for k = 8, 12, ..., 40 (multiples of 4), every n
// in [1, 8] and every m in [1, 4], with one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, k_div_4_subtile) {
  for (size_t k = 8; k <= 40; k += 4) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
      }
    }
  }
}
1792*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) with m=4 for every n in [9, 15] and
// k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(4)
        .n(n)
        .k(k)
        .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
    }
  }
}
1808*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) with m=4 and cn_stride(11) for every n in [9, 15]
// and k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(4)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
    }
  }
}
1825*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) for every n in [9, 15], k in {1, 6, 11, 16} and
// every m in [1, 4], with one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
      }
    }
  }
}
1844*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) with m=4 for n in {16, 24} (multiples of nr
// greater than nr) and k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(4)
        .n(n)
        .k(k)
        .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
    }
  }
}
1860*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) with m=4 and cn_stride(11) for n in {16, 24}
// (multiples of nr greater than nr) and k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(4)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
    }
  }
}
1877*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) for n in {16, 24} (multiples of nr greater than
// nr), k in {1, 6, 11, 16} and every m in [1, 4], with one iteration per
// configuration.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
      }
    }
  }
}
1896*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) on a full m=4, n=8 problem with ks(3), for
// k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, small_kernel) {
  for (size_t k = 1; k <= 20; k += 5) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(4)
      .n(8)
      .k(k)
      .ks(3)
      .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
  }
}
1911*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) with ks(3) for k in {1, 6, 11, 16}, every n in
// [1, 8] and every m in [1, 4], with one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, small_kernel_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .ks(3)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
      }
    }
  }
}
1931*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) with m=4 and ks(3) for every n in [9, 15] and
// k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, n_gt_8_small_kernel) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(4)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
    }
  }
}
1948*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) with m=4 and ks(3) for n in {16, 24} (multiples of
// nr greater than nr) and k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, n_div_8_small_kernel) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(4)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
    }
  }
}
1965*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd through GemmMicrokernelTester
// (mr=4, nr=8, kr=1, sr=4) with cm_stride(11) for k in {1, 6, 11, 16}, every
// n in [1, 8] and every m in [1, 4], with one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, strided_cm_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
      }
    }
  }
}
1985*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8s4 WAsm SIMD kernel on the full 4x8 tile with ks = 3 and
// a_offset = 83 for k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, a_offset) {
  for (size_t k_val = 1; k_val <= 20; k_val += 5) {
    auto tester = GemmMicrokernelTester();
    tester.mr(4).nr(8).kr(1).sr(4);
    tester.m(4).n(8).k(k_val);
    tester.ks(3).a_offset(83);
    tester.Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
  }
}
2001*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8s4 WAsm SIMD kernel on the full 4x8 tile with ks = 3 and
// a_offset = 83, sweeping zero_index over 0..3 for k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, zero) {
  for (size_t k_val = 1; k_val <= 20; k_val += 5) {
    for (uint32_t zero_idx = 0; zero_idx < 4; ++zero_idx) {
      auto tester = GemmMicrokernelTester();
      tester.mr(4).nr(8).kr(1).sr(4);
      tester.m(4).n(8).k(k_val);
      tester.ks(3).a_offset(83).zero_index(zero_idx);
      tester.Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
    }
  }
}
2020*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8s4 WAsm SIMD kernel once on the full 4x8 tile with k = 4 and
// cm_stride = 11.
TEST(F32_IGEMM_RELU_4X8S4__WASMSIMD, strided_cm) {
  auto tester = GemmMicrokernelTester();
  tester.mr(4).nr(8).kr(1).sr(4);
  tester.m(4).n(8).k(4);
  tester.cm_stride(11);
  tester.Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmsimd);
}
2033*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
2034*4bdc9457SAndroid Build Coastguard Worker
2035*4bdc9457SAndroid Build Coastguard Worker
2036*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Runs the 5x8s4 WAsm SIMD kernel once on the full 5x8 tile with k = 4.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, k_eq_4) {
  auto tester = GemmMicrokernelTester();
  tester.mr(5).nr(8).kr(1).sr(4);
  tester.m(5).n(8).k(4);
  tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
}
2048*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel once on the full 5x8 tile with k = 4 and
// cn_stride = 11.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, strided_cn) {
  auto tester = GemmMicrokernelTester();
  tester.mr(5).nr(8).kr(1).sr(4);
  tester.m(5).n(8).k(4);
  tester.cn_stride(11);
  tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
}
2061*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel with k = 4 for every n in [1, 8] and every
// m in [1, 5]; one iteration per configuration.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, k_eq_4_subtile) {
  for (uint32_t n_val = 1; n_val <= 8; ++n_val) {
    for (uint32_t m_val = 1; m_val <= 5; ++m_val) {
      auto tester = GemmMicrokernelTester();
      tester.mr(5).nr(8).kr(1).sr(4);
      tester.m(m_val).n(n_val).k(4);
      tester.iterations(1);
      tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
    }
  }
}
2078*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel with k = 4 and n = 8 for every m in [1, 5];
// one iteration per configuration.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, k_eq_4_subtile_m) {
  for (uint32_t m_val = 1; m_val <= 5; ++m_val) {
    auto tester = GemmMicrokernelTester();
    tester.mr(5).nr(8).kr(1).sr(4);
    tester.m(m_val).n(8).k(4);
    tester.iterations(1);
    tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
  }
}
2093*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel with k = 4 and m = 5 for every n in [1, 8];
// one iteration per configuration.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, k_eq_4_subtile_n) {
  for (uint32_t n_val = 1; n_val <= 8; ++n_val) {
    auto tester = GemmMicrokernelTester();
    tester.mr(5).nr(8).kr(1).sr(4);
    tester.m(5).n(n_val).k(4);
    tester.iterations(1);
    tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
  }
}
2108*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel on the full 5x8 tile for k = 1, 2, 3.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, k_lt_4) {
  for (size_t k_val = 1; k_val < 4; ++k_val) {
    auto tester = GemmMicrokernelTester();
    tester.mr(5).nr(8).kr(1).sr(4);
    tester.m(5).n(8).k(k_val);
    tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
  }
}
2122*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel for k = 1, 2, 3, every n in [1, 8] and
// every m in [1, 5]; one iteration per configuration.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, k_lt_4_subtile) {
  for (size_t k_val = 1; k_val < 4; ++k_val) {
    for (uint32_t n_val = 1; n_val <= 8; ++n_val) {
      for (uint32_t m_val = 1; m_val <= 5; ++m_val) {
        auto tester = GemmMicrokernelTester();
        tester.mr(5).nr(8).kr(1).sr(4);
        tester.m(m_val).n(n_val).k(k_val);
        tester.iterations(1);
        tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
      }
    }
  }
}
2141*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel on the full 5x8 tile for k = 5, 6, 7.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, k_gt_4) {
  for (size_t k_val = 5; k_val < 8; ++k_val) {
    auto tester = GemmMicrokernelTester();
    tester.mr(5).nr(8).kr(1).sr(4);
    tester.m(5).n(8).k(k_val);
    tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
  }
}
2155*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel for k = 5, 6, 7, every n in [1, 8] and
// every m in [1, 5]; one iteration per configuration.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, k_gt_4_subtile) {
  for (size_t k_val = 5; k_val < 8; ++k_val) {
    for (uint32_t n_val = 1; n_val <= 8; ++n_val) {
      for (uint32_t m_val = 1; m_val <= 5; ++m_val) {
        auto tester = GemmMicrokernelTester();
        tester.mr(5).nr(8).kr(1).sr(4);
        tester.m(m_val).n(n_val).k(k_val);
        tester.iterations(1);
        tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
      }
    }
  }
}
2174*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel on the full 5x8 tile for k = 8, 12, ..., 40.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, k_div_4) {
  for (size_t k_val = 8; k_val <= 40; k_val += 4) {
    auto tester = GemmMicrokernelTester();
    tester.mr(5).nr(8).kr(1).sr(4);
    tester.m(5).n(8).k(k_val);
    tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
  }
}
2188*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel for k = 8, 12, ..., 40, every n in [1, 8]
// and every m in [1, 5]; one iteration per configuration.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, k_div_4_subtile) {
  for (size_t k_val = 8; k_val <= 40; k_val += 4) {
    for (uint32_t n_val = 1; n_val <= 8; ++n_val) {
      for (uint32_t m_val = 1; m_val <= 5; ++m_val) {
        auto tester = GemmMicrokernelTester();
        tester.mr(5).nr(8).kr(1).sr(4);
        tester.m(m_val).n(n_val).k(k_val);
        tester.iterations(1);
        tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
      }
    }
  }
}
2207*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel with m = 5 for every n in [9, 15] and
// k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, n_gt_8) {
  for (uint32_t n_val = 9; n_val < 16; ++n_val) {
    for (size_t k_val = 1; k_val <= 20; k_val += 5) {
      auto tester = GemmMicrokernelTester();
      tester.mr(5).nr(8).kr(1).sr(4);
      tester.m(5).n(n_val).k(k_val);
      tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
    }
  }
}
2223*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel with m = 5 and cn_stride = 11 for every n
// in [9, 15] and k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, n_gt_8_strided_cn) {
  for (uint32_t n_val = 9; n_val < 16; ++n_val) {
    for (size_t k_val = 1; k_val <= 20; k_val += 5) {
      auto tester = GemmMicrokernelTester();
      tester.mr(5).nr(8).kr(1).sr(4);
      tester.m(5).n(n_val).k(k_val);
      tester.cn_stride(11);
      tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
    }
  }
}
2240*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel for every n in [9, 15], k = 1, 6, 11, 16
// and every m in [1, 5]; one iteration per configuration.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, n_gt_8_subtile) {
  for (uint32_t n_val = 9; n_val < 16; ++n_val) {
    for (size_t k_val = 1; k_val <= 20; k_val += 5) {
      for (uint32_t m_val = 1; m_val <= 5; ++m_val) {
        auto tester = GemmMicrokernelTester();
        tester.mr(5).nr(8).kr(1).sr(4);
        tester.m(m_val).n(n_val).k(k_val);
        tester.iterations(1);
        tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
      }
    }
  }
}
2259*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel with m = 5 for n = 16, 24 and
// k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, n_div_8) {
  for (uint32_t n_val = 16; n_val <= 24; n_val += 8) {
    for (size_t k_val = 1; k_val <= 20; k_val += 5) {
      auto tester = GemmMicrokernelTester();
      tester.mr(5).nr(8).kr(1).sr(4);
      tester.m(5).n(n_val).k(k_val);
      tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
    }
  }
}
2275*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel with m = 5 and cn_stride = 11 for
// n = 16, 24 and k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, n_div_8_strided_cn) {
  for (uint32_t n_val = 16; n_val <= 24; n_val += 8) {
    for (size_t k_val = 1; k_val <= 20; k_val += 5) {
      auto tester = GemmMicrokernelTester();
      tester.mr(5).nr(8).kr(1).sr(4);
      tester.m(5).n(n_val).k(k_val);
      tester.cn_stride(11);
      tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
    }
  }
}
2292*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel for n = 16, 24, k = 1, 6, 11, 16 and every
// m in [1, 5]; one iteration per configuration.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, n_div_8_subtile) {
  for (uint32_t n_val = 16; n_val <= 24; n_val += 8) {
    for (size_t k_val = 1; k_val <= 20; k_val += 5) {
      for (uint32_t m_val = 1; m_val <= 5; ++m_val) {
        auto tester = GemmMicrokernelTester();
        tester.mr(5).nr(8).kr(1).sr(4);
        tester.m(m_val).n(n_val).k(k_val);
        tester.iterations(1);
        tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
      }
    }
  }
}
2311*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel on the full 5x8 tile with ks = 3 for
// k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, small_kernel) {
  for (size_t k_val = 1; k_val <= 20; k_val += 5) {
    auto tester = GemmMicrokernelTester();
    tester.mr(5).nr(8).kr(1).sr(4);
    tester.m(5).n(8).k(k_val);
    tester.ks(3);
    tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
  }
}
2326*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel with ks = 3 for k = 1, 6, 11, 16, every n
// in [1, 8] and every m in [1, 5]; one iteration per configuration.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, small_kernel_subtile) {
  for (size_t k_val = 1; k_val <= 20; k_val += 5) {
    for (uint32_t n_val = 1; n_val <= 8; ++n_val) {
      for (uint32_t m_val = 1; m_val <= 5; ++m_val) {
        auto tester = GemmMicrokernelTester();
        tester.mr(5).nr(8).kr(1).sr(4);
        tester.m(m_val).n(n_val).k(k_val);
        tester.ks(3).iterations(1);
        tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
      }
    }
  }
}
2346*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel with m = 5 and ks = 3 for every n in
// [9, 15] and k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, n_gt_8_small_kernel) {
  for (uint32_t n_val = 9; n_val < 16; ++n_val) {
    for (size_t k_val = 1; k_val <= 20; k_val += 5) {
      auto tester = GemmMicrokernelTester();
      tester.mr(5).nr(8).kr(1).sr(4);
      tester.m(5).n(n_val).k(k_val);
      tester.ks(3);
      tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
    }
  }
}
2363*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel with m = 5 and ks = 3 for n = 16, 24 and
// k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, n_div_8_small_kernel) {
  for (uint32_t n_val = 16; n_val <= 24; n_val += 8) {
    for (size_t k_val = 1; k_val <= 20; k_val += 5) {
      auto tester = GemmMicrokernelTester();
      tester.mr(5).nr(8).kr(1).sr(4);
      tester.m(5).n(n_val).k(k_val);
      tester.ks(3);
      tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
    }
  }
}
2380*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel with cm_stride 11 for k = 1, 6, 11, 16,
// every n in [1, 8] and every m in [1, 5]; one iteration per configuration.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, strided_cm_subtile) {
  for (size_t k_val = 1; k_val <= 20; k_val += 5) {
    for (uint32_t n_val = 1; n_val <= 8; ++n_val) {
      for (uint32_t m_val = 1; m_val <= 5; ++m_val) {
        auto tester = GemmMicrokernelTester();
        tester.mr(5).nr(8).kr(1).sr(4);
        tester.m(m_val).n(n_val).k(k_val);
        tester.cm_stride(11).iterations(1);
        tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
      }
    }
  }
}
2400*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel on the full 5x8 tile with ks = 3 and
// a_offset = 103 for k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, a_offset) {
  for (size_t k_val = 1; k_val <= 20; k_val += 5) {
    auto tester = GemmMicrokernelTester();
    tester.mr(5).nr(8).kr(1).sr(4);
    tester.m(5).n(8).k(k_val);
    tester.ks(3).a_offset(103);
    tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
  }
}
2416*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel on the full 5x8 tile with ks = 3 and
// a_offset = 103, sweeping zero_index over 0..4 for k = 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, zero) {
  for (size_t k_val = 1; k_val <= 20; k_val += 5) {
    for (uint32_t zero_idx = 0; zero_idx < 5; ++zero_idx) {
      auto tester = GemmMicrokernelTester();
      tester.mr(5).nr(8).kr(1).sr(4);
      tester.m(5).n(8).k(k_val);
      tester.ks(3).a_offset(103).zero_index(zero_idx);
      tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
    }
  }
}
2435*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8s4 WAsm SIMD kernel once on the full 5x8 tile with k = 4 and
// cm_stride = 11.
TEST(F32_IGEMM_RELU_5X8S4__WASMSIMD, strided_cm) {
  auto tester = GemmMicrokernelTester();
  tester.mr(5).nr(8).kr(1).sr(4);
  tester.m(5).n(8).k(4);
  tester.cm_stride(11);
  tester.Test(xnn_f32_igemm_relu_ukernel_5x8s4__wasmsimd);
}
2448*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
2449*4bdc9457SAndroid Build Coastguard Worker
2450*4bdc9457SAndroid Build Coastguard Worker
2451*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Runs the 6x8 WAsm SIMD loadsplat kernel once on the full 6x8 tile with k = 1.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, k_eq_1) {
  auto tester = GemmMicrokernelTester();
  tester.mr(6).nr(8).kr(1).sr(1);
  tester.m(6).n(8).k(1);
  tester.Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
}
2463*4bdc9457SAndroid Build Coastguard Worker
// Runs the 6x8 WAsm SIMD loadsplat kernel once on the full 6x8 tile with
// k = 1 and cn_stride = 11.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, strided_cn) {
  auto tester = GemmMicrokernelTester();
  tester.mr(6).nr(8).kr(1).sr(1);
  tester.m(6).n(8).k(1);
  tester.cn_stride(11);
  tester.Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
}
2476*4bdc9457SAndroid Build Coastguard Worker
// Sweeps every (m, n) pair with 1 <= m <= 6 and 1 <= n <= 8 at k = 1.
// iterations(1) is set on every run (presumably to limit runtime across the
// sweep; confirm in GemmMicrokernelTester).
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 6; m++) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(1)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
    }
  }
}
2493*4bdc9457SAndroid Build Coastguard Worker
// Varies m from 1 to 6 while n stays at 8 and k at 1; iterations(1) is set
// on every run.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_m) {
  for (uint32_t m = 1; m <= 6; m++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(m)
      .n(8)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
  }
}
2508*4bdc9457SAndroid Build Coastguard Worker
// Varies n from 1 to 8 while m stays at 6 and k at 1; iterations(1) is set
// on every run.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(n)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
  }
}
2523*4bdc9457SAndroid Build Coastguard Worker
// Runs the kernel with m = 6, n = 8 for every k from 2 through 9.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, k_gt_1) {
  for (size_t k = 2; k < 10; k++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(8)
      .k(k)
      .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
  }
}
2537*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k from 2 through 9 against every (m, n) pair with 1 <= m <= 6 and
// 1 <= n <= 8; iterations(1) is set on every run.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, k_gt_1_subtile) {
  for (size_t k = 2; k < 10; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
      }
    }
  }
}
2556*4bdc9457SAndroid Build Coastguard Worker
// Runs the kernel with m = 6 for n from 9 through 15 (all greater than nr)
// and k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
    }
  }
}
2572*4bdc9457SAndroid Build Coastguard Worker
// Runs the kernel with m = 6 for n from 9 through 15 and k in {1, 3, 5},
// with cn_stride set to 11 on every run.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
    }
  }
}
2589*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n from 9 through 15, k in {1, 3, 5} and m from 1 through 6;
// iterations(1) is set on every run.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
      }
    }
  }
}
2608*4bdc9457SAndroid Build Coastguard Worker
// Runs the kernel with m = 6 for n in {16, 24} (multiples of nr = 8) and
// k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
    }
  }
}
2624*4bdc9457SAndroid Build Coastguard Worker
// Runs the kernel with m = 6 for n in {16, 24} and k in {1, 3, 5}, with
// cn_stride set to 11 on every run.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
    }
  }
}
2641*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in {16, 24}, k in {1, 3, 5} and m from 1 through 6;
// iterations(1) is set on every run.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
      }
    }
  }
}
2660*4bdc9457SAndroid Build Coastguard Worker
// Runs the kernel with m = 6, n = 8 and ks set to 3 for k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, small_kernel) {
  for (size_t k = 1; k <= 5; k += 2) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(8)
      .k(k)
      .ks(3)
      .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
  }
}
2675*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k in {1, 3, 5} against every (m, n) pair with 1 <= m <= 6 and
// 1 <= n <= 8, with ks set to 3; iterations(1) is set on every run.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, small_kernel_subtile) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .ks(3)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
      }
    }
  }
}
2695*4bdc9457SAndroid Build Coastguard Worker
// Runs the kernel with m = 6 and ks set to 3 for n from 9 through 15 and
// k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, n_gt_8_small_kernel) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
    }
  }
}
2712*4bdc9457SAndroid Build Coastguard Worker
// Runs the kernel with m = 6 and ks set to 3 for n in {16, 24} and
// k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, n_div_8_small_kernel) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
    }
  }
}
2729*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k in {1, 3, 5} against every (m, n) pair with 1 <= m <= 6 and
// 1 <= n <= 8, with cm_stride set to 11; iterations(1) is set on every run.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, strided_cm_subtile) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
      }
    }
  }
}
2749*4bdc9457SAndroid Build Coastguard Worker
// Runs the kernel with m = 6, n = 8, ks set to 3 and a_offset set to 37
// for k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, a_offset) {
  for (size_t k = 1; k <= 5; k += 2) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(8)
      .k(k)
      .ks(3)
      .a_offset(37)
      .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
  }
}
2765*4bdc9457SAndroid Build Coastguard Worker
// For k in {1, 3, 5}, runs the kernel with m = 6, n = 8, ks = 3 and
// a_offset = 37 while zero_index takes each value mz from 0 through 5.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, zero) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t mz = 0; mz < 6; mz++) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(8)
        .k(k)
        .ks(3)
        .a_offset(37)
        .zero_index(mz)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
    }
  }
}
2784*4bdc9457SAndroid Build Coastguard Worker
// Runs the 6x8 loadsplat kernel once with m = 6, n = 8, k = 1 and
// cm_stride set to 11.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_LOADSPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(6)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(6)
    .n(8)
    .k(1)
    .cm_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_loadsplat);
}
2797*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
2798*4bdc9457SAndroid Build Coastguard Worker
2799*4bdc9457SAndroid Build Coastguard Worker
2800*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Runs the 6x8 splat kernel once with m = 6 and n = 8 (equal to the
// configured mr and nr) and k = 4.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, k_eq_4) {
  GemmMicrokernelTester()
    .mr(6)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(6)
    .n(8)
    .k(4)
    .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
}
2812*4bdc9457SAndroid Build Coastguard Worker
// Runs the 6x8 splat kernel once with m = 6, n = 8, k = 4 and cn_stride
// set to 11, a value larger than nr (8).
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(6)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(6)
    .n(8)
    .k(4)
    .cn_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
}
2825*4bdc9457SAndroid Build Coastguard Worker
// Sweeps every (m, n) pair with 1 <= m <= 6 and 1 <= n <= 8 at k = 4.
// iterations(1) is set on every run (presumably to limit runtime across the
// sweep; confirm in GemmMicrokernelTester).
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, k_eq_4_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 6; m++) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(4)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
    }
  }
}
2842*4bdc9457SAndroid Build Coastguard Worker
// Varies m from 1 to 6 while n stays at 8 and k at 4; iterations(1) is set
// on every run.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, k_eq_4_subtile_m) {
  for (uint32_t m = 1; m <= 6; m++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(m)
      .n(8)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
  }
}
2857*4bdc9457SAndroid Build Coastguard Worker
// Varies n from 1 to 8 while m stays at 6 and k at 4; iterations(1) is set
// on every run.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, k_eq_4_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(n)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
  }
}
2872*4bdc9457SAndroid Build Coastguard Worker
// Runs the kernel with m = 6, n = 8 for every k from 1 through 3.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, k_lt_4) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(8)
      .k(k)
      .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
  }
}
2886*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k from 1 through 3 against every (m, n) pair with 1 <= m <= 6 and
// 1 <= n <= 8; iterations(1) is set on every run.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, k_lt_4_subtile) {
  for (size_t k = 1; k < 4; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
      }
    }
  }
}
2905*4bdc9457SAndroid Build Coastguard Worker
// Runs the kernel with m = 6, n = 8 for every k from 5 through 7.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, k_gt_4) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(8)
      .k(k)
      .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
  }
}
2919*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k from 5 through 7 against every (m, n) pair with 1 <= m <= 6 and
// 1 <= n <= 8; iterations(1) is set on every run.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, k_gt_4_subtile) {
  for (size_t k = 5; k < 8; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
      }
    }
  }
}
2938*4bdc9457SAndroid Build Coastguard Worker
// Runs the kernel with m = 6, n = 8 for k = 8, 12, ..., 40 (multiples of 4).
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, k_div_4) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(8)
      .k(k)
      .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
  }
}
2952*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 8, 12, ..., 40 against every (m, n) pair with 1 <= m <= 6 and
// 1 <= n <= 8; iterations(1) is set on every run.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, k_div_4_subtile) {
  for (size_t k = 8; k <= 40; k += 4) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
      }
    }
  }
}
2971*4bdc9457SAndroid Build Coastguard Worker
// Covers n in 9..15 (above nr=8) with m=6 and k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, n_gt_8) {
  for (uint32_t n_size = 9; n_size < 16; n_size++) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(n_size).k(k_size)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
    }
  }
}
2987*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (n in 9..15, k in {1, 6, 11, 16}, m=6), but with
// cn_stride set to 11.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, n_gt_8_strided_cn) {
  for (uint32_t n_size = 9; n_size < 16; n_size++) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
    }
  }
}
3004*4bdc9457SAndroid Build Coastguard Worker
// For n in 9..15 and k in {1, 6, 11, 16}, tries every m in 1..6 with a single
// iteration per configuration.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, n_gt_8_subtile) {
  for (uint32_t n_size = 9; n_size < 16; n_size++) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      for (uint32_t m_size = 1; m_size <= 6; m_size++) {
        GemmMicrokernelTester()
            .mr(6).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
      }
    }
  }
}
3023*4bdc9457SAndroid Build Coastguard Worker
// Covers n in {16, 24} (multiples of nr=8) with m=6 and k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, n_div_8) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(n_size).k(k_size)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
    }
  }
}
3039*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (n in {16, 24}, k in {1, 6, 11, 16}, m=6), but with
// cn_stride set to 11.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, n_div_8_strided_cn) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
    }
  }
}
3056*4bdc9457SAndroid Build Coastguard Worker
// For n in {16, 24} and k in {1, 6, 11, 16}, tries every m in 1..6 with a
// single iteration per configuration.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, n_div_8_subtile) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      for (uint32_t m_size = 1; m_size <= 6; m_size++) {
        GemmMicrokernelTester()
            .mr(6).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
      }
    }
  }
}
3075*4bdc9457SAndroid Build Coastguard Worker
// Full 6x8 configuration (m=6, n=8) with ks set to 3, for k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, small_kernel) {
  for (size_t k_size = 1; k_size <= 20; k_size += 5) {
    GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(6).n(8).k(k_size)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
  }
}
3090*4bdc9457SAndroid Build Coastguard Worker
// With ks set to 3, sweeps k in {1, 6, 11, 16} across every (m, n) pair with
// m in 1..6 and n in 1..8; one iteration per configuration.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, small_kernel_subtile) {
  for (size_t k_size = 1; k_size <= 20; k_size += 5) {
    for (uint32_t n_size = 1; n_size <= 8; n_size++) {
      for (uint32_t m_size = 1; m_size <= 6; m_size++) {
        GemmMicrokernelTester()
            .mr(6).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .ks(3)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
      }
    }
  }
}
3110*4bdc9457SAndroid Build Coastguard Worker
// With ks set to 3, covers n in 9..15 and k in {1, 6, 11, 16} at m=6.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, n_gt_8_small_kernel) {
  for (uint32_t n_size = 9; n_size < 16; n_size++) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(n_size).k(k_size)
          .ks(3)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
    }
  }
}
3127*4bdc9457SAndroid Build Coastguard Worker
// With ks set to 3, covers n in {16, 24} and k in {1, 6, 11, 16} at m=6.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, n_div_8_small_kernel) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(n_size).k(k_size)
          .ks(3)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
    }
  }
}
3144*4bdc9457SAndroid Build Coastguard Worker
// With cm_stride set to 11, sweeps k in {1, 6, 11, 16} across every (m, n)
// pair with m in 1..6 and n in 1..8; one iteration per configuration.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, strided_cm_subtile) {
  for (size_t k_size = 1; k_size <= 20; k_size += 5) {
    for (uint32_t n_size = 1; n_size <= 8; n_size++) {
      for (uint32_t m_size = 1; m_size <= 6; m_size++) {
        GemmMicrokernelTester()
            .mr(6).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .cm_stride(11)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
      }
    }
  }
}
3164*4bdc9457SAndroid Build Coastguard Worker
// Full 6x8 configuration with ks set to 3 and a_offset set to 127, for
// k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, a_offset) {
  for (size_t k_size = 1; k_size <= 20; k_size += 5) {
    GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(6).n(8).k(k_size)
        .ks(3)
        .a_offset(127)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
  }
}
3180*4bdc9457SAndroid Build Coastguard Worker
// Same setup as a_offset (ks=3, a_offset=127, m=6, n=8), additionally passing
// each zero_index value from 0 through 5 for every k in {1, 6, 11, 16}.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, zero) {
  for (size_t k_size = 1; k_size <= 20; k_size += 5) {
    for (uint32_t zero_idx = 0; zero_idx < 6; zero_idx++) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(8).k(k_size)
          .ks(3)
          .a_offset(127)
          .zero_index(zero_idx)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
    }
  }
}
3199*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m=6, n=8, k=4 with cm_stride set to 11.
TEST(F32_IGEMM_RELU_6X8__WASMSIMD_SPLAT, strided_cm) {
  GemmMicrokernelTester()
      .mr(6).nr(8).kr(1).sr(1)
      .m(6).n(8).k(4)
      .cm_stride(11)
      .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmsimd_splat);
}
3212*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
3213*4bdc9457SAndroid Build Coastguard Worker
3214*4bdc9457SAndroid Build Coastguard Worker
3215*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// Single configuration for the 1x8 relaxed-SIMD FMA "loadsplat" kernel:
// m=1, n=8, k=1.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1) {
  GemmMicrokernelTester()
      .mr(1).nr(8).kr(1).sr(1)
      .m(1).n(8).k(1)
      .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
}
3227*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m=1, n=8, k=1 with cn_stride set to 11.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cn) {
  GemmMicrokernelTester()
      .mr(1).nr(8).kr(1).sr(1)
      .m(1).n(8).k(1)
      .cn_stride(11)
      .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
}
3240*4bdc9457SAndroid Build Coastguard Worker
// With k=1, tries every n in 1..8; one iteration per configuration.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile) {
  for (uint32_t n_size = 1; n_size <= 8; n_size++) {
    // mr is 1, so the only m value to cover is 1.
    const uint32_t m_size = 1;
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(1)
        .m(m_size).n(n_size).k(1)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
3257*4bdc9457SAndroid Build Coastguard Worker
// With k=1 and n=8, covers the m range 1..mr; since mr is 1 this is a single
// configuration, run for one iteration.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_m) {
  const uint32_t m_size = 1;
  GemmMicrokernelTester()
      .mr(1).nr(8).kr(1).sr(1)
      .m(m_size).n(8).k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
}
3272*4bdc9457SAndroid Build Coastguard Worker
// With k=1 and m=1, tries every n in 1..8; one iteration per configuration.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_n) {
  for (uint32_t n_size = 1; n_size <= 8; n_size++) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(1)
        .m(1).n(n_size).k(1)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
3287*4bdc9457SAndroid Build Coastguard Worker
// Full 1x8 configuration (m=1, n=8) with k running from 2 through 9.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1) {
  for (size_t k_size = 2; k_size < 10; k_size++) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(1)
        .m(1).n(8).k(k_size)
        .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
3301*4bdc9457SAndroid Build Coastguard Worker
// For k in 2..9, tries every n in 1..8; one iteration per configuration.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_subtile) {
  for (size_t k_size = 2; k_size < 10; k_size++) {
    for (uint32_t n_size = 1; n_size <= 8; n_size++) {
      // mr is 1, so the only m value to cover is 1.
      const uint32_t m_size = 1;
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(m_size).n(n_size).k(k_size)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
3320*4bdc9457SAndroid Build Coastguard Worker
// Covers n in 9..15 (above nr=8) with m=1 and k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8) {
  for (uint32_t n_size = 9; n_size < 16; n_size++) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(1).n(n_size).k(k_size)
          .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
3336*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (n in 9..15, k in {1, 3, 5}, m=1), but with cn_stride
// set to 11.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_cn) {
  for (uint32_t n_size = 9; n_size < 16; n_size++) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(1).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
3353*4bdc9457SAndroid Build Coastguard Worker
// For n in 9..15 and k in {1, 3, 5}, runs one iteration per configuration.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_subtile) {
  for (uint32_t n_size = 9; n_size < 16; n_size++) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      // mr is 1, so the only m value to cover is 1.
      const uint32_t m_size = 1;
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(m_size).n(n_size).k(k_size)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
3372*4bdc9457SAndroid Build Coastguard Worker
// Covers n in {16, 24} (multiples of nr=8) with m=1 and k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(1).n(n_size).k(k_size)
          .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
3388*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (n in {16, 24}, k in {1, 3, 5}, m=1), but with
// cn_stride set to 11.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_cn) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(1).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
3405*4bdc9457SAndroid Build Coastguard Worker
// For n in {16, 24} and k in {1, 3, 5}, runs one iteration per configuration.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_subtile) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      // mr is 1, so the only m value to cover is 1.
      const uint32_t m_size = 1;
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(m_size).n(n_size).k(k_size)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
3424*4bdc9457SAndroid Build Coastguard Worker
// Full 1x8 configuration (m=1, n=8) with ks set to 3, for k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, small_kernel) {
  for (size_t k_size = 1; k_size <= 5; k_size += 2) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(1)
        .m(1).n(8).k(k_size)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
3439*4bdc9457SAndroid Build Coastguard Worker
// With ks set to 3, sweeps k in {1, 3, 5} across every n in 1..8; one
// iteration per configuration.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, small_kernel_subtile) {
  for (size_t k_size = 1; k_size <= 5; k_size += 2) {
    for (uint32_t n_size = 1; n_size <= 8; n_size++) {
      // mr is 1, so the only m value to cover is 1.
      const uint32_t m_size = 1;
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(m_size).n(n_size).k(k_size)
          .ks(3)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
3459*4bdc9457SAndroid Build Coastguard Worker
// n_gt_8_small_kernel: m = 1 with ks = 3, swept over n in [9, 15] (above nr = 8)
// and k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_small_kernel) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}

// n_div_8_small_kernel: m = 1 with ks = 3, swept over n in {16, 24} (multiples
// of nr = 8) and k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_small_kernel) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}

// strided_cm_subtile: cm_stride = 11 and iterations = 1, swept over
// k in {1, 3, 5}, n in [1, 8] and m in [1, 1].
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm_subtile) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}

// a_offset: m = mr = 1 and n = nr = 8 with ks = 3 and a_offset = 7, swept over
// k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, a_offset) {
  for (size_t k = 1; k <= 5; k += 2) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(8)
      .k(k)
      .ks(3)
      .a_offset(7)
      .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
  }
}

// zero: same configuration as the a_offset case (ks = 3, a_offset = 7) plus
// zero_index(mz), swept over k in {1, 3, 5} and mz in [0, 0] (mr is 1, so mz
// only takes the value 0).
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, zero) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t mz = 0; mz < 1; mz++) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(8)
        .k(k)
        .ks(3)
        .a_offset(7)
        .zero_index(mz)
        .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}

// strided_cm: single case with m = mr = 1, n = nr = 8, k = 1 and cm_stride = 11.
TEST(F32_IGEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(1)
    .n(8)
    .k(1)
    .cm_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
}
3561*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
3562*4bdc9457SAndroid Build Coastguard Worker
3563*4bdc9457SAndroid Build Coastguard Worker
3564*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// k_eq_1: single case with m = mr = 3, n = nr = 8 and k = 1.
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(3)
    .n(8)
    .k(1)
    .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
}

// strided_cn: single case with m = mr = 3, n = nr = 8, k = 1 and cn_stride = 11.
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(3)
    .n(8)
    .k(1)
    .cn_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
}

// k_eq_1_subtile: k = 1 and iterations = 1, swept over n in [1, 8] and
// m in [1, 3].
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 3; m++) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(1)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}

// k_eq_1_subtile_m: k = 1, n = nr = 8 and iterations = 1, swept over m in [1, 3].
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_m) {
  for (uint32_t m = 1; m <= 3; m++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(m)
      .n(8)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
  }
}

// k_eq_1_subtile_n: k = 1, m = mr = 3 and iterations = 1, swept over n in [1, 8].
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(3)
      .n(n)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
  }
}

// k_gt_1: m = mr = 3 and n = nr = 8, swept over k in [2, 9].
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1) {
  for (size_t k = 2; k < 10; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(3)
      .n(8)
      .k(k)
      .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
  }
}

// k_gt_1_subtile: iterations = 1, swept over k in [2, 9], n in [1, 8] and
// m in [1, 3].
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_subtile) {
  for (size_t k = 2; k < 10; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}

// n_gt_8: m = mr = 3, swept over n in [9, 15] (above nr = 8) and k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(3)
        .n(n)
        .k(k)
        .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}

// n_gt_8_strided_cn: m = mr = 3 with cn_stride = 11, swept over n in [9, 15]
// and k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(3)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}

// n_gt_8_subtile: iterations = 1, swept over n in [9, 15], k in {1, 3, 5} and
// m in [1, 3].
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}

// n_div_8: m = mr = 3, swept over n in {16, 24} (multiples of nr = 8) and
// k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(3)
        .n(n)
        .k(k)
        .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}

// n_div_8_strided_cn: m = mr = 3 with cn_stride = 11, swept over n in {16, 24}
// and k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(3)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}

// n_div_8_subtile: iterations = 1, swept over n in {16, 24}, k in {1, 3, 5} and
// m in [1, 3].
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}

// small_kernel: m = mr = 3 and n = nr = 8 with ks = 3, swept over k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, small_kernel) {
  for (size_t k = 1; k <= 5; k += 2) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(3)
      .n(8)
      .k(k)
      .ks(3)
      .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
  }
}

// small_kernel_subtile: ks = 3 and iterations = 1, swept over k in {1, 3, 5},
// n in [1, 8] and m in [1, 3].
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, small_kernel_subtile) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .ks(3)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}

// n_gt_8_small_kernel: m = mr = 3 with ks = 3, swept over n in [9, 15] and
// k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_small_kernel) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(3)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}

// n_div_8_small_kernel: m = mr = 3 with ks = 3, swept over n in {16, 24} and
// k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_small_kernel) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(3)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}

// strided_cm_subtile: cm_stride = 11 and iterations = 1, swept over
// k in {1, 3, 5}, n in [1, 8] and m in [1, 3].
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm_subtile) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}

// a_offset: m = mr = 3 and n = nr = 8 with ks = 3 and a_offset = 17, swept over
// k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, a_offset) {
  for (size_t k = 1; k <= 5; k += 2) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(3)
      .n(8)
      .k(k)
      .ks(3)
      .a_offset(17)
      .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
  }
}

// zero: same configuration as the a_offset case (ks = 3, a_offset = 17) plus
// zero_index(mz), swept over k in {1, 3, 5} and mz in [0, 2].
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, zero) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t mz = 0; mz < 3; mz++) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(3)
        .n(8)
        .k(k)
        .ks(3)
        .a_offset(17)
        .zero_index(mz)
        .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}

// strided_cm: single case with m = mr = 3, n = nr = 8, k = 1 and cm_stride = 11.
TEST(F32_IGEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(3)
    .n(8)
    .k(1)
    .cm_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
}
3910*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
3911*4bdc9457SAndroid Build Coastguard Worker
3912*4bdc9457SAndroid Build Coastguard Worker
3913*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// One run with m = 3, n = 8 and k = 4.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_eq_4) {
  GemmMicrokernelTester()
    .mr(3).nr(8).kr(1).sr(4)
    .m(3).n(8).k(4)
    .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
}
3925*4bdc9457SAndroid Build Coastguard Worker
// One run with m = 3, n = 8, k = 4 and cn_stride set to 11.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, strided_cn) {
  GemmMicrokernelTester()
    .mr(3).nr(8).kr(1).sr(4)
    .m(3).n(8).k(4)
    .cn_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
}
3938*4bdc9457SAndroid Build Coastguard Worker
// Sweeps every (n, m) pair with n in [1, 8] and m in [1, 3] at k = 4,
// using a single iteration per configuration.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile) {
  for (uint32_t cols = 1; cols <= 8; ++cols) {
    for (uint32_t rows = 1; rows <= 3; ++rows) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(4)
        .m(rows).n(cols).k(4)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
3955*4bdc9457SAndroid Build Coastguard Worker
// Sweeps m over [1, 3] with n = 8 and k = 4, one iteration each.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_m) {
  for (uint32_t rows = 1; rows <= 3; ++rows) {
    GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(4)
      .m(rows).n(8).k(4)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
3970*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over [1, 8] with m = 3 and k = 4, one iteration each.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_n) {
  for (uint32_t cols = 1; cols <= 8; ++cols) {
    GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(4)
      .m(3).n(cols).k(4)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
3985*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 1, 2, 3 (all values below 4) with m = 3 and n = 8.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_lt_4) {
  for (size_t depth = 1; depth < 4; ++depth) {
    GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(4)
      .m(3).n(8).k(depth)
      .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
3999*4bdc9457SAndroid Build Coastguard Worker
// For k in {1, 2, 3}, sweeps n over [1, 8] and m over [1, 3],
// one iteration per configuration.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_subtile) {
  for (size_t depth = 1; depth < 4; ++depth) {
    for (uint32_t cols = 1; cols <= 8; ++cols) {
      for (uint32_t rows = 1; rows <= 3; ++rows) {
        GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(4)
          .m(rows).n(cols).k(depth)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4018*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 5, 6, 7 with m = 3 and n = 8.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_gt_4) {
  for (size_t depth = 5; depth < 8; ++depth) {
    GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(4)
      .m(3).n(8).k(depth)
      .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
4032*4bdc9457SAndroid Build Coastguard Worker
// For k in {5, 6, 7}, sweeps n over [1, 8] and m over [1, 3],
// one iteration per configuration.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_subtile) {
  for (size_t depth = 5; depth < 8; ++depth) {
    for (uint32_t cols = 1; cols <= 8; ++cols) {
      for (uint32_t rows = 1; rows <= 3; ++rows) {
        GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(4)
          .m(rows).n(cols).k(depth)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4051*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over the multiples of 4 from 8 through 40 with m = 3 and n = 8.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_div_4) {
  for (size_t depth = 8; depth <= 40; depth += 4) {
    GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(4)
      .m(3).n(8).k(depth)
      .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
4065*4bdc9457SAndroid Build Coastguard Worker
// For each multiple of 4 from 8 through 40 as k, sweeps n over [1, 8] and
// m over [1, 3], one iteration per configuration.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_div_4_subtile) {
  for (size_t depth = 8; depth <= 40; depth += 4) {
    for (uint32_t cols = 1; cols <= 8; ++cols) {
      for (uint32_t rows = 1; rows <= 3; ++rows) {
        GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(4)
          .m(rows).n(cols).k(depth)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4084*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over [9, 15] and k over 1, 6, 11, 16 with m = 3.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, n_gt_8) {
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(4)
        .m(3).n(cols).k(depth)
        .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4100*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over [9, 15] and k over 1, 6, 11, 16 with m = 3 and
// cn_stride set to 11.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_cn) {
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(4)
        .m(3).n(cols).k(depth)
        .cn_stride(11)
        .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4117*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over [9, 15], k over 1, 6, 11, 16 and m over [1, 3],
// one iteration per configuration.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_subtile) {
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      for (uint32_t rows = 1; rows <= 3; ++rows) {
        GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(4)
          .m(rows).n(cols).k(depth)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4136*4bdc9457SAndroid Build Coastguard Worker
// Runs n = 16 and n = 24 against k in 1, 6, 11, 16 with m = 3.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, n_div_8) {
  for (uint32_t cols = 16; cols <= 24; cols += 8) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(4)
        .m(3).n(cols).k(depth)
        .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4152*4bdc9457SAndroid Build Coastguard Worker
// Runs n = 16 and n = 24 against k in 1, 6, 11, 16 with m = 3 and
// cn_stride set to 11.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_cn) {
  for (uint32_t cols = 16; cols <= 24; cols += 8) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(4)
        .m(3).n(cols).k(depth)
        .cn_stride(11)
        .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4169*4bdc9457SAndroid Build Coastguard Worker
// Runs n = 16 and n = 24 against k in 1, 6, 11, 16 and m in [1, 3],
// one iteration per configuration.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, n_div_8_subtile) {
  for (uint32_t cols = 16; cols <= 24; cols += 8) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      for (uint32_t rows = 1; rows <= 3; ++rows) {
        GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(4)
          .m(rows).n(cols).k(depth)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4188*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 1, 6, 11, 16 with m = 3, n = 8 and ks set to 3.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, small_kernel) {
  for (size_t depth = 1; depth <= 20; depth += 5) {
    GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(4)
      .m(3).n(8).k(depth)
      .ks(3)
      .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
4203*4bdc9457SAndroid Build Coastguard Worker
// With ks set to 3, sweeps k over 1, 6, 11, 16, n over [1, 8] and
// m over [1, 3], one iteration per configuration.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, small_kernel_subtile) {
  for (size_t depth = 1; depth <= 20; depth += 5) {
    for (uint32_t cols = 1; cols <= 8; ++cols) {
      for (uint32_t rows = 1; rows <= 3; ++rows) {
        GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(4)
          .m(rows).n(cols).k(depth)
          .ks(3)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4223*4bdc9457SAndroid Build Coastguard Worker
// With ks set to 3 and m = 3, sweeps n over [9, 15] and k over 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_small_kernel) {
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(4)
        .m(3).n(cols).k(depth)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4240*4bdc9457SAndroid Build Coastguard Worker
// With ks set to 3 and m = 3, runs n = 16 and n = 24 against
// k in 1, 6, 11, 16.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, n_div_8_small_kernel) {
  for (uint32_t cols = 16; cols <= 24; cols += 8) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(4)
        .m(3).n(cols).k(depth)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4257*4bdc9457SAndroid Build Coastguard Worker
// With cm_stride set to 11, sweeps k over 1, 6, 11, 16, n over [1, 8] and
// m over [1, 3], one iteration per configuration.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, strided_cm_subtile) {
  for (size_t depth = 1; depth <= 20; depth += 5) {
    for (uint32_t cols = 1; cols <= 8; ++cols) {
      for (uint32_t rows = 1; rows <= 3; ++rows) {
        GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(4)
          .m(rows).n(cols).k(depth)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4277*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 1, 6, 11, 16 with m = 3, n = 8, ks set to 3 and
// a_offset set to 67.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, a_offset) {
  for (size_t depth = 1; depth <= 20; depth += 5) {
    GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(4)
      .m(3).n(8).k(depth)
      .ks(3)
      .a_offset(67)
      .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
4293*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 1, 6, 11, 16 and zero_index over 0, 1, 2 with m = 3, n = 8,
// ks set to 3 and a_offset set to 67.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, zero) {
  for (size_t depth = 1; depth <= 20; depth += 5) {
    for (uint32_t zero_idx = 0; zero_idx < 3; ++zero_idx) {
      GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(4)
        .m(3).n(8).k(depth)
        .ks(3)
        .a_offset(67)
        .zero_index(zero_idx)
        .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4312*4bdc9457SAndroid Build Coastguard Worker
// One run with m = 3, n = 8, k = 4 and cm_stride set to 11.
TEST(F32_IGEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, strided_cm) {
  GemmMicrokernelTester()
    .mr(3).nr(8).kr(1).sr(4)
    .m(3).n(8).k(4)
    .cm_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
}
4325*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
4326*4bdc9457SAndroid Build Coastguard Worker
4327*4bdc9457SAndroid Build Coastguard Worker
4328*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// One run with m = 4, n = 8 and k = 1.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1) {
  GemmMicrokernelTester()
    .mr(4).nr(8).kr(1).sr(1)
    .m(4).n(8).k(1)
    .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
}
4340*4bdc9457SAndroid Build Coastguard Worker
// One run with m = 4, n = 8, k = 1 and cn_stride set to 11.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(4).nr(8).kr(1).sr(1)
    .m(4).n(8).k(1)
    .cn_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
}
4353*4bdc9457SAndroid Build Coastguard Worker
// Sweeps every (n, m) pair with n in [1, 8] and m in [1, 4] at k = 1,
// using a single iteration per configuration.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile) {
  for (uint32_t cols = 1; cols <= 8; ++cols) {
    for (uint32_t rows = 1; rows <= 4; ++rows) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(1)
        .m(rows).n(cols).k(1)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4370*4bdc9457SAndroid Build Coastguard Worker
// Sweeps m over [1, 4] with n = 8 and k = 1, one iteration each.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_m) {
  for (uint32_t rows = 1; rows <= 4; ++rows) {
    GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(1)
      .m(rows).n(8).k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
4385*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over [1, 8] with m = 4 and k = 1, one iteration each.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_n) {
  for (uint32_t cols = 1; cols <= 8; ++cols) {
    GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(1)
      .m(4).n(cols).k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
4400*4bdc9457SAndroid Build Coastguard Worker
// Runs the full 4x8 problem for every k from 2 up to (but excluding) 10.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1) {
  for (size_t k_size = 2; k_size < 10; ++k_size) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(1)
        .m(4).n(8).k(k_size)
        .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
4414*4bdc9457SAndroid Build Coastguard Worker
// For each k in [2, 10), sweeps every (n, m) pair with n in 1..8 and m in 1..4;
// one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_subtile) {
  for (size_t k_size = 2; k_size < 10; ++k_size) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
4433*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15 and k over {1, 3, 5} with m fixed at 4.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(4).n(n_size).k(k_size)
          .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4449*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (n in 9..15, k in {1, 3, 5}, m = 4) with cn_stride set to 11.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_cn) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(4).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4466*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15, k over {1, 3, 5} and m over 1..4; one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_subtile) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
4485*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over {16, 24} and k over {1, 3, 5} with m fixed at 4.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(4).n(n_size).k(k_size)
          .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4501*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (n in {16, 24}, k in {1, 3, 5}, m = 4) with cn_stride set to 11.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_cn) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(4).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4518*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over {16, 24}, k over {1, 3, 5} and m over 1..4; one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_subtile) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
4537*4bdc9457SAndroid Build Coastguard Worker
// Runs the full 4x8 problem with ks set to 3 for k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, small_kernel) {
  for (size_t k_size = 1; k_size <= 5; k_size += 2) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(1)
        .m(4).n(8).k(k_size)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
4552*4bdc9457SAndroid Build Coastguard Worker
// With ks set to 3, sweeps k over {1, 3, 5}, n over 1..8 and m over 1..4;
// one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, small_kernel_subtile) {
  for (size_t k_size = 1; k_size <= 5; k_size += 2) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .ks(3)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
4572*4bdc9457SAndroid Build Coastguard Worker
// With ks set to 3, sweeps n over 9..15 and k over {1, 3, 5} with m fixed at 4.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_small_kernel) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(4).n(n_size).k(k_size)
          .ks(3)
          .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4589*4bdc9457SAndroid Build Coastguard Worker
// With ks set to 3, sweeps n over {16, 24} and k over {1, 3, 5} with m fixed at 4.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_small_kernel) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(4).n(n_size).k(k_size)
          .ks(3)
          .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4606*4bdc9457SAndroid Build Coastguard Worker
// With cm_stride set to 11, sweeps k over {1, 3, 5}, n over 1..8 and m over 1..4;
// one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm_subtile) {
  for (size_t k_size = 1; k_size <= 5; k_size += 2) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .cm_stride(11)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
4626*4bdc9457SAndroid Build Coastguard Worker
// Runs the full 4x8 problem with ks set to 3 and a_offset set to 23 for k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, a_offset) {
  for (size_t k_size = 1; k_size <= 5; k_size += 2) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(1)
        .m(4).n(8).k(k_size)
        .ks(3)
        .a_offset(23)
        .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
4642*4bdc9457SAndroid Build Coastguard Worker
// Same setup as the a_offset test (ks = 3, a_offset = 23, k in {1, 3, 5}),
// additionally sweeping zero_index over 0..3.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, zero) {
  for (size_t k_size = 1; k_size <= 5; k_size += 2) {
    for (uint32_t zero_idx = 0; zero_idx < 4; ++zero_idx) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(4).n(8).k(k_size)
          .ks(3)
          .a_offset(23)
          .zero_index(zero_idx)
          .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4661*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 4, n = 8, k = 1 with cm_stride set to 11.
TEST(F32_IGEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm) {
  GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(1)
      .m(4).n(8).k(1)
      .cm_stride(11)
      .Test(xnn_f32_igemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
}
4674*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
4675*4bdc9457SAndroid Build Coastguard Worker
4676*4bdc9457SAndroid Build Coastguard Worker
4677*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// Single configuration: m = 4, n = 8, k = 4.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_eq_4) {
  GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(8).k(4)
      .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
}
4689*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 4, n = 8, k = 4 with cn_stride set to 11.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, strided_cn) {
  GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(8).k(4)
      .cn_stride(11)
      .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
}
4702*4bdc9457SAndroid Build Coastguard Worker
// With k fixed at 4, sweeps n over 1..8 and m over 1..4; one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile) {
  for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
    for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(m_size).n(n_size).k(4)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4719*4bdc9457SAndroid Build Coastguard Worker
// Sweeps m over 1..4 with n fixed at 8 and k fixed at 4; one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_m) {
  for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(m_size).n(8).k(4)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
4734*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 1..8 with m fixed at 4 and k fixed at 4; one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_n) {
  for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(n_size).k(4)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
4749*4bdc9457SAndroid Build Coastguard Worker
// Runs the full 4x8 problem for k in 1..3.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_lt_4) {
  for (size_t k_size = 1; k_size < 4; ++k_size) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(8).k(k_size)
        .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
4763*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 1..3, n over 1..8 and m over 1..4; one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_subtile) {
  for (size_t k_size = 1; k_size < 4; ++k_size) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(4)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4782*4bdc9457SAndroid Build Coastguard Worker
// Runs the full 4x8 problem for k in 5..7.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_gt_4) {
  for (size_t k_size = 5; k_size < 8; ++k_size) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(8).k(k_size)
        .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
4796*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 5..7, n over 1..8 and m over 1..4; one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_subtile) {
  for (size_t k_size = 5; k_size < 8; ++k_size) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(4)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4815*4bdc9457SAndroid Build Coastguard Worker
// Runs the full 4x8 problem for k = 8, 12, ..., 40.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_div_4) {
  for (size_t k_size = 8; k_size <= 40; k_size += 4) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(8).k(k_size)
        .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
4829*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 8, 12, ..., 40, n over 1..8 and m over 1..4; one iteration per configuration.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_div_4_subtile) {
  for (size_t k_size = 8; k_size <= 40; k_size += 4) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(4)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4848*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15 and k over {1, 6, 11, 16} with m fixed at 4.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, n_gt_8) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(4).n(n_size).k(k_size)
          .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4864*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (n in 9..15, k in {1, 6, 11, 16}, m = 4) with cn_stride set to 11.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_cn) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(4).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4881*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 9..15, k = 1, 6, 11, 16 and m = 1..4, one iteration per
// combination.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_subtile) {
  for (uint32_t n_val = 9; n_val <= 15; ++n_val) {
    for (size_t k_val = 1; k_val <= 20; k_val += 5) {
      for (uint32_t m_val = 1; m_val <= 4; ++m_val) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(4)
            .m(m_val).n(n_val).k(k_val)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4900*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8s4 kernel for n = 16 and 24, k = 1, 6, 11, 16, with m fixed at 4.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, n_div_8) {
  for (uint32_t n_val = 16; n_val <= 24; n_val += 8) {
    for (size_t k_val = 1; k_val <= 20; k_val += 5) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(4).n(n_val).k(k_val)
          .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4916*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (n = 16 and 24, k = 1, 6, 11, 16, m = 4), but with
// cn_stride set to 11.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_cn) {
  for (uint32_t n_val = 16; n_val <= 24; n_val += 8) {
    for (size_t k_val = 1; k_val <= 20; k_val += 5) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(4).n(n_val).k(k_val)
          .cn_stride(11)
          .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4933*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 16 and 24, k = 1, 6, 11, 16 and m = 1..4, one iteration per
// combination.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, n_div_8_subtile) {
  for (uint32_t n_val = 16; n_val <= 24; n_val += 8) {
    for (size_t k_val = 1; k_val <= 20; k_val += 5) {
      for (uint32_t m_val = 1; m_val <= 4; ++m_val) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(4)
            .m(m_val).n(n_val).k(k_val)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4952*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8s4 kernel with ks = 3 for k = 1, 6, 11, 16 at m = 4, n = 8.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, small_kernel) {
  for (size_t k_val = 1; k_val <= 20; k_val += 5) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(8).k(k_val)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
4967*4bdc9457SAndroid Build Coastguard Worker
// With ks = 3, sweeps k = 1, 6, 11, 16, n = 1..8 and m = 1..4, one iteration
// per combination.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, small_kernel_subtile) {
  for (size_t k_val = 1; k_val <= 20; k_val += 5) {
    for (uint32_t n_val = 1; n_val <= 8; ++n_val) {
      for (uint32_t m_val = 1; m_val <= 4; ++m_val) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(4)
            .m(m_val).n(n_val).k(k_val)
            .ks(3)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4987*4bdc9457SAndroid Build Coastguard Worker
// With ks = 3, runs n = 9..15 and k = 1, 6, 11, 16 at m = 4.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_small_kernel) {
  for (uint32_t n_val = 9; n_val <= 15; ++n_val) {
    for (size_t k_val = 1; k_val <= 20; k_val += 5) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(4).n(n_val).k(k_val)
          .ks(3)
          .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
5004*4bdc9457SAndroid Build Coastguard Worker
// With ks = 3, runs n = 16 and 24 and k = 1, 6, 11, 16 at m = 4.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, n_div_8_small_kernel) {
  for (uint32_t n_val = 16; n_val <= 24; n_val += 8) {
    for (size_t k_val = 1; k_val <= 20; k_val += 5) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(4).n(n_val).k(k_val)
          .ks(3)
          .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
5021*4bdc9457SAndroid Build Coastguard Worker
// With cm_stride = 11, sweeps k = 1, 6, 11, 16, n = 1..8 and m = 1..4, one
// iteration per combination.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, strided_cm_subtile) {
  for (size_t k_val = 1; k_val <= 20; k_val += 5) {
    for (uint32_t n_val = 1; n_val <= 8; ++n_val) {
      for (uint32_t m_val = 1; m_val <= 4; ++m_val) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(4)
            .m(m_val).n(n_val).k(k_val)
            .cm_stride(11)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
5041*4bdc9457SAndroid Build Coastguard Worker
// With ks = 3 and a_offset = 83, runs k = 1, 6, 11, 16 at m = 4, n = 8.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, a_offset) {
  for (size_t k_val = 1; k_val <= 20; k_val += 5) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(8).k(k_val)
        .ks(3)
        .a_offset(83)
        .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
5057*4bdc9457SAndroid Build Coastguard Worker
// With ks = 3 and a_offset = 83, sweeps k = 1, 6, 11, 16 and zero_index = 0..3
// at m = 4, n = 8.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, zero) {
  for (size_t k_val = 1; k_val <= 20; k_val += 5) {
    for (uint32_t zero_idx = 0; zero_idx <= 3; ++zero_idx) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(4).n(8).k(k_val)
          .ks(3)
          .a_offset(83)
          .zero_index(zero_idx)
          .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
5076*4bdc9457SAndroid Build Coastguard Worker
// Single run at m = 4, n = 8, k = 4 with cm_stride set to 11.
TEST(F32_IGEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, strided_cm) {
  GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(8).k(4)
      .cm_stride(11)
      .Test(xnn_f32_igemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
}
5089*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
5090*4bdc9457SAndroid Build Coastguard Worker
5091*4bdc9457SAndroid Build Coastguard Worker
5092*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// Single run of the 5x8 loadsplat kernel at m = 5, n = 8, k = 1.
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1) {
  GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(1)
      .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
}
5104*4bdc9457SAndroid Build Coastguard Worker
// Single run at m = 5, n = 8, k = 1 with cn_stride set to 11.
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cn) {
  GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(1)
      .cn_stride(11)
      .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
}
5117*4bdc9457SAndroid Build Coastguard Worker
// At k = 1, sweeps n = 1..8 and m = 1..5, one iteration per combination.
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile) {
  for (uint32_t n_val = 1; n_val <= 8; ++n_val) {
    for (uint32_t m_val = 1; m_val <= 5; ++m_val) {
      GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(m_val).n(n_val).k(1)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5134*4bdc9457SAndroid Build Coastguard Worker
// At k = 1 and n = 8, sweeps m = 1..5 with one iteration each.
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_m) {
  for (uint32_t m_val = 1; m_val <= 5; ++m_val) {
    GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(m_val).n(8).k(1)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5149*4bdc9457SAndroid Build Coastguard Worker
// At k = 1 and m = 5, sweeps n = 1..8 with one iteration each.
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_n) {
  for (uint32_t n_val = 1; n_val <= 8; ++n_val) {
    GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(n_val).k(1)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5164*4bdc9457SAndroid Build Coastguard Worker
// Runs k = 2..9 at m = 5, n = 8.
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1) {
  for (size_t k_val = 2; k_val <= 9; ++k_val) {
    GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(8).k(k_val)
        .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5178*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 2..9, n = 1..8 and m = 1..5, one iteration per combination.
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_subtile) {
  for (size_t k_val = 2; k_val <= 9; ++k_val) {
    for (uint32_t n_val = 1; n_val <= 8; ++n_val) {
      for (uint32_t m_val = 1; m_val <= 5; ++m_val) {
        GemmMicrokernelTester()
            .mr(5).nr(8).kr(1).sr(1)
            .m(m_val).n(n_val).k(k_val)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5197*4bdc9457SAndroid Build Coastguard Worker
// Runs n = 9..15 and k = 1, 3, 5 with m fixed at 5.
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8) {
  for (uint32_t n_val = 9; n_val <= 15; ++n_val) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(5).n(n_val).k(k_val)
          .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5213*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (n = 9..15, k = 1, 3, 5, m = 5), but with cn_stride
// set to 11.
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_cn) {
  for (uint32_t n_val = 9; n_val <= 15; ++n_val) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(5).n(n_val).k(k_val)
          .cn_stride(11)
          .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5230*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 9..15, k = 1, 3, 5 and m = 1..5, one iteration per combination.
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_subtile) {
  for (uint32_t n_val = 9; n_val <= 15; ++n_val) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      for (uint32_t m_val = 1; m_val <= 5; ++m_val) {
        GemmMicrokernelTester()
            .mr(5).nr(8).kr(1).sr(1)
            .m(m_val).n(n_val).k(k_val)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5249*4bdc9457SAndroid Build Coastguard Worker
// Runs n = 16 and 24 and k = 1, 3, 5 with m fixed at 5.
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8) {
  for (uint32_t n_val = 16; n_val <= 24; n_val += 8) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(5).n(n_val).k(k_val)
          .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5265*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (n = 16 and 24, k = 1, 3, 5, m = 5), but with
// cn_stride set to 11.
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_cn) {
  for (uint32_t n_val = 16; n_val <= 24; n_val += 8) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(5).n(n_val).k(k_val)
          .cn_stride(11)
          .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5282*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 16 and 24, k = 1, 3, 5 and m = 1..5, one iteration per
// combination.
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_subtile) {
  for (uint32_t n_val = 16; n_val <= 24; n_val += 8) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      for (uint32_t m_val = 1; m_val <= 5; ++m_val) {
        GemmMicrokernelTester()
            .mr(5).nr(8).kr(1).sr(1)
            .m(m_val).n(n_val).k(k_val)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5301*4bdc9457SAndroid Build Coastguard Worker
// With ks = 3, runs k = 1, 3, 5 at m = 5, n = 8.
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, small_kernel) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(8).k(k_val)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5316*4bdc9457SAndroid Build Coastguard Worker
// With ks = 3, sweeps k = 1, 3, 5, n = 1..8 and m = 1..5, one iteration per
// combination.
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, small_kernel_subtile) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    for (uint32_t n_val = 1; n_val <= 8; ++n_val) {
      for (uint32_t m_val = 1; m_val <= 5; ++m_val) {
        GemmMicrokernelTester()
            .mr(5).nr(8).kr(1).sr(1)
            .m(m_val).n(n_val).k(k_val)
            .ks(3)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5336*4bdc9457SAndroid Build Coastguard Worker
// With ks = 3, runs n = 9..15 and k = 1, 3, 5 at m = 5.
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_small_kernel) {
  for (uint32_t n_val = 9; n_val <= 15; ++n_val) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(5).n(n_val).k(k_val)
          .ks(3)
          .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5353*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_small_kernel) {
  // n takes the values 16 and 24 (step 8) with m fixed at 5; k takes
  // {1, 3, 5} and ks(3) is set.
  for (uint32_t cur_n = 16; cur_n < 25; cur_n += 8) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(cur_n).k(cur_k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5370*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm_subtile) {
  // Sweeps k over {1, 3, 5}, n over 1..8 and m over 1..5 with cm_stride(11);
  // each configuration is run for a single iteration.
  for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
    for (uint32_t cur_n = 1; cur_n < 9; ++cur_n) {
      for (uint32_t cur_m = 1; cur_m < 6; ++cur_m) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(cur_m).n(cur_n).k(cur_k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5390*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, a_offset) {
  // Full m=5, n=8 case with ks(3) and a_offset(29); k takes {1, 3, 5}.
  for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(cur_k)
      .ks(3)
      .a_offset(29)
      .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5406*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, zero) {
  // Same setup as the a_offset case (ks(3), a_offset(29)), additionally
  // passing each zero_index from 0 through 4; k takes {1, 3, 5}.
  for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
    for (uint32_t zero_idx = 0; zero_idx <= 4; ++zero_idx) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(8).k(cur_k)
        .ks(3)
        .a_offset(29)
        .zero_index(zero_idx)
        .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5425*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm) {
  // Single configuration: m=5, n=8, k=1 with cm_stride(11).
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(1)
    .m(5).n(8).k(1)
    .cm_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
}
5438*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
5439*4bdc9457SAndroid Build Coastguard Worker
5440*4bdc9457SAndroid Build Coastguard Worker
5441*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1) {
  // Single configuration: m=6, n=8, k=1.
  GemmMicrokernelTester()
    .mr(6).nr(8).kr(1).sr(1)
    .m(6).n(8).k(1)
    .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
}
5453*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cn) {
  // Single configuration: m=6, n=8, k=1 with cn_stride(11).
  GemmMicrokernelTester()
    .mr(6).nr(8).kr(1).sr(1)
    .m(6).n(8).k(1)
    .cn_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
}
5466*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile) {
  // k is fixed at 1; n sweeps 1..8 and m sweeps 1..6, one iteration each.
  for (uint32_t cur_n = 1; cur_n < 9; ++cur_n) {
    for (uint32_t cur_m = 1; cur_m < 7; ++cur_m) {
      GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(cur_m).n(cur_n).k(1)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5483*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_m) {
  // k=1 and n=8 are fixed; m sweeps 1..6, one iteration each.
  for (uint32_t cur_m = 1; cur_m < 7; ++cur_m) {
    GemmMicrokernelTester()
      .mr(6).nr(8).kr(1).sr(1)
      .m(cur_m).n(8).k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5498*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_n) {
  // k=1 and m=6 are fixed; n sweeps 1..8, one iteration each.
  for (uint32_t cur_n = 1; cur_n < 9; ++cur_n) {
    GemmMicrokernelTester()
      .mr(6).nr(8).kr(1).sr(1)
      .m(6).n(cur_n).k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5513*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1) {
  // m=6 and n=8 are fixed; k sweeps every value from 2 through 9.
  for (size_t cur_k = 2; cur_k <= 9; ++cur_k) {
    GemmMicrokernelTester()
      .mr(6).nr(8).kr(1).sr(1)
      .m(6).n(8).k(cur_k)
      .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5527*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_subtile) {
  // k sweeps 2..9, n sweeps 1..8 and m sweeps 1..6; one iteration each.
  for (size_t cur_k = 2; cur_k <= 9; ++cur_k) {
    for (uint32_t cur_n = 1; cur_n < 9; ++cur_n) {
      for (uint32_t cur_m = 1; cur_m < 7; ++cur_m) {
        GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(cur_m).n(cur_n).k(cur_k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5546*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8) {
  // n runs over 9..15 with m fixed at 6; k takes {1, 3, 5}.
  for (uint32_t cur_n = 9; cur_n <= 15; ++cur_n) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(6).n(cur_n).k(cur_k)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5562*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_cn) {
  // n runs over 9..15 with m fixed at 6 and cn_stride(11); k takes {1, 3, 5}.
  for (uint32_t cur_n = 9; cur_n <= 15; ++cur_n) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(6).n(cur_n).k(cur_k)
        .cn_stride(11)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5579*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_subtile) {
  // n runs over 9..15, k takes {1, 3, 5} and m sweeps 1..6; one iteration
  // per configuration.
  for (uint32_t cur_n = 9; cur_n <= 15; ++cur_n) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      for (uint32_t cur_m = 1; cur_m < 7; ++cur_m) {
        GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(cur_m).n(cur_n).k(cur_k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5598*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8) {
  // n takes the values 16 and 24 (step 8) with m fixed at 6; k takes {1, 3, 5}.
  for (uint32_t cur_n = 16; cur_n < 25; cur_n += 8) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(6).n(cur_n).k(cur_k)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5614*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_cn) {
  // n takes the values 16 and 24 (step 8) with m fixed at 6 and
  // cn_stride(11); k takes {1, 3, 5}.
  for (uint32_t cur_n = 16; cur_n < 25; cur_n += 8) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(6).n(cur_n).k(cur_k)
        .cn_stride(11)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5631*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_subtile) {
  // n takes the values 16 and 24 (step 8), k takes {1, 3, 5} and m sweeps
  // 1..6; one iteration per configuration.
  for (uint32_t cur_n = 16; cur_n < 25; cur_n += 8) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      for (uint32_t cur_m = 1; cur_m < 7; ++cur_m) {
        GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(cur_m).n(cur_n).k(cur_k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5650*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, small_kernel) {
  // m=6 and n=8 are fixed with ks(3) set; k takes {1, 3, 5}.
  for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
    GemmMicrokernelTester()
      .mr(6).nr(8).kr(1).sr(1)
      .m(6).n(8).k(cur_k)
      .ks(3)
      .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5665*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, small_kernel_subtile) {
  // Sweeps k over {1, 3, 5}, n over 1..8 and m over 1..6 with ks(3) set;
  // each configuration is run for a single iteration.
  for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
    for (uint32_t cur_n = 1; cur_n < 9; ++cur_n) {
      for (uint32_t cur_m = 1; cur_m < 7; ++cur_m) {
        GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(cur_m).n(cur_n).k(cur_k)
          .ks(3)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5685*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_small_kernel) {
  // n runs over 9..15 with m fixed at 6; k takes {1, 3, 5} and ks(3) is set.
  for (uint32_t cur_n = 9; cur_n <= 15; ++cur_n) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(6).n(cur_n).k(cur_k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5702*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_small_kernel) {
  // n takes the values 16 and 24 (step 8) with m fixed at 6; k takes
  // {1, 3, 5} and ks(3) is set.
  for (uint32_t cur_n = 16; cur_n < 25; cur_n += 8) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(6).n(cur_n).k(cur_k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5719*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm_subtile) {
  // Sweeps k over {1, 3, 5}, n over 1..8 and m over 1..6 with cm_stride(11);
  // each configuration is run for a single iteration.
  for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
    for (uint32_t cur_n = 1; cur_n < 9; ++cur_n) {
      for (uint32_t cur_m = 1; cur_m < 7; ++cur_m) {
        GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(cur_m).n(cur_n).k(cur_k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5739*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, a_offset) {
  // Full m=6, n=8 case with ks(3) and a_offset(37); k takes {1, 3, 5}.
  for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
    GemmMicrokernelTester()
      .mr(6).nr(8).kr(1).sr(1)
      .m(6).n(8).k(cur_k)
      .ks(3)
      .a_offset(37)
      .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5755*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, zero) {
  // Same setup as the a_offset case (ks(3), a_offset(37)), additionally
  // passing each zero_index from 0 through 5; k takes {1, 3, 5}.
  for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
    for (uint32_t zero_idx = 0; zero_idx <= 5; ++zero_idx) {
      GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(6).n(8).k(cur_k)
        .ks(3)
        .a_offset(37)
        .zero_index(zero_idx)
        .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5774*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm) {
  // Single configuration: m=6, n=8, k=1 with cm_stride(11).
  GemmMicrokernelTester()
    .mr(6).nr(8).kr(1).sr(1)
    .m(6).n(8).k(1)
    .cm_stride(11)
    .Test(xnn_f32_igemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
}
5787*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
5788*4bdc9457SAndroid Build Coastguard Worker
5789*4bdc9457SAndroid Build Coastguard Worker
5790*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_IGEMM_RELU_2X4__WASM, k_eq_1) {
  // Single configuration: m=2, n=4, k=1.
  GemmMicrokernelTester()
    .mr(2).nr(4).kr(1).sr(1)
    .m(2).n(4).k(1)
    .Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
}
5802*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_IGEMM_RELU_2X4__WASM, strided_cn) {
  // Single configuration: m=2, n=4, k=1 with cn_stride(7).
  GemmMicrokernelTester()
    .mr(2).nr(4).kr(1).sr(1)
    .m(2).n(4).k(1)
    .cn_stride(7)
    .Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
}
5815*4bdc9457SAndroid Build Coastguard Worker
// Sweeps every (m, n) with m in 1..2 and n in 1..4 at k=1, one iteration each.
TEST(F32_IGEMM_RELU_2X4__WASM, k_eq_1_subtile) {
  for (uint32_t n_size = 1; n_size <= 4; n_size++) {
    for (uint32_t m_size = 1; m_size <= 2; m_size++) {
      auto tester = GemmMicrokernelTester();
      tester.mr(2).nr(4).kr(1).sr(1);
      tester.m(m_size).n(n_size).k(1);
      tester.iterations(1);
      tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
    }
  }
}
5832*4bdc9457SAndroid Build Coastguard Worker
// Sweeps m over 1..2 with n fixed at 4 and k=1, one iteration each.
TEST(F32_IGEMM_RELU_2X4__WASM, k_eq_1_subtile_m) {
  for (uint32_t m_size = 1; m_size <= 2; m_size++) {
    auto tester = GemmMicrokernelTester();
    tester.mr(2).nr(4).kr(1).sr(1);
    tester.m(m_size).n(4).k(1);
    tester.iterations(1);
    tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
  }
}
5847*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 1..4 with m fixed at 2 and k=1, one iteration each.
TEST(F32_IGEMM_RELU_2X4__WASM, k_eq_1_subtile_n) {
  for (uint32_t n_size = 1; n_size <= 4; n_size++) {
    auto tester = GemmMicrokernelTester();
    tester.mr(2).nr(4).kr(1).sr(1);
    tester.m(2).n(n_size).k(1);
    tester.iterations(1);
    tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
  }
}
5862*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 2..9 with m=2 and n=4.
TEST(F32_IGEMM_RELU_2X4__WASM, k_gt_1) {
  for (size_t k_size = 2; k_size < 10; k_size++) {
    auto tester = GemmMicrokernelTester();
    tester.mr(2).nr(4).kr(1).sr(1);
    tester.m(2).n(4).k(k_size);
    tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
  }
}
5876*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 2..9, n over 1..4 and m over 1..2, one iteration per combination.
TEST(F32_IGEMM_RELU_2X4__WASM, k_gt_1_subtile) {
  for (size_t k_size = 2; k_size < 10; k_size++) {
    for (uint32_t n_size = 1; n_size <= 4; n_size++) {
      for (uint32_t m_size = 1; m_size <= 2; m_size++) {
        auto tester = GemmMicrokernelTester();
        tester.mr(2).nr(4).kr(1).sr(1);
        tester.m(m_size).n(n_size).k(k_size);
        tester.iterations(1);
        tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
      }
    }
  }
}
5895*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 5..7 and k over {1, 3, 5} with m=2.
TEST(F32_IGEMM_RELU_2X4__WASM, n_gt_4) {
  for (uint32_t n_size = 5; n_size < 8; n_size++) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      auto tester = GemmMicrokernelTester();
      tester.mr(2).nr(4).kr(1).sr(1);
      tester.m(2).n(n_size).k(k_size);
      tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
    }
  }
}
5911*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 5..7 and k over {1, 3, 5} with m=2 and cn_stride set to 7.
TEST(F32_IGEMM_RELU_2X4__WASM, n_gt_4_strided_cn) {
  for (uint32_t n_size = 5; n_size < 8; n_size++) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      auto tester = GemmMicrokernelTester();
      tester.mr(2).nr(4).kr(1).sr(1);
      tester.m(2).n(n_size).k(k_size);
      tester.cn_stride(7);
      tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
    }
  }
}
5928*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 5..7, k over {1, 3, 5} and m over 1..2, one iteration per combination.
TEST(F32_IGEMM_RELU_2X4__WASM, n_gt_4_subtile) {
  for (uint32_t n_size = 5; n_size < 8; n_size++) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      for (uint32_t m_size = 1; m_size <= 2; m_size++) {
        auto tester = GemmMicrokernelTester();
        tester.mr(2).nr(4).kr(1).sr(1);
        tester.m(m_size).n(n_size).k(k_size);
        tester.iterations(1);
        tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
      }
    }
  }
}
5947*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over {8, 12} and k over {1, 3, 5} with m=2.
TEST(F32_IGEMM_RELU_2X4__WASM, n_div_4) {
  for (uint32_t n_size = 8; n_size <= 12; n_size += 4) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      auto tester = GemmMicrokernelTester();
      tester.mr(2).nr(4).kr(1).sr(1);
      tester.m(2).n(n_size).k(k_size);
      tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
    }
  }
}
5963*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over {8, 12} and k over {1, 3, 5} with m=2 and cn_stride set to 7.
TEST(F32_IGEMM_RELU_2X4__WASM, n_div_4_strided_cn) {
  for (uint32_t n_size = 8; n_size <= 12; n_size += 4) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      auto tester = GemmMicrokernelTester();
      tester.mr(2).nr(4).kr(1).sr(1);
      tester.m(2).n(n_size).k(k_size);
      tester.cn_stride(7);
      tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
    }
  }
}
5980*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over {8, 12}, k over {1, 3, 5} and m over 1..2, one iteration per combination.
TEST(F32_IGEMM_RELU_2X4__WASM, n_div_4_subtile) {
  for (uint32_t n_size = 8; n_size <= 12; n_size += 4) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      for (uint32_t m_size = 1; m_size <= 2; m_size++) {
        auto tester = GemmMicrokernelTester();
        tester.mr(2).nr(4).kr(1).sr(1);
        tester.m(m_size).n(n_size).k(k_size);
        tester.iterations(1);
        tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
      }
    }
  }
}
5999*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over {1, 3, 5} with m=2, n=4 and ks set to 3.
TEST(F32_IGEMM_RELU_2X4__WASM, small_kernel) {
  for (size_t k_size = 1; k_size <= 5; k_size += 2) {
    auto tester = GemmMicrokernelTester();
    tester.mr(2).nr(4).kr(1).sr(1);
    tester.m(2).n(4).k(k_size);
    tester.ks(3);
    tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
  }
}
6014*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over {1, 3, 5}, n over 1..4 and m over 1..2 with ks set to 3,
// one iteration per combination.
TEST(F32_IGEMM_RELU_2X4__WASM, small_kernel_subtile) {
  for (size_t k_size = 1; k_size <= 5; k_size += 2) {
    for (uint32_t n_size = 1; n_size <= 4; n_size++) {
      for (uint32_t m_size = 1; m_size <= 2; m_size++) {
        auto tester = GemmMicrokernelTester();
        tester.mr(2).nr(4).kr(1).sr(1);
        tester.m(m_size).n(n_size).k(k_size);
        tester.ks(3);
        tester.iterations(1);
        tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
      }
    }
  }
}
6034*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 5..7 and k over {1, 3, 5} with m=2 and ks set to 3.
TEST(F32_IGEMM_RELU_2X4__WASM, n_gt_4_small_kernel) {
  for (uint32_t n_size = 5; n_size < 8; n_size++) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      auto tester = GemmMicrokernelTester();
      tester.mr(2).nr(4).kr(1).sr(1);
      tester.m(2).n(n_size).k(k_size);
      tester.ks(3);
      tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
    }
  }
}
6051*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over {8, 12} and k over {1, 3, 5} with m=2 and ks set to 3.
TEST(F32_IGEMM_RELU_2X4__WASM, n_div_4_small_kernel) {
  for (uint32_t n_size = 8; n_size <= 12; n_size += 4) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      auto tester = GemmMicrokernelTester();
      tester.mr(2).nr(4).kr(1).sr(1);
      tester.m(2).n(n_size).k(k_size);
      tester.ks(3);
      tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
    }
  }
}
6068*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over {1, 3, 5}, n over 1..4 and m over 1..2 with cm_stride set to 7,
// one iteration per combination.
TEST(F32_IGEMM_RELU_2X4__WASM, strided_cm_subtile) {
  for (size_t k_size = 1; k_size <= 5; k_size += 2) {
    for (uint32_t n_size = 1; n_size <= 4; n_size++) {
      for (uint32_t m_size = 1; m_size <= 2; m_size++) {
        auto tester = GemmMicrokernelTester();
        tester.mr(2).nr(4).kr(1).sr(1);
        tester.m(m_size).n(n_size).k(k_size);
        tester.cm_stride(7);
        tester.iterations(1);
        tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
      }
    }
  }
}
6088*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over {1, 3, 5} with m=2, n=4, ks set to 3 and a_offset set to 13.
TEST(F32_IGEMM_RELU_2X4__WASM, a_offset) {
  for (size_t k_size = 1; k_size <= 5; k_size += 2) {
    auto tester = GemmMicrokernelTester();
    tester.mr(2).nr(4).kr(1).sr(1);
    tester.m(2).n(4).k(k_size);
    tester.ks(3);
    tester.a_offset(13);
    tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
  }
}
6104*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over {1, 3, 5} and zero_index over 0..1 with m=2, n=4, ks set to 3
// and a_offset set to 13.
TEST(F32_IGEMM_RELU_2X4__WASM, zero) {
  for (size_t k_size = 1; k_size <= 5; k_size += 2) {
    for (uint32_t zero_idx = 0; zero_idx < 2; zero_idx++) {
      auto tester = GemmMicrokernelTester();
      tester.mr(2).nr(4).kr(1).sr(1);
      tester.m(2).n(4).k(k_size);
      tester.ks(3);
      tester.a_offset(13);
      tester.zero_index(zero_idx);
      tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
    }
  }
}
6123*4bdc9457SAndroid Build Coastguard Worker
// Runs the m=2, n=4, k=1 configuration once with cm_stride set to 7.
TEST(F32_IGEMM_RELU_2X4__WASM, strided_cm) {
  auto tester = GemmMicrokernelTester();
  tester.mr(2).nr(4).kr(1).sr(1);
  tester.m(2).n(4).k(1);
  tester.cm_stride(7);
  tester.Test(xnn_f32_igemm_relu_ukernel_2x4__wasm);
}
6136*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
6137*4bdc9457SAndroid Build Coastguard Worker
6138*4bdc9457SAndroid Build Coastguard Worker
6139*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Runs xnn_f32_igemm_relu_ukernel_4x2__wasm once with m=4, n=2, k=1.
TEST(F32_IGEMM_RELU_4X2__WASM, k_eq_1) {
  auto tester = GemmMicrokernelTester();
  tester.mr(4).nr(2).kr(1).sr(1);
  tester.m(4).n(2).k(1);
  tester.Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
}
6151*4bdc9457SAndroid Build Coastguard Worker
// Same m=4, n=2, k=1 configuration as k_eq_1, with cn_stride set to 5.
TEST(F32_IGEMM_RELU_4X2__WASM, strided_cn) {
  auto tester = GemmMicrokernelTester();
  tester.mr(4).nr(2).kr(1).sr(1);
  tester.m(4).n(2).k(1);
  tester.cn_stride(5);
  tester.Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
}
6164*4bdc9457SAndroid Build Coastguard Worker
// Sweeps every (m, n) with m in 1..4 and n in 1..2 at k=1, one iteration each.
TEST(F32_IGEMM_RELU_4X2__WASM, k_eq_1_subtile) {
  for (uint32_t n_size = 1; n_size <= 2; n_size++) {
    for (uint32_t m_size = 1; m_size <= 4; m_size++) {
      auto tester = GemmMicrokernelTester();
      tester.mr(4).nr(2).kr(1).sr(1);
      tester.m(m_size).n(n_size).k(1);
      tester.iterations(1);
      tester.Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
    }
  }
}
6181*4bdc9457SAndroid Build Coastguard Worker
// Sweeps m over 1..4 with n fixed at 2 and k=1, one iteration each.
TEST(F32_IGEMM_RELU_4X2__WASM, k_eq_1_subtile_m) {
  for (uint32_t m_size = 1; m_size <= 4; m_size++) {
    auto tester = GemmMicrokernelTester();
    tester.mr(4).nr(2).kr(1).sr(1);
    tester.m(m_size).n(2).k(1);
    tester.iterations(1);
    tester.Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
  }
}
6196*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 1..2 with m fixed at 4 and k=1, one iteration each.
TEST(F32_IGEMM_RELU_4X2__WASM, k_eq_1_subtile_n) {
  for (uint32_t n_size = 1; n_size <= 2; n_size++) {
    auto tester = GemmMicrokernelTester();
    tester.mr(4).nr(2).kr(1).sr(1);
    tester.m(4).n(n_size).k(1);
    tester.iterations(1);
    tester.Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
  }
}
6211*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 2..9 with m=4 and n=2.
TEST(F32_IGEMM_RELU_4X2__WASM, k_gt_1) {
  for (size_t k_size = 2; k_size < 10; k_size++) {
    auto tester = GemmMicrokernelTester();
    tester.mr(4).nr(2).kr(1).sr(1);
    tester.m(4).n(2).k(k_size);
    tester.Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
  }
}
6225*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 2..9, n over 1..2 and m over 1..4, one iteration per combination.
TEST(F32_IGEMM_RELU_4X2__WASM, k_gt_1_subtile) {
  for (size_t k_size = 2; k_size < 10; k_size++) {
    for (uint32_t n_size = 1; n_size <= 2; n_size++) {
      for (uint32_t m_size = 1; m_size <= 4; m_size++) {
        auto tester = GemmMicrokernelTester();
        tester.mr(4).nr(2).kr(1).sr(1);
        tester.m(m_size).n(n_size).k(k_size);
        tester.iterations(1);
        tester.Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
      }
    }
  }
}
6244*4bdc9457SAndroid Build Coastguard Worker
// Runs n=3 (the only value in the 3..3 range) against k over {1, 3, 5} with m=4.
TEST(F32_IGEMM_RELU_4X2__WASM, n_gt_2) {
  for (uint32_t n_size = 3; n_size < 4; n_size++) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      auto tester = GemmMicrokernelTester();
      tester.mr(4).nr(2).kr(1).sr(1);
      tester.m(4).n(n_size).k(k_size);
      tester.Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
    }
  }
}
6260*4bdc9457SAndroid Build Coastguard Worker
// Runs n=3 against k over {1, 3, 5} with m=4 and cn_stride set to 5.
TEST(F32_IGEMM_RELU_4X2__WASM, n_gt_2_strided_cn) {
  for (uint32_t n_size = 3; n_size < 4; n_size++) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      auto tester = GemmMicrokernelTester();
      tester.mr(4).nr(2).kr(1).sr(1);
      tester.m(4).n(n_size).k(k_size);
      tester.cn_stride(5);
      tester.Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
    }
  }
}
6277*4bdc9457SAndroid Build Coastguard Worker
// Runs n=3 against k over {1, 3, 5} and m over 1..4, one iteration per combination.
TEST(F32_IGEMM_RELU_4X2__WASM, n_gt_2_subtile) {
  for (uint32_t n_size = 3; n_size < 4; n_size++) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      for (uint32_t m_size = 1; m_size <= 4; m_size++) {
        auto tester = GemmMicrokernelTester();
        tester.mr(4).nr(2).kr(1).sr(1);
        tester.m(m_size).n(n_size).k(k_size);
        tester.iterations(1);
        tester.Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
      }
    }
  }
}
6296*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over {4, 6} and k over {1, 3, 5} with m=4.
TEST(F32_IGEMM_RELU_4X2__WASM, n_div_2) {
  for (uint32_t n_size = 4; n_size <= 6; n_size += 2) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      auto tester = GemmMicrokernelTester();
      tester.mr(4).nr(2).kr(1).sr(1);
      tester.m(4).n(n_size).k(k_size);
      tester.Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
    }
  }
}
6312*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over {4, 6} and k over {1, 3, 5} with m=4 and cn_stride set to 5.
TEST(F32_IGEMM_RELU_4X2__WASM, n_div_2_strided_cn) {
  for (uint32_t n_size = 4; n_size <= 6; n_size += 2) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      auto tester = GemmMicrokernelTester();
      tester.mr(4).nr(2).kr(1).sr(1);
      tester.m(4).n(n_size).k(k_size);
      tester.cn_stride(5);
      tester.Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
    }
  }
}
6329*4bdc9457SAndroid Build Coastguard Worker
// 4x2 WASM kernel: n in {4, 6}, k in {1, 3, 5}, m in 1..4, one iteration per case.
TEST(F32_IGEMM_RELU_4X2__WASM, n_div_2_subtile) {
  for (uint32_t n_val = 4; n_val <= 6; n_val += 2) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      for (uint32_t m_val = 1; m_val <= 4; m_val++) {
        GemmMicrokernelTester()
            .mr(4).nr(2).kr(1).sr(1)
            .m(m_val).n(n_val).k(k_val)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
      }
    }
  }
}
6348*4bdc9457SAndroid Build Coastguard Worker
// 4x2 WASM kernel: m = 4, n = 2, ks = 3, k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_4X2__WASM, small_kernel) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    GemmMicrokernelTester()
        .mr(4).nr(2).kr(1).sr(1)
        .m(4).n(2).k(k_val)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
  }
}
6363*4bdc9457SAndroid Build Coastguard Worker
// 4x2 WASM kernel: ks = 3, k in {1, 3, 5}, n in 1..2, m in 1..4, one iteration per case.
TEST(F32_IGEMM_RELU_4X2__WASM, small_kernel_subtile) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    for (uint32_t n_val = 1; n_val <= 2; n_val++) {
      for (uint32_t m_val = 1; m_val <= 4; m_val++) {
        GemmMicrokernelTester()
            .mr(4).nr(2).kr(1).sr(1)
            .m(m_val).n(n_val).k(k_val)
            .ks(3)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
      }
    }
  }
}
6383*4bdc9457SAndroid Build Coastguard Worker
// 4x2 WASM kernel: m = 4, ks = 3, n = 3 (the only value in [3, 4)), k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_4X2__WASM, n_gt_2_small_kernel) {
  for (uint32_t n_val = 3; n_val < 4; n_val++) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(2).kr(1).sr(1)
          .m(4).n(n_val).k(k_val)
          .ks(3)
          .Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
    }
  }
}
6400*4bdc9457SAndroid Build Coastguard Worker
// 4x2 WASM kernel: m = 4, ks = 3, n in {4, 6}, k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_4X2__WASM, n_div_2_small_kernel) {
  for (uint32_t n_val = 4; n_val <= 6; n_val += 2) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(2).kr(1).sr(1)
          .m(4).n(n_val).k(k_val)
          .ks(3)
          .Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
    }
  }
}
6417*4bdc9457SAndroid Build Coastguard Worker
// 4x2 WASM kernel: cm_stride = 5, k in {1, 3, 5}, n in 1..2, m in 1..4, one iteration per case.
TEST(F32_IGEMM_RELU_4X2__WASM, strided_cm_subtile) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    for (uint32_t n_val = 1; n_val <= 2; n_val++) {
      for (uint32_t m_val = 1; m_val <= 4; m_val++) {
        GemmMicrokernelTester()
            .mr(4).nr(2).kr(1).sr(1)
            .m(m_val).n(n_val).k(k_val)
            .cm_stride(5)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
      }
    }
  }
}
6437*4bdc9457SAndroid Build Coastguard Worker
// 4x2 WASM kernel: m = 4, n = 2, ks = 3, a_offset = 23, k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_4X2__WASM, a_offset) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    GemmMicrokernelTester()
        .mr(4).nr(2).kr(1).sr(1)
        .m(4).n(2).k(k_val)
        .ks(3)
        .a_offset(23)
        .Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
  }
}
6453*4bdc9457SAndroid Build Coastguard Worker
// 4x2 WASM kernel: m = 4, n = 2, ks = 3, a_offset = 23, k in {1, 3, 5},
// with zero_index swept over 0..3.
TEST(F32_IGEMM_RELU_4X2__WASM, zero) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    for (uint32_t zero_idx = 0; zero_idx < 4; zero_idx++) {
      GemmMicrokernelTester()
          .mr(4).nr(2).kr(1).sr(1)
          .m(4).n(2).k(k_val)
          .ks(3)
          .a_offset(23)
          .zero_index(zero_idx)
          .Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
    }
  }
}
6472*4bdc9457SAndroid Build Coastguard Worker
// 4x2 WASM kernel: single case with m = 4, n = 2, k = 1 and cm_stride = 5.
TEST(F32_IGEMM_RELU_4X2__WASM, strided_cm) {
  GemmMicrokernelTester()
      .mr(4).nr(2).kr(1).sr(1)
      .m(4).n(2).k(1)
      .cm_stride(5)
      .Test(xnn_f32_igemm_relu_ukernel_4x2__wasm);
}
6485*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
6486*4bdc9457SAndroid Build Coastguard Worker
6487*4bdc9457SAndroid Build Coastguard Worker
6488*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// 4x4 WASM kernel: single case with m = 4, n = 4, k = 1.
TEST(F32_IGEMM_RELU_4X4__WASM, k_eq_1) {
  GemmMicrokernelTester()
      .mr(4).nr(4).kr(1).sr(1)
      .m(4).n(4).k(1)
      .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
}
6500*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: single case with m = 4, n = 4, k = 1 and cn_stride = 7.
TEST(F32_IGEMM_RELU_4X4__WASM, strided_cn) {
  GemmMicrokernelTester()
      .mr(4).nr(4).kr(1).sr(1)
      .m(4).n(4).k(1)
      .cn_stride(7)
      .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
}
6513*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: k = 1, n in 1..4, m in 1..4, one iteration per case.
TEST(F32_IGEMM_RELU_4X4__WASM, k_eq_1_subtile) {
  for (uint32_t n_val = 1; n_val <= 4; n_val++) {
    for (uint32_t m_val = 1; m_val <= 4; m_val++) {
      GemmMicrokernelTester()
          .mr(4).nr(4).kr(1).sr(1)
          .m(m_val).n(n_val).k(1)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
    }
  }
}
6530*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: k = 1, n = 4, m in 1..4, one iteration per case.
TEST(F32_IGEMM_RELU_4X4__WASM, k_eq_1_subtile_m) {
  for (uint32_t m_val = 1; m_val <= 4; m_val++) {
    GemmMicrokernelTester()
        .mr(4).nr(4).kr(1).sr(1)
        .m(m_val).n(4).k(1)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
  }
}
6545*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: k = 1, m = 4, n in 1..4, one iteration per case.
TEST(F32_IGEMM_RELU_4X4__WASM, k_eq_1_subtile_n) {
  for (uint32_t n_val = 1; n_val <= 4; n_val++) {
    GemmMicrokernelTester()
        .mr(4).nr(4).kr(1).sr(1)
        .m(4).n(n_val).k(1)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
  }
}
6560*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: m = 4, n = 4, k in 2..9.
TEST(F32_IGEMM_RELU_4X4__WASM, k_gt_1) {
  for (size_t k_val = 2; k_val < 10; k_val++) {
    GemmMicrokernelTester()
        .mr(4).nr(4).kr(1).sr(1)
        .m(4).n(4).k(k_val)
        .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
  }
}
6574*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: k in 2..9, n in 1..4, m in 1..4, one iteration per case.
TEST(F32_IGEMM_RELU_4X4__WASM, k_gt_1_subtile) {
  for (size_t k_val = 2; k_val < 10; k_val++) {
    for (uint32_t n_val = 1; n_val <= 4; n_val++) {
      for (uint32_t m_val = 1; m_val <= 4; m_val++) {
        GemmMicrokernelTester()
            .mr(4).nr(4).kr(1).sr(1)
            .m(m_val).n(n_val).k(k_val)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
      }
    }
  }
}
6593*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: m = 4, n in 5..7, k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_4X4__WASM, n_gt_4) {
  for (uint32_t n_val = 5; n_val < 8; n_val++) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(4).kr(1).sr(1)
          .m(4).n(n_val).k(k_val)
          .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
    }
  }
}
6609*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: m = 4, n in 5..7, k in {1, 3, 5}, with cn_stride set to 7.
TEST(F32_IGEMM_RELU_4X4__WASM, n_gt_4_strided_cn) {
  for (uint32_t n_val = 5; n_val < 8; n_val++) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(4).kr(1).sr(1)
          .m(4).n(n_val).k(k_val)
          .cn_stride(7)
          .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
    }
  }
}
6626*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: n in 5..7, k in {1, 3, 5}, m in 1..4, one iteration per case.
TEST(F32_IGEMM_RELU_4X4__WASM, n_gt_4_subtile) {
  for (uint32_t n_val = 5; n_val < 8; n_val++) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      for (uint32_t m_val = 1; m_val <= 4; m_val++) {
        GemmMicrokernelTester()
            .mr(4).nr(4).kr(1).sr(1)
            .m(m_val).n(n_val).k(k_val)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
      }
    }
  }
}
6645*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: m = 4, n in {8, 12}, k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_4X4__WASM, n_div_4) {
  for (uint32_t n_val = 8; n_val <= 12; n_val += 4) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(4).kr(1).sr(1)
          .m(4).n(n_val).k(k_val)
          .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
    }
  }
}
6661*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: m = 4, n in {8, 12}, k in {1, 3, 5}, with cn_stride set to 7.
TEST(F32_IGEMM_RELU_4X4__WASM, n_div_4_strided_cn) {
  for (uint32_t n_val = 8; n_val <= 12; n_val += 4) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(4).kr(1).sr(1)
          .m(4).n(n_val).k(k_val)
          .cn_stride(7)
          .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
    }
  }
}
6678*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: n in {8, 12}, k in {1, 3, 5}, m in 1..4, one iteration per case.
TEST(F32_IGEMM_RELU_4X4__WASM, n_div_4_subtile) {
  for (uint32_t n_val = 8; n_val <= 12; n_val += 4) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      for (uint32_t m_val = 1; m_val <= 4; m_val++) {
        GemmMicrokernelTester()
            .mr(4).nr(4).kr(1).sr(1)
            .m(m_val).n(n_val).k(k_val)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
      }
    }
  }
}
6697*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: m = 4, n = 4, ks = 3, k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_4X4__WASM, small_kernel) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    GemmMicrokernelTester()
        .mr(4).nr(4).kr(1).sr(1)
        .m(4).n(4).k(k_val)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
  }
}
6712*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: ks = 3, k in {1, 3, 5}, n in 1..4, m in 1..4, one iteration per case.
TEST(F32_IGEMM_RELU_4X4__WASM, small_kernel_subtile) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    for (uint32_t n_val = 1; n_val <= 4; n_val++) {
      for (uint32_t m_val = 1; m_val <= 4; m_val++) {
        GemmMicrokernelTester()
            .mr(4).nr(4).kr(1).sr(1)
            .m(m_val).n(n_val).k(k_val)
            .ks(3)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
      }
    }
  }
}
6732*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: m = 4, ks = 3, n in 5..7, k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_4X4__WASM, n_gt_4_small_kernel) {
  for (uint32_t n_val = 5; n_val < 8; n_val++) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(4).kr(1).sr(1)
          .m(4).n(n_val).k(k_val)
          .ks(3)
          .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
    }
  }
}
6749*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: m = 4, ks = 3, n in {8, 12}, k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_4X4__WASM, n_div_4_small_kernel) {
  for (uint32_t n_val = 8; n_val <= 12; n_val += 4) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(4).kr(1).sr(1)
          .m(4).n(n_val).k(k_val)
          .ks(3)
          .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
    }
  }
}
6766*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: cm_stride = 7, k in {1, 3, 5}, n in 1..4, m in 1..4, one iteration per case.
TEST(F32_IGEMM_RELU_4X4__WASM, strided_cm_subtile) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    for (uint32_t n_val = 1; n_val <= 4; n_val++) {
      for (uint32_t m_val = 1; m_val <= 4; m_val++) {
        GemmMicrokernelTester()
            .mr(4).nr(4).kr(1).sr(1)
            .m(m_val).n(n_val).k(k_val)
            .cm_stride(7)
            .iterations(1)
            .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
      }
    }
  }
}
6786*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: m = 4, n = 4, ks = 3, a_offset = 23, k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_4X4__WASM, a_offset) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    GemmMicrokernelTester()
        .mr(4).nr(4).kr(1).sr(1)
        .m(4).n(4).k(k_val)
        .ks(3)
        .a_offset(23)
        .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
  }
}
6802*4bdc9457SAndroid Build Coastguard Worker
// 4x4 WASM kernel: m = 4, n = 4, ks = 3, a_offset = 23, k in {1, 3, 5},
// with zero_index swept over 0..3.
TEST(F32_IGEMM_RELU_4X4__WASM, zero) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    for (uint32_t zero_idx = 0; zero_idx < 4; zero_idx++) {
      GemmMicrokernelTester()
          .mr(4).nr(4).kr(1).sr(1)
          .m(4).n(4).k(k_val)
          .ks(3)
          .a_offset(23)
          .zero_index(zero_idx)
          .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
    }
  }
}
6821*4bdc9457SAndroid Build Coastguard Worker
// strided_cm: single run with m=4, n=4, k=1 and cm_stride(7).
TEST(F32_IGEMM_RELU_4X4__WASM, strided_cm) {
  GemmMicrokernelTester()
    .mr(4).nr(4).kr(1).sr(1)
    .m(4).n(4).k(1)
    .cm_stride(7)
    .Test(xnn_f32_igemm_relu_ukernel_4x4__wasm);
}
6834*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
6835*4bdc9457SAndroid Build Coastguard Worker
6836*4bdc9457SAndroid Build Coastguard Worker
// k_eq_1: single run of the 1x4 scalar kernel with m=1, n=4, k=1.
TEST(F32_IGEMM_RELU_1X4__SCALAR, k_eq_1) {
  GemmMicrokernelTester()
    .mr(1).nr(4).kr(1).sr(1)
    .m(1).n(4).k(1)
    .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
}
6848*4bdc9457SAndroid Build Coastguard Worker
// strided_cn: single run with m=1, n=4, k=1 and cn_stride(7).
TEST(F32_IGEMM_RELU_1X4__SCALAR, strided_cn) {
  GemmMicrokernelTester()
    .mr(1).nr(4).kr(1).sr(1)
    .m(1).n(4).k(1)
    .cn_stride(7)
    .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
}
6861*4bdc9457SAndroid Build Coastguard Worker
// k_eq_1_subtile: k=1, sweeping n over 1..4 and m over 1..1, with
// iterations(1) per configuration.
TEST(F32_IGEMM_RELU_1X4__SCALAR, k_eq_1_subtile) {
  for (uint32_t n_val = 1; n_val <= 4; ++n_val) {
    for (uint32_t m_val = 1; m_val <= 1; ++m_val) {
      GemmMicrokernelTester()
        .mr(1).nr(4).kr(1).sr(1)
        .m(m_val).n(n_val).k(1)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
    }
  }
}
6878*4bdc9457SAndroid Build Coastguard Worker
// k_eq_1_subtile_m: k=1, n=4, sweeping m over 1..1 with iterations(1).
TEST(F32_IGEMM_RELU_1X4__SCALAR, k_eq_1_subtile_m) {
  for (uint32_t m_val = 1; m_val <= 1; ++m_val) {
    GemmMicrokernelTester()
      .mr(1).nr(4).kr(1).sr(1)
      .m(m_val).n(4).k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
  }
}
6893*4bdc9457SAndroid Build Coastguard Worker
// k_eq_1_subtile_n: k=1, m=1, sweeping n over 1..4 with iterations(1).
TEST(F32_IGEMM_RELU_1X4__SCALAR, k_eq_1_subtile_n) {
  for (uint32_t n_val = 1; n_val <= 4; ++n_val) {
    GemmMicrokernelTester()
      .mr(1).nr(4).kr(1).sr(1)
      .m(1).n(n_val).k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
  }
}
6908*4bdc9457SAndroid Build Coastguard Worker
// k_gt_1: m=1, n=4, sweeping k over 2..9.
TEST(F32_IGEMM_RELU_1X4__SCALAR, k_gt_1) {
  for (size_t k_val = 2; k_val < 10; ++k_val) {
    GemmMicrokernelTester()
      .mr(1).nr(4).kr(1).sr(1)
      .m(1).n(4).k(k_val)
      .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
  }
}
6922*4bdc9457SAndroid Build Coastguard Worker
// k_gt_1_subtile: sweeps k over 2..9, n over 1..4 and m over 1..1, with
// iterations(1) per configuration.
TEST(F32_IGEMM_RELU_1X4__SCALAR, k_gt_1_subtile) {
  for (size_t k_val = 2; k_val < 10; ++k_val) {
    for (uint32_t n_val = 1; n_val <= 4; ++n_val) {
      for (uint32_t m_val = 1; m_val <= 1; ++m_val) {
        GemmMicrokernelTester()
          .mr(1).nr(4).kr(1).sr(1)
          .m(m_val).n(n_val).k(k_val)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
      }
    }
  }
}
6941*4bdc9457SAndroid Build Coastguard Worker
// n_gt_4: m=1, sweeping n over 5..7 and k over {1, 3, 5}.
TEST(F32_IGEMM_RELU_1X4__SCALAR, n_gt_4) {
  for (uint32_t n_val = 5; n_val < 8; ++n_val) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
        .mr(1).nr(4).kr(1).sr(1)
        .m(1).n(n_val).k(k_val)
        .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
    }
  }
}
6957*4bdc9457SAndroid Build Coastguard Worker
// n_gt_4_strided_cn: m=1, sweeping n over 5..7 and k over {1, 3, 5}, with
// cn_stride(7).
TEST(F32_IGEMM_RELU_1X4__SCALAR, n_gt_4_strided_cn) {
  for (uint32_t n_val = 5; n_val < 8; ++n_val) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
        .mr(1).nr(4).kr(1).sr(1)
        .m(1).n(n_val).k(k_val)
        .cn_stride(7)
        .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
    }
  }
}
6974*4bdc9457SAndroid Build Coastguard Worker
// n_gt_4_subtile: sweeps n over 5..7, k over {1, 3, 5} and m over 1..1, with
// iterations(1) per configuration.
TEST(F32_IGEMM_RELU_1X4__SCALAR, n_gt_4_subtile) {
  for (uint32_t n_val = 5; n_val < 8; ++n_val) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      for (uint32_t m_val = 1; m_val <= 1; ++m_val) {
        GemmMicrokernelTester()
          .mr(1).nr(4).kr(1).sr(1)
          .m(m_val).n(n_val).k(k_val)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
      }
    }
  }
}
6993*4bdc9457SAndroid Build Coastguard Worker
// n_div_4: m=1, with n in {8, 12} and k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_1X4__SCALAR, n_div_4) {
  for (uint32_t n_val = 8; n_val <= 12; n_val += 4) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
        .mr(1).nr(4).kr(1).sr(1)
        .m(1).n(n_val).k(k_val)
        .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
    }
  }
}
7009*4bdc9457SAndroid Build Coastguard Worker
// n_div_4_strided_cn: m=1, with n in {8, 12} and k in {1, 3, 5}, and
// cn_stride(7).
TEST(F32_IGEMM_RELU_1X4__SCALAR, n_div_4_strided_cn) {
  for (uint32_t n_val = 8; n_val <= 12; n_val += 4) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
        .mr(1).nr(4).kr(1).sr(1)
        .m(1).n(n_val).k(k_val)
        .cn_stride(7)
        .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
    }
  }
}
7026*4bdc9457SAndroid Build Coastguard Worker
// n_div_4_subtile: n in {8, 12}, k in {1, 3, 5}, m over 1..1, with
// iterations(1) per configuration.
TEST(F32_IGEMM_RELU_1X4__SCALAR, n_div_4_subtile) {
  for (uint32_t n_val = 8; n_val <= 12; n_val += 4) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      for (uint32_t m_val = 1; m_val <= 1; ++m_val) {
        GemmMicrokernelTester()
          .mr(1).nr(4).kr(1).sr(1)
          .m(m_val).n(n_val).k(k_val)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
      }
    }
  }
}
7045*4bdc9457SAndroid Build Coastguard Worker
// small_kernel: m=1, n=4, ks(3), sweeping k over {1, 3, 5}.
TEST(F32_IGEMM_RELU_1X4__SCALAR, small_kernel) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    GemmMicrokernelTester()
      .mr(1).nr(4).kr(1).sr(1)
      .m(1).n(4).k(k_val)
      .ks(3)
      .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
  }
}
7060*4bdc9457SAndroid Build Coastguard Worker
// small_kernel_subtile: ks(3), sweeping k over {1, 3, 5}, n over 1..4 and
// m over 1..1, with iterations(1) per configuration.
TEST(F32_IGEMM_RELU_1X4__SCALAR, small_kernel_subtile) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    for (uint32_t n_val = 1; n_val <= 4; ++n_val) {
      for (uint32_t m_val = 1; m_val <= 1; ++m_val) {
        GemmMicrokernelTester()
          .mr(1).nr(4).kr(1).sr(1)
          .m(m_val).n(n_val).k(k_val)
          .ks(3)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
      }
    }
  }
}
7080*4bdc9457SAndroid Build Coastguard Worker
// n_gt_4_small_kernel: m=1, ks(3), sweeping n over 5..7 and k over {1, 3, 5}.
TEST(F32_IGEMM_RELU_1X4__SCALAR, n_gt_4_small_kernel) {
  for (uint32_t n_val = 5; n_val < 8; ++n_val) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
        .mr(1).nr(4).kr(1).sr(1)
        .m(1).n(n_val).k(k_val)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
    }
  }
}
7097*4bdc9457SAndroid Build Coastguard Worker
// n_div_4_small_kernel: m=1, ks(3), with n in {8, 12} and k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_1X4__SCALAR, n_div_4_small_kernel) {
  for (uint32_t n_val = 8; n_val <= 12; n_val += 4) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
        .mr(1).nr(4).kr(1).sr(1)
        .m(1).n(n_val).k(k_val)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
    }
  }
}
7114*4bdc9457SAndroid Build Coastguard Worker
// strided_cm_subtile: cm_stride(7), sweeping k over {1, 3, 5}, n over 1..4
// and m over 1..1, with iterations(1) per configuration.
TEST(F32_IGEMM_RELU_1X4__SCALAR, strided_cm_subtile) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    for (uint32_t n_val = 1; n_val <= 4; ++n_val) {
      for (uint32_t m_val = 1; m_val <= 1; ++m_val) {
        GemmMicrokernelTester()
          .mr(1).nr(4).kr(1).sr(1)
          .m(m_val).n(n_val).k(k_val)
          .cm_stride(7)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
      }
    }
  }
}
7134*4bdc9457SAndroid Build Coastguard Worker
// a_offset: m=1, n=4, ks(3), a_offset(7), sweeping k over {1, 3, 5}.
TEST(F32_IGEMM_RELU_1X4__SCALAR, a_offset) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    GemmMicrokernelTester()
      .mr(1).nr(4).kr(1).sr(1)
      .m(1).n(4).k(k_val)
      .ks(3)
      .a_offset(7)
      .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
  }
}
7150*4bdc9457SAndroid Build Coastguard Worker
// zero: m=1, n=4, ks(3), a_offset(7); for each k in {1, 3, 5} sweeps
// zero_index over 0..0 (a single value for this kernel).
TEST(F32_IGEMM_RELU_1X4__SCALAR, zero) {
  for (size_t k_val = 1; k_val <= 5; k_val += 2) {
    for (uint32_t zero_idx = 0; zero_idx < 1; ++zero_idx) {
      GemmMicrokernelTester()
        .mr(1).nr(4).kr(1).sr(1)
        .m(1).n(4).k(k_val)
        .ks(3)
        .a_offset(7)
        .zero_index(zero_idx)
        .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
    }
  }
}
7169*4bdc9457SAndroid Build Coastguard Worker
// strided_cm: single run with m=1, n=4, k=1 and cm_stride(7).
TEST(F32_IGEMM_RELU_1X4__SCALAR, strided_cm) {
  GemmMicrokernelTester()
    .mr(1).nr(4).kr(1).sr(1)
    .m(1).n(4).k(1)
    .cm_stride(7)
    .Test(xnn_f32_igemm_relu_ukernel_1x4__scalar);
}
7182*4bdc9457SAndroid Build Coastguard Worker
7183*4bdc9457SAndroid Build Coastguard Worker
// k_eq_1: single run of the 4x2 scalar kernel with m=4, n=2, k=1.
TEST(F32_IGEMM_RELU_4X2__SCALAR, k_eq_1) {
  GemmMicrokernelTester()
    .mr(4).nr(2).kr(1).sr(1)
    .m(4).n(2).k(1)
    .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
}
7195*4bdc9457SAndroid Build Coastguard Worker
// strided_cn: single run with m=4, n=2, k=1 and cn_stride(5).
TEST(F32_IGEMM_RELU_4X2__SCALAR, strided_cn) {
  GemmMicrokernelTester()
    .mr(4).nr(2).kr(1).sr(1)
    .m(4).n(2).k(1)
    .cn_stride(5)
    .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
}
7208*4bdc9457SAndroid Build Coastguard Worker
// k_eq_1_subtile: k=1, sweeping n over 1..2 and m over 1..4, with
// iterations(1) per configuration.
TEST(F32_IGEMM_RELU_4X2__SCALAR, k_eq_1_subtile) {
  for (uint32_t n_val = 1; n_val <= 2; ++n_val) {
    for (uint32_t m_val = 1; m_val <= 4; ++m_val) {
      GemmMicrokernelTester()
        .mr(4).nr(2).kr(1).sr(1)
        .m(m_val).n(n_val).k(1)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
    }
  }
}
7225*4bdc9457SAndroid Build Coastguard Worker
// k_eq_1_subtile_m: k=1, n=2, sweeping m over 1..4 with iterations(1).
TEST(F32_IGEMM_RELU_4X2__SCALAR, k_eq_1_subtile_m) {
  for (uint32_t m_val = 1; m_val <= 4; ++m_val) {
    GemmMicrokernelTester()
      .mr(4).nr(2).kr(1).sr(1)
      .m(m_val).n(2).k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
  }
}
7240*4bdc9457SAndroid Build Coastguard Worker
// k_eq_1_subtile_n: k=1, m=4, sweeping n over 1..2 with iterations(1).
TEST(F32_IGEMM_RELU_4X2__SCALAR, k_eq_1_subtile_n) {
  for (uint32_t n_val = 1; n_val <= 2; ++n_val) {
    GemmMicrokernelTester()
      .mr(4).nr(2).kr(1).sr(1)
      .m(4).n(n_val).k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
  }
}
7255*4bdc9457SAndroid Build Coastguard Worker
// k_gt_1: m=4, n=2, sweeping k over 2..9.
TEST(F32_IGEMM_RELU_4X2__SCALAR, k_gt_1) {
  for (size_t k_val = 2; k_val < 10; ++k_val) {
    GemmMicrokernelTester()
      .mr(4).nr(2).kr(1).sr(1)
      .m(4).n(2).k(k_val)
      .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
  }
}
7269*4bdc9457SAndroid Build Coastguard Worker
// k_gt_1_subtile: sweeps k over 2..9, n over 1..2 and m over 1..4, with
// iterations(1) per configuration.
TEST(F32_IGEMM_RELU_4X2__SCALAR, k_gt_1_subtile) {
  for (size_t k_val = 2; k_val < 10; ++k_val) {
    for (uint32_t n_val = 1; n_val <= 2; ++n_val) {
      for (uint32_t m_val = 1; m_val <= 4; ++m_val) {
        GemmMicrokernelTester()
          .mr(4).nr(2).kr(1).sr(1)
          .m(m_val).n(n_val).k(k_val)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
      }
    }
  }
}
7288*4bdc9457SAndroid Build Coastguard Worker
// n_gt_2: m=4, with n over 3..3 (a single value) and k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_4X2__SCALAR, n_gt_2) {
  for (uint32_t n_val = 3; n_val < 4; ++n_val) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
        .mr(4).nr(2).kr(1).sr(1)
        .m(4).n(n_val).k(k_val)
        .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
    }
  }
}
7304*4bdc9457SAndroid Build Coastguard Worker
// n_gt_2_strided_cn: m=4, cn_stride(5), with n over 3..3 (a single value)
// and k in {1, 3, 5}.
TEST(F32_IGEMM_RELU_4X2__SCALAR, n_gt_2_strided_cn) {
  for (uint32_t n_val = 3; n_val < 4; ++n_val) {
    for (size_t k_val = 1; k_val <= 5; k_val += 2) {
      GemmMicrokernelTester()
        .mr(4).nr(2).kr(1).sr(1)
        .m(4).n(n_val).k(k_val)
        .cn_stride(5)
        .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
    }
  }
}
7321*4bdc9457SAndroid Build Coastguard Worker
// n = 3, k = 1, 3, 5, and every m from 1 to 4; each configuration is run
// with iterations(1).
TEST(F32_IGEMM_RELU_4X2__SCALAR, n_gt_2_subtile) {
  for (uint32_t n = 3; n < 4; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(2)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
      }
    }
  }
}
7340*4bdc9457SAndroid Build Coastguard Worker
// m = 4 with n = 4 and 6 (multiples of nr = 2), k = 1, 3, 5.
TEST(F32_IGEMM_RELU_4X2__SCALAR, n_div_2) {
  for (uint32_t n = 4; n <= 6; n += 2) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(2)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
    }
  }
}
7356*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_2 (m = 4, n = 4 and 6, k = 1, 3, 5) with cn_stride
// set to 5.
TEST(F32_IGEMM_RELU_4X2__SCALAR, n_div_2_strided_cn) {
  for (uint32_t n = 4; n <= 6; n += 2) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(2)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .cn_stride(5)
        .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
    }
  }
}
7373*4bdc9457SAndroid Build Coastguard Worker
// n = 4 and 6, k = 1, 3, 5, and every m from 1 to 4; each configuration is
// run with iterations(1).
TEST(F32_IGEMM_RELU_4X2__SCALAR, n_div_2_subtile) {
  for (uint32_t n = 4; n <= 6; n += 2) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(2)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
      }
    }
  }
}
7392*4bdc9457SAndroid Build Coastguard Worker
// m = 4, n = 2, k = 1, 3, 5, with ks set to 3.
TEST(F32_IGEMM_RELU_4X2__SCALAR, small_kernel) {
  for (size_t k = 1; k <= 5; k += 2) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(2)
      .kr(1)
      .sr(1)
      .m(4)
      .n(2)
      .k(k)
      .ks(3)
      .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
  }
}
7407*4bdc9457SAndroid Build Coastguard Worker
// ks = 3 with k = 1, 3, 5, every n from 1 to 2 and every m from 1 to 4; each
// configuration is run with iterations(1).
TEST(F32_IGEMM_RELU_4X2__SCALAR, small_kernel_subtile) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t n = 1; n <= 2; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(2)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .ks(3)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
      }
    }
  }
}
7427*4bdc9457SAndroid Build Coastguard Worker
// m = 4, n = 3 (the only value the n loop yields), k = 1, 3, 5, with ks set
// to 3.
TEST(F32_IGEMM_RELU_4X2__SCALAR, n_gt_2_small_kernel) {
  for (uint32_t n = 3; n < 4; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(2)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
    }
  }
}
7444*4bdc9457SAndroid Build Coastguard Worker
// m = 4, n = 4 and 6, k = 1, 3, 5, with ks set to 3.
TEST(F32_IGEMM_RELU_4X2__SCALAR, n_div_2_small_kernel) {
  for (uint32_t n = 4; n <= 6; n += 2) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(2)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
    }
  }
}
7461*4bdc9457SAndroid Build Coastguard Worker
// cm_stride = 5 with k = 1, 3, 5, every n from 1 to 2 and every m from 1 to
// 4; each configuration is run with iterations(1).
TEST(F32_IGEMM_RELU_4X2__SCALAR, strided_cm_subtile) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t n = 1; n <= 2; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(2)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(5)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
      }
    }
  }
}
7481*4bdc9457SAndroid Build Coastguard Worker
// m = 4, n = 2, k = 1, 3, 5, with ks set to 3 and a_offset set to 23.
TEST(F32_IGEMM_RELU_4X2__SCALAR, a_offset) {
  for (size_t k = 1; k <= 5; k += 2) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(2)
      .kr(1)
      .sr(1)
      .m(4)
      .n(2)
      .k(k)
      .ks(3)
      .a_offset(23)
      .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
  }
}
7497*4bdc9457SAndroid Build Coastguard Worker
// Same setup as a_offset (ks = 3, a_offset = 23, k = 1, 3, 5), additionally
// passing each mz from 0 to 3 as zero_index.
TEST(F32_IGEMM_RELU_4X2__SCALAR, zero) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t mz = 0; mz < 4; mz++) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(2)
        .kr(1)
        .sr(1)
        .m(4)
        .n(2)
        .k(k)
        .ks(3)
        .a_offset(23)
        .zero_index(mz)
        .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
    }
  }
}
7516*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 4, n = 2, k = 1, with cm_stride set to 5.
TEST(F32_IGEMM_RELU_4X2__SCALAR, strided_cm) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(2)
    .kr(1)
    .sr(1)
    .m(4)
    .n(2)
    .k(1)
    .cm_stride(5)
    .Test(xnn_f32_igemm_relu_ukernel_4x2__scalar);
}
7529*4bdc9457SAndroid Build Coastguard Worker
7530*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel, single configuration: m = 4, n = 4, k = 1.
TEST(F32_IGEMM_RELU_4X4__SCALAR, k_eq_1) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(4)
    .kr(1)
    .sr(1)
    .m(4)
    .n(4)
    .k(1)
    .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
}
7542*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 4, n = 4, k = 1, with cn_stride set to 7.
TEST(F32_IGEMM_RELU_4X4__SCALAR, strided_cn) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(4)
    .kr(1)
    .sr(1)
    .m(4)
    .n(4)
    .k(1)
    .cn_stride(7)
    .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
}
7555*4bdc9457SAndroid Build Coastguard Worker
// k = 1 with every n from 1 to 4 and every m from 1 to 4; each configuration
// is run with iterations(1).
TEST(F32_IGEMM_RELU_4X4__SCALAR, k_eq_1_subtile) {
  for (uint32_t n = 1; n <= 4; n++) {
    for (uint32_t m = 1; m <= 4; m++) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(1)
        .iterations(1)
        .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
    }
  }
}
7572*4bdc9457SAndroid Build Coastguard Worker
// k = 1, n = 4, with every m from 1 to 4; each configuration is run with
// iterations(1).
TEST(F32_IGEMM_RELU_4X4__SCALAR, k_eq_1_subtile_m) {
  for (uint32_t m = 1; m <= 4; m++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(4)
      .kr(1)
      .sr(1)
      .m(m)
      .n(4)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
  }
}
7587*4bdc9457SAndroid Build Coastguard Worker
// k = 1, m = 4, with every n from 1 to 4; each configuration is run with
// iterations(1).
TEST(F32_IGEMM_RELU_4X4__SCALAR, k_eq_1_subtile_n) {
  for (uint32_t n = 1; n <= 4; n++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(4)
      .kr(1)
      .sr(1)
      .m(4)
      .n(n)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
  }
}
7602*4bdc9457SAndroid Build Coastguard Worker
// m = 4, n = 4, with every k from 2 to 9.
TEST(F32_IGEMM_RELU_4X4__SCALAR, k_gt_1) {
  for (size_t k = 2; k < 10; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(4)
      .kr(1)
      .sr(1)
      .m(4)
      .n(4)
      .k(k)
      .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
  }
}
7616*4bdc9457SAndroid Build Coastguard Worker
// Every k from 2 to 9 combined with every n from 1 to 4 and every m from 1
// to 4; each configuration is run with iterations(1).
TEST(F32_IGEMM_RELU_4X4__SCALAR, k_gt_1_subtile) {
  for (size_t k = 2; k < 10; k++) {
    for (uint32_t n = 1; n <= 4; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(4)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
      }
    }
  }
}
7635*4bdc9457SAndroid Build Coastguard Worker
// m = 4 with n = 5, 6, 7 (all above nr = 4), k = 1, 3, 5.
TEST(F32_IGEMM_RELU_4X4__SCALAR, n_gt_4) {
  for (uint32_t n = 5; n < 8; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
    }
  }
}
7651*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_4 (m = 4, n = 5, 6, 7, k = 1, 3, 5) with cn_stride set
// to 7.
TEST(F32_IGEMM_RELU_4X4__SCALAR, n_gt_4_strided_cn) {
  for (uint32_t n = 5; n < 8; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .cn_stride(7)
        .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
    }
  }
}
7668*4bdc9457SAndroid Build Coastguard Worker
// n = 5, 6, 7, k = 1, 3, 5, and every m from 1 to 4; each configuration is
// run with iterations(1).
TEST(F32_IGEMM_RELU_4X4__SCALAR, n_gt_4_subtile) {
  for (uint32_t n = 5; n < 8; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(4)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
      }
    }
  }
}
7687*4bdc9457SAndroid Build Coastguard Worker
// m = 4 with n = 8 and 12 (multiples of nr = 4), k = 1, 3, 5.
TEST(F32_IGEMM_RELU_4X4__SCALAR, n_div_4) {
  for (uint32_t n = 8; n <= 12; n += 4) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
    }
  }
}
7703*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_4 (m = 4, n = 8 and 12, k = 1, 3, 5) with cn_stride
// set to 7.
TEST(F32_IGEMM_RELU_4X4__SCALAR, n_div_4_strided_cn) {
  for (uint32_t n = 8; n <= 12; n += 4) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .cn_stride(7)
        .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
    }
  }
}
7720*4bdc9457SAndroid Build Coastguard Worker
// n = 8 and 12, k = 1, 3, 5, and every m from 1 to 4; each configuration is
// run with iterations(1).
TEST(F32_IGEMM_RELU_4X4__SCALAR, n_div_4_subtile) {
  for (uint32_t n = 8; n <= 12; n += 4) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(4)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
      }
    }
  }
}
7739*4bdc9457SAndroid Build Coastguard Worker
// m = 4, n = 4, k = 1, 3, 5, with ks set to 3.
TEST(F32_IGEMM_RELU_4X4__SCALAR, small_kernel) {
  for (size_t k = 1; k <= 5; k += 2) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(4)
      .kr(1)
      .sr(1)
      .m(4)
      .n(4)
      .k(k)
      .ks(3)
      .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
  }
}
7754*4bdc9457SAndroid Build Coastguard Worker
// ks = 3 with k = 1, 3, 5, every n from 1 to 4 and every m from 1 to 4; each
// configuration is run with iterations(1).
TEST(F32_IGEMM_RELU_4X4__SCALAR, small_kernel_subtile) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t n = 1; n <= 4; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(4)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .ks(3)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
      }
    }
  }
}
7774*4bdc9457SAndroid Build Coastguard Worker
// m = 4, n = 5, 6, 7, k = 1, 3, 5, with ks set to 3.
TEST(F32_IGEMM_RELU_4X4__SCALAR, n_gt_4_small_kernel) {
  for (uint32_t n = 5; n < 8; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
    }
  }
}
7791*4bdc9457SAndroid Build Coastguard Worker
// m = 4, n = 8 and 12, k = 1, 3, 5, with ks set to 3.
TEST(F32_IGEMM_RELU_4X4__SCALAR, n_div_4_small_kernel) {
  for (uint32_t n = 8; n <= 12; n += 4) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .ks(3)
        .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
    }
  }
}
7808*4bdc9457SAndroid Build Coastguard Worker
// cm_stride = 7 with k = 1, 3, 5, every n from 1 to 4 and every m from 1 to
// 4; each configuration is run with iterations(1).
TEST(F32_IGEMM_RELU_4X4__SCALAR, strided_cm_subtile) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t n = 1; n <= 4; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(4)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(7)
          .iterations(1)
          .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
      }
    }
  }
}
7828*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x4__scalar on a full 4x4 tile for
// k in {1, 3, 5}, with ks = 3 and a_offset set to 23.
TEST(F32_IGEMM_RELU_4X4__SCALAR, a_offset) {
  for (size_t k_depth = 1; k_depth <= 5; k_depth += 2) {
    GemmMicrokernelTester()
      .mr(4).nr(4).kr(1).sr(1)       // tile configuration
      .m(4).n(4).k(k_depth)          // full tile, varying k
      .ks(3)
      .a_offset(23)
      .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
  }
}
7844*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x4__scalar on a full 4x4 tile for
// k in {1, 3, 5} with ks = 3 and a_offset = 23, passing each value
// 0..3 in turn to zero_index.
TEST(F32_IGEMM_RELU_4X4__SCALAR, zero) {
  for (size_t k_depth = 1; k_depth <= 5; k_depth += 2) {
    for (uint32_t zero_row = 0; zero_row < 4; zero_row++) {
      GemmMicrokernelTester()
        .mr(4).nr(4).kr(1).sr(1)       // tile configuration
        .m(4).n(4).k(k_depth)          // full tile, varying k
        .ks(3)
        .a_offset(23)
        .zero_index(zero_row)
        .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
    }
  }
}
7863*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_igemm_relu_ukernel_4x4__scalar once on a full 4x4 tile with
// k = 1 and cm_stride set to 7.
TEST(F32_IGEMM_RELU_4X4__SCALAR, strided_cm) {
  GemmMicrokernelTester()
    .mr(4).nr(4).kr(1).sr(1)   // tile configuration
    .m(4).n(4).k(1)            // single full tile
    .cm_stride(7)
    .Test(xnn_f32_igemm_relu_ukernel_4x4__scalar);
}
7876