1*4bdc9457SAndroid Build Coastguard Worker // Copyright (c) Facebook, Inc. and its affiliates.
2*4bdc9457SAndroid Build Coastguard Worker // All rights reserved.
3*4bdc9457SAndroid Build Coastguard Worker //
4*4bdc9457SAndroid Build Coastguard Worker // Copyright 2019 Google LLC
5*4bdc9457SAndroid Build Coastguard Worker //
6*4bdc9457SAndroid Build Coastguard Worker // This source code is licensed under the BSD-style license found in the
7*4bdc9457SAndroid Build Coastguard Worker // LICENSE file in the root directory of this source tree.
8*4bdc9457SAndroid Build Coastguard Worker //
9*4bdc9457SAndroid Build Coastguard Worker // Auto-generated file. Do not edit!
10*4bdc9457SAndroid Build Coastguard Worker // Specification: test/f32-gemm-relu.yaml
11*4bdc9457SAndroid Build Coastguard Worker // Generator: tools/generate-gemm-test.py
12*4bdc9457SAndroid Build Coastguard Worker
13*4bdc9457SAndroid Build Coastguard Worker
14*4bdc9457SAndroid Build Coastguard Worker #include <gtest/gtest.h>
15*4bdc9457SAndroid Build Coastguard Worker
16*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/allocator.h>
17*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/common.h>
18*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/isa-checks.h>
19*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/microparams-init.h>
20*4bdc9457SAndroid Build Coastguard Worker
21*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/gemm.h>
22*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/igemm.h>
23*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/ppmm.h>
24*4bdc9457SAndroid Build Coastguard Worker #include "gemm-microkernel-tester.h"
25*4bdc9457SAndroid Build Coastguard Worker
26*4bdc9457SAndroid Build Coastguard Worker
27*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,k_eq_1)28*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, k_eq_1) {
29*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
30*4bdc9457SAndroid Build Coastguard Worker .mr(3)
31*4bdc9457SAndroid Build Coastguard Worker .nr(8)
32*4bdc9457SAndroid Build Coastguard Worker .kr(1)
33*4bdc9457SAndroid Build Coastguard Worker .sr(1)
34*4bdc9457SAndroid Build Coastguard Worker .m(3)
35*4bdc9457SAndroid Build Coastguard Worker .n(8)
36*4bdc9457SAndroid Build Coastguard Worker .k(1)
37*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
38*4bdc9457SAndroid Build Coastguard Worker }
39*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,strided_cn)40*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, strided_cn) {
41*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
42*4bdc9457SAndroid Build Coastguard Worker .mr(3)
43*4bdc9457SAndroid Build Coastguard Worker .nr(8)
44*4bdc9457SAndroid Build Coastguard Worker .kr(1)
45*4bdc9457SAndroid Build Coastguard Worker .sr(1)
46*4bdc9457SAndroid Build Coastguard Worker .m(3)
47*4bdc9457SAndroid Build Coastguard Worker .n(8)
48*4bdc9457SAndroid Build Coastguard Worker .k(1)
49*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
50*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
51*4bdc9457SAndroid Build Coastguard Worker }
52*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,k_eq_1_strided_a)53*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, k_eq_1_strided_a) {
54*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
55*4bdc9457SAndroid Build Coastguard Worker .mr(3)
56*4bdc9457SAndroid Build Coastguard Worker .nr(8)
57*4bdc9457SAndroid Build Coastguard Worker .kr(1)
58*4bdc9457SAndroid Build Coastguard Worker .sr(1)
59*4bdc9457SAndroid Build Coastguard Worker .m(3)
60*4bdc9457SAndroid Build Coastguard Worker .n(8)
61*4bdc9457SAndroid Build Coastguard Worker .k(1)
62*4bdc9457SAndroid Build Coastguard Worker .a_stride(3)
63*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
64*4bdc9457SAndroid Build Coastguard Worker }
65*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile)66*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile) {
67*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
68*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
69*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
70*4bdc9457SAndroid Build Coastguard Worker .mr(3)
71*4bdc9457SAndroid Build Coastguard Worker .nr(8)
72*4bdc9457SAndroid Build Coastguard Worker .kr(1)
73*4bdc9457SAndroid Build Coastguard Worker .sr(1)
74*4bdc9457SAndroid Build Coastguard Worker .m(m)
75*4bdc9457SAndroid Build Coastguard Worker .n(n)
76*4bdc9457SAndroid Build Coastguard Worker .k(1)
77*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
78*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
79*4bdc9457SAndroid Build Coastguard Worker }
80*4bdc9457SAndroid Build Coastguard Worker }
81*4bdc9457SAndroid Build Coastguard Worker }
82*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile_m)83*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_m) {
84*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
85*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
86*4bdc9457SAndroid Build Coastguard Worker .mr(3)
87*4bdc9457SAndroid Build Coastguard Worker .nr(8)
88*4bdc9457SAndroid Build Coastguard Worker .kr(1)
89*4bdc9457SAndroid Build Coastguard Worker .sr(1)
90*4bdc9457SAndroid Build Coastguard Worker .m(m)
91*4bdc9457SAndroid Build Coastguard Worker .n(8)
92*4bdc9457SAndroid Build Coastguard Worker .k(1)
93*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
94*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
95*4bdc9457SAndroid Build Coastguard Worker }
96*4bdc9457SAndroid Build Coastguard Worker }
97*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile_n)98*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_n) {
99*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
100*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
101*4bdc9457SAndroid Build Coastguard Worker .mr(3)
102*4bdc9457SAndroid Build Coastguard Worker .nr(8)
103*4bdc9457SAndroid Build Coastguard Worker .kr(1)
104*4bdc9457SAndroid Build Coastguard Worker .sr(1)
105*4bdc9457SAndroid Build Coastguard Worker .m(3)
106*4bdc9457SAndroid Build Coastguard Worker .n(n)
107*4bdc9457SAndroid Build Coastguard Worker .k(1)
108*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
109*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
110*4bdc9457SAndroid Build Coastguard Worker }
111*4bdc9457SAndroid Build Coastguard Worker }
112*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,k_gt_1)113*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, k_gt_1) {
114*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
115*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
116*4bdc9457SAndroid Build Coastguard Worker .mr(3)
117*4bdc9457SAndroid Build Coastguard Worker .nr(8)
118*4bdc9457SAndroid Build Coastguard Worker .kr(1)
119*4bdc9457SAndroid Build Coastguard Worker .sr(1)
120*4bdc9457SAndroid Build Coastguard Worker .m(3)
121*4bdc9457SAndroid Build Coastguard Worker .n(8)
122*4bdc9457SAndroid Build Coastguard Worker .k(k)
123*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
124*4bdc9457SAndroid Build Coastguard Worker }
125*4bdc9457SAndroid Build Coastguard Worker }
126*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,k_gt_1_strided_a)127*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, k_gt_1_strided_a) {
128*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
129*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
130*4bdc9457SAndroid Build Coastguard Worker .mr(3)
131*4bdc9457SAndroid Build Coastguard Worker .nr(8)
132*4bdc9457SAndroid Build Coastguard Worker .kr(1)
133*4bdc9457SAndroid Build Coastguard Worker .sr(1)
134*4bdc9457SAndroid Build Coastguard Worker .m(3)
135*4bdc9457SAndroid Build Coastguard Worker .n(8)
136*4bdc9457SAndroid Build Coastguard Worker .k(k)
137*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
138*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
139*4bdc9457SAndroid Build Coastguard Worker }
140*4bdc9457SAndroid Build Coastguard Worker }
141*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,k_gt_1_subtile)142*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, k_gt_1_subtile) {
143*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
144*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
145*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
146*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
147*4bdc9457SAndroid Build Coastguard Worker .mr(3)
148*4bdc9457SAndroid Build Coastguard Worker .nr(8)
149*4bdc9457SAndroid Build Coastguard Worker .kr(1)
150*4bdc9457SAndroid Build Coastguard Worker .sr(1)
151*4bdc9457SAndroid Build Coastguard Worker .m(m)
152*4bdc9457SAndroid Build Coastguard Worker .n(n)
153*4bdc9457SAndroid Build Coastguard Worker .k(k)
154*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
155*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
156*4bdc9457SAndroid Build Coastguard Worker }
157*4bdc9457SAndroid Build Coastguard Worker }
158*4bdc9457SAndroid Build Coastguard Worker }
159*4bdc9457SAndroid Build Coastguard Worker }
160*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,n_gt_8)161*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, n_gt_8) {
162*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
163*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
164*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
165*4bdc9457SAndroid Build Coastguard Worker .mr(3)
166*4bdc9457SAndroid Build Coastguard Worker .nr(8)
167*4bdc9457SAndroid Build Coastguard Worker .kr(1)
168*4bdc9457SAndroid Build Coastguard Worker .sr(1)
169*4bdc9457SAndroid Build Coastguard Worker .m(3)
170*4bdc9457SAndroid Build Coastguard Worker .n(n)
171*4bdc9457SAndroid Build Coastguard Worker .k(k)
172*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
173*4bdc9457SAndroid Build Coastguard Worker }
174*4bdc9457SAndroid Build Coastguard Worker }
175*4bdc9457SAndroid Build Coastguard Worker }
176*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,n_gt_8_strided_cn)177*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_cn) {
178*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
179*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
180*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
181*4bdc9457SAndroid Build Coastguard Worker .mr(3)
182*4bdc9457SAndroid Build Coastguard Worker .nr(8)
183*4bdc9457SAndroid Build Coastguard Worker .kr(1)
184*4bdc9457SAndroid Build Coastguard Worker .sr(1)
185*4bdc9457SAndroid Build Coastguard Worker .m(3)
186*4bdc9457SAndroid Build Coastguard Worker .n(n)
187*4bdc9457SAndroid Build Coastguard Worker .k(k)
188*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
189*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
190*4bdc9457SAndroid Build Coastguard Worker }
191*4bdc9457SAndroid Build Coastguard Worker }
192*4bdc9457SAndroid Build Coastguard Worker }
193*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,n_gt_8_strided_a)194*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_a) {
195*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
196*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
197*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
198*4bdc9457SAndroid Build Coastguard Worker .mr(3)
199*4bdc9457SAndroid Build Coastguard Worker .nr(8)
200*4bdc9457SAndroid Build Coastguard Worker .kr(1)
201*4bdc9457SAndroid Build Coastguard Worker .sr(1)
202*4bdc9457SAndroid Build Coastguard Worker .m(3)
203*4bdc9457SAndroid Build Coastguard Worker .n(n)
204*4bdc9457SAndroid Build Coastguard Worker .k(k)
205*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
206*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
207*4bdc9457SAndroid Build Coastguard Worker }
208*4bdc9457SAndroid Build Coastguard Worker }
209*4bdc9457SAndroid Build Coastguard Worker }
210*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,n_gt_8_subtile)211*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, n_gt_8_subtile) {
212*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
213*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
214*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
215*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
216*4bdc9457SAndroid Build Coastguard Worker .mr(3)
217*4bdc9457SAndroid Build Coastguard Worker .nr(8)
218*4bdc9457SAndroid Build Coastguard Worker .kr(1)
219*4bdc9457SAndroid Build Coastguard Worker .sr(1)
220*4bdc9457SAndroid Build Coastguard Worker .m(m)
221*4bdc9457SAndroid Build Coastguard Worker .n(n)
222*4bdc9457SAndroid Build Coastguard Worker .k(k)
223*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
224*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
225*4bdc9457SAndroid Build Coastguard Worker }
226*4bdc9457SAndroid Build Coastguard Worker }
227*4bdc9457SAndroid Build Coastguard Worker }
228*4bdc9457SAndroid Build Coastguard Worker }
229*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,n_div_8)230*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, n_div_8) {
231*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
232*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
233*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
234*4bdc9457SAndroid Build Coastguard Worker .mr(3)
235*4bdc9457SAndroid Build Coastguard Worker .nr(8)
236*4bdc9457SAndroid Build Coastguard Worker .kr(1)
237*4bdc9457SAndroid Build Coastguard Worker .sr(1)
238*4bdc9457SAndroid Build Coastguard Worker .m(3)
239*4bdc9457SAndroid Build Coastguard Worker .n(n)
240*4bdc9457SAndroid Build Coastguard Worker .k(k)
241*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
242*4bdc9457SAndroid Build Coastguard Worker }
243*4bdc9457SAndroid Build Coastguard Worker }
244*4bdc9457SAndroid Build Coastguard Worker }
245*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,n_div_8_strided_cn)246*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, n_div_8_strided_cn) {
247*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
248*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
249*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
250*4bdc9457SAndroid Build Coastguard Worker .mr(3)
251*4bdc9457SAndroid Build Coastguard Worker .nr(8)
252*4bdc9457SAndroid Build Coastguard Worker .kr(1)
253*4bdc9457SAndroid Build Coastguard Worker .sr(1)
254*4bdc9457SAndroid Build Coastguard Worker .m(3)
255*4bdc9457SAndroid Build Coastguard Worker .n(n)
256*4bdc9457SAndroid Build Coastguard Worker .k(k)
257*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
258*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
259*4bdc9457SAndroid Build Coastguard Worker }
260*4bdc9457SAndroid Build Coastguard Worker }
261*4bdc9457SAndroid Build Coastguard Worker }
262*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,n_div_8_strided_a)263*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, n_div_8_strided_a) {
264*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
265*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
266*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
267*4bdc9457SAndroid Build Coastguard Worker .mr(3)
268*4bdc9457SAndroid Build Coastguard Worker .nr(8)
269*4bdc9457SAndroid Build Coastguard Worker .kr(1)
270*4bdc9457SAndroid Build Coastguard Worker .sr(1)
271*4bdc9457SAndroid Build Coastguard Worker .m(3)
272*4bdc9457SAndroid Build Coastguard Worker .n(n)
273*4bdc9457SAndroid Build Coastguard Worker .k(k)
274*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
275*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
276*4bdc9457SAndroid Build Coastguard Worker }
277*4bdc9457SAndroid Build Coastguard Worker }
278*4bdc9457SAndroid Build Coastguard Worker }
279*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,n_div_8_subtile)280*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, n_div_8_subtile) {
281*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
282*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
283*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
284*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
285*4bdc9457SAndroid Build Coastguard Worker .mr(3)
286*4bdc9457SAndroid Build Coastguard Worker .nr(8)
287*4bdc9457SAndroid Build Coastguard Worker .kr(1)
288*4bdc9457SAndroid Build Coastguard Worker .sr(1)
289*4bdc9457SAndroid Build Coastguard Worker .m(m)
290*4bdc9457SAndroid Build Coastguard Worker .n(n)
291*4bdc9457SAndroid Build Coastguard Worker .k(k)
292*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
293*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
294*4bdc9457SAndroid Build Coastguard Worker }
295*4bdc9457SAndroid Build Coastguard Worker }
296*4bdc9457SAndroid Build Coastguard Worker }
297*4bdc9457SAndroid Build Coastguard Worker }
298*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,strided_cm_subtile)299*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, strided_cm_subtile) {
300*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
301*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
302*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
303*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
304*4bdc9457SAndroid Build Coastguard Worker .mr(3)
305*4bdc9457SAndroid Build Coastguard Worker .nr(8)
306*4bdc9457SAndroid Build Coastguard Worker .kr(1)
307*4bdc9457SAndroid Build Coastguard Worker .sr(1)
308*4bdc9457SAndroid Build Coastguard Worker .m(m)
309*4bdc9457SAndroid Build Coastguard Worker .n(n)
310*4bdc9457SAndroid Build Coastguard Worker .k(k)
311*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
312*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
313*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
314*4bdc9457SAndroid Build Coastguard Worker }
315*4bdc9457SAndroid Build Coastguard Worker }
316*4bdc9457SAndroid Build Coastguard Worker }
317*4bdc9457SAndroid Build Coastguard Worker }
318*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT,strided_cm)319*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_LOADSPLAT, strided_cm) {
320*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
321*4bdc9457SAndroid Build Coastguard Worker .mr(3)
322*4bdc9457SAndroid Build Coastguard Worker .nr(8)
323*4bdc9457SAndroid Build Coastguard Worker .kr(1)
324*4bdc9457SAndroid Build Coastguard Worker .sr(1)
325*4bdc9457SAndroid Build Coastguard Worker .m(3)
326*4bdc9457SAndroid Build Coastguard Worker .n(8)
327*4bdc9457SAndroid Build Coastguard Worker .k(1)
328*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
329*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat);
330*4bdc9457SAndroid Build Coastguard Worker }
331*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
332*4bdc9457SAndroid Build Coastguard Worker
333*4bdc9457SAndroid Build Coastguard Worker
334*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,k_eq_4)335*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, k_eq_4) {
336*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
337*4bdc9457SAndroid Build Coastguard Worker .mr(3)
338*4bdc9457SAndroid Build Coastguard Worker .nr(8)
339*4bdc9457SAndroid Build Coastguard Worker .kr(1)
340*4bdc9457SAndroid Build Coastguard Worker .sr(1)
341*4bdc9457SAndroid Build Coastguard Worker .m(3)
342*4bdc9457SAndroid Build Coastguard Worker .n(8)
343*4bdc9457SAndroid Build Coastguard Worker .k(4)
344*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
345*4bdc9457SAndroid Build Coastguard Worker }
346*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,strided_cn)347*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, strided_cn) {
348*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
349*4bdc9457SAndroid Build Coastguard Worker .mr(3)
350*4bdc9457SAndroid Build Coastguard Worker .nr(8)
351*4bdc9457SAndroid Build Coastguard Worker .kr(1)
352*4bdc9457SAndroid Build Coastguard Worker .sr(1)
353*4bdc9457SAndroid Build Coastguard Worker .m(3)
354*4bdc9457SAndroid Build Coastguard Worker .n(8)
355*4bdc9457SAndroid Build Coastguard Worker .k(4)
356*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
357*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
358*4bdc9457SAndroid Build Coastguard Worker }
359*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,k_eq_4_strided_a)360*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, k_eq_4_strided_a) {
361*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
362*4bdc9457SAndroid Build Coastguard Worker .mr(3)
363*4bdc9457SAndroid Build Coastguard Worker .nr(8)
364*4bdc9457SAndroid Build Coastguard Worker .kr(1)
365*4bdc9457SAndroid Build Coastguard Worker .sr(1)
366*4bdc9457SAndroid Build Coastguard Worker .m(3)
367*4bdc9457SAndroid Build Coastguard Worker .n(8)
368*4bdc9457SAndroid Build Coastguard Worker .k(4)
369*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
370*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
371*4bdc9457SAndroid Build Coastguard Worker }
372*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,k_eq_4_subtile)373*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, k_eq_4_subtile) {
374*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
375*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
376*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
377*4bdc9457SAndroid Build Coastguard Worker .mr(3)
378*4bdc9457SAndroid Build Coastguard Worker .nr(8)
379*4bdc9457SAndroid Build Coastguard Worker .kr(1)
380*4bdc9457SAndroid Build Coastguard Worker .sr(1)
381*4bdc9457SAndroid Build Coastguard Worker .m(m)
382*4bdc9457SAndroid Build Coastguard Worker .n(n)
383*4bdc9457SAndroid Build Coastguard Worker .k(4)
384*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
385*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
386*4bdc9457SAndroid Build Coastguard Worker }
387*4bdc9457SAndroid Build Coastguard Worker }
388*4bdc9457SAndroid Build Coastguard Worker }
389*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,k_eq_4_subtile_m)390*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, k_eq_4_subtile_m) {
391*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
392*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
393*4bdc9457SAndroid Build Coastguard Worker .mr(3)
394*4bdc9457SAndroid Build Coastguard Worker .nr(8)
395*4bdc9457SAndroid Build Coastguard Worker .kr(1)
396*4bdc9457SAndroid Build Coastguard Worker .sr(1)
397*4bdc9457SAndroid Build Coastguard Worker .m(m)
398*4bdc9457SAndroid Build Coastguard Worker .n(8)
399*4bdc9457SAndroid Build Coastguard Worker .k(4)
400*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
401*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
402*4bdc9457SAndroid Build Coastguard Worker }
403*4bdc9457SAndroid Build Coastguard Worker }
404*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,k_eq_4_subtile_n)405*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, k_eq_4_subtile_n) {
406*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
407*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
408*4bdc9457SAndroid Build Coastguard Worker .mr(3)
409*4bdc9457SAndroid Build Coastguard Worker .nr(8)
410*4bdc9457SAndroid Build Coastguard Worker .kr(1)
411*4bdc9457SAndroid Build Coastguard Worker .sr(1)
412*4bdc9457SAndroid Build Coastguard Worker .m(3)
413*4bdc9457SAndroid Build Coastguard Worker .n(n)
414*4bdc9457SAndroid Build Coastguard Worker .k(4)
415*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
416*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
417*4bdc9457SAndroid Build Coastguard Worker }
418*4bdc9457SAndroid Build Coastguard Worker }
419*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,k_lt_4)420*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, k_lt_4) {
421*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
422*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
423*4bdc9457SAndroid Build Coastguard Worker .mr(3)
424*4bdc9457SAndroid Build Coastguard Worker .nr(8)
425*4bdc9457SAndroid Build Coastguard Worker .kr(1)
426*4bdc9457SAndroid Build Coastguard Worker .sr(1)
427*4bdc9457SAndroid Build Coastguard Worker .m(3)
428*4bdc9457SAndroid Build Coastguard Worker .n(8)
429*4bdc9457SAndroid Build Coastguard Worker .k(k)
430*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
431*4bdc9457SAndroid Build Coastguard Worker }
432*4bdc9457SAndroid Build Coastguard Worker }
433*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,k_lt_4_strided_a)434*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, k_lt_4_strided_a) {
435*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
436*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
437*4bdc9457SAndroid Build Coastguard Worker .mr(3)
438*4bdc9457SAndroid Build Coastguard Worker .nr(8)
439*4bdc9457SAndroid Build Coastguard Worker .kr(1)
440*4bdc9457SAndroid Build Coastguard Worker .sr(1)
441*4bdc9457SAndroid Build Coastguard Worker .m(3)
442*4bdc9457SAndroid Build Coastguard Worker .n(8)
443*4bdc9457SAndroid Build Coastguard Worker .k(k)
444*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
445*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
446*4bdc9457SAndroid Build Coastguard Worker }
447*4bdc9457SAndroid Build Coastguard Worker }
448*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,k_lt_4_subtile)449*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, k_lt_4_subtile) {
450*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
451*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
452*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
453*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
454*4bdc9457SAndroid Build Coastguard Worker .mr(3)
455*4bdc9457SAndroid Build Coastguard Worker .nr(8)
456*4bdc9457SAndroid Build Coastguard Worker .kr(1)
457*4bdc9457SAndroid Build Coastguard Worker .sr(1)
458*4bdc9457SAndroid Build Coastguard Worker .m(m)
459*4bdc9457SAndroid Build Coastguard Worker .n(n)
460*4bdc9457SAndroid Build Coastguard Worker .k(k)
461*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
462*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
463*4bdc9457SAndroid Build Coastguard Worker }
464*4bdc9457SAndroid Build Coastguard Worker }
465*4bdc9457SAndroid Build Coastguard Worker }
466*4bdc9457SAndroid Build Coastguard Worker }
467*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,k_gt_4)468*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, k_gt_4) {
469*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
470*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
471*4bdc9457SAndroid Build Coastguard Worker .mr(3)
472*4bdc9457SAndroid Build Coastguard Worker .nr(8)
473*4bdc9457SAndroid Build Coastguard Worker .kr(1)
474*4bdc9457SAndroid Build Coastguard Worker .sr(1)
475*4bdc9457SAndroid Build Coastguard Worker .m(3)
476*4bdc9457SAndroid Build Coastguard Worker .n(8)
477*4bdc9457SAndroid Build Coastguard Worker .k(k)
478*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
479*4bdc9457SAndroid Build Coastguard Worker }
480*4bdc9457SAndroid Build Coastguard Worker }
481*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,k_gt_4_strided_a)482*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, k_gt_4_strided_a) {
483*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
484*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
485*4bdc9457SAndroid Build Coastguard Worker .mr(3)
486*4bdc9457SAndroid Build Coastguard Worker .nr(8)
487*4bdc9457SAndroid Build Coastguard Worker .kr(1)
488*4bdc9457SAndroid Build Coastguard Worker .sr(1)
489*4bdc9457SAndroid Build Coastguard Worker .m(3)
490*4bdc9457SAndroid Build Coastguard Worker .n(8)
491*4bdc9457SAndroid Build Coastguard Worker .k(k)
492*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
493*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
494*4bdc9457SAndroid Build Coastguard Worker }
495*4bdc9457SAndroid Build Coastguard Worker }
496*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,k_gt_4_subtile)497*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, k_gt_4_subtile) {
498*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
499*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
500*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
501*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
502*4bdc9457SAndroid Build Coastguard Worker .mr(3)
503*4bdc9457SAndroid Build Coastguard Worker .nr(8)
504*4bdc9457SAndroid Build Coastguard Worker .kr(1)
505*4bdc9457SAndroid Build Coastguard Worker .sr(1)
506*4bdc9457SAndroid Build Coastguard Worker .m(m)
507*4bdc9457SAndroid Build Coastguard Worker .n(n)
508*4bdc9457SAndroid Build Coastguard Worker .k(k)
509*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
510*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
511*4bdc9457SAndroid Build Coastguard Worker }
512*4bdc9457SAndroid Build Coastguard Worker }
513*4bdc9457SAndroid Build Coastguard Worker }
514*4bdc9457SAndroid Build Coastguard Worker }
515*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,k_div_4)516*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, k_div_4) {
517*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
518*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
519*4bdc9457SAndroid Build Coastguard Worker .mr(3)
520*4bdc9457SAndroid Build Coastguard Worker .nr(8)
521*4bdc9457SAndroid Build Coastguard Worker .kr(1)
522*4bdc9457SAndroid Build Coastguard Worker .sr(1)
523*4bdc9457SAndroid Build Coastguard Worker .m(3)
524*4bdc9457SAndroid Build Coastguard Worker .n(8)
525*4bdc9457SAndroid Build Coastguard Worker .k(k)
526*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
527*4bdc9457SAndroid Build Coastguard Worker }
528*4bdc9457SAndroid Build Coastguard Worker }
529*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,k_div_4_strided_a)530*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, k_div_4_strided_a) {
531*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
532*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
533*4bdc9457SAndroid Build Coastguard Worker .mr(3)
534*4bdc9457SAndroid Build Coastguard Worker .nr(8)
535*4bdc9457SAndroid Build Coastguard Worker .kr(1)
536*4bdc9457SAndroid Build Coastguard Worker .sr(1)
537*4bdc9457SAndroid Build Coastguard Worker .m(3)
538*4bdc9457SAndroid Build Coastguard Worker .n(8)
539*4bdc9457SAndroid Build Coastguard Worker .k(k)
540*4bdc9457SAndroid Build Coastguard Worker .a_stride(43)
541*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
542*4bdc9457SAndroid Build Coastguard Worker }
543*4bdc9457SAndroid Build Coastguard Worker }
544*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,k_div_4_subtile)545*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, k_div_4_subtile) {
546*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
547*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
548*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
549*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
550*4bdc9457SAndroid Build Coastguard Worker .mr(3)
551*4bdc9457SAndroid Build Coastguard Worker .nr(8)
552*4bdc9457SAndroid Build Coastguard Worker .kr(1)
553*4bdc9457SAndroid Build Coastguard Worker .sr(1)
554*4bdc9457SAndroid Build Coastguard Worker .m(m)
555*4bdc9457SAndroid Build Coastguard Worker .n(n)
556*4bdc9457SAndroid Build Coastguard Worker .k(k)
557*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
558*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
559*4bdc9457SAndroid Build Coastguard Worker }
560*4bdc9457SAndroid Build Coastguard Worker }
561*4bdc9457SAndroid Build Coastguard Worker }
562*4bdc9457SAndroid Build Coastguard Worker }
563*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,n_gt_8)564*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, n_gt_8) {
565*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
566*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
567*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
568*4bdc9457SAndroid Build Coastguard Worker .mr(3)
569*4bdc9457SAndroid Build Coastguard Worker .nr(8)
570*4bdc9457SAndroid Build Coastguard Worker .kr(1)
571*4bdc9457SAndroid Build Coastguard Worker .sr(1)
572*4bdc9457SAndroid Build Coastguard Worker .m(3)
573*4bdc9457SAndroid Build Coastguard Worker .n(n)
574*4bdc9457SAndroid Build Coastguard Worker .k(k)
575*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
576*4bdc9457SAndroid Build Coastguard Worker }
577*4bdc9457SAndroid Build Coastguard Worker }
578*4bdc9457SAndroid Build Coastguard Worker }
579*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,n_gt_8_strided_cn)580*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, n_gt_8_strided_cn) {
581*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
582*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
583*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
584*4bdc9457SAndroid Build Coastguard Worker .mr(3)
585*4bdc9457SAndroid Build Coastguard Worker .nr(8)
586*4bdc9457SAndroid Build Coastguard Worker .kr(1)
587*4bdc9457SAndroid Build Coastguard Worker .sr(1)
588*4bdc9457SAndroid Build Coastguard Worker .m(3)
589*4bdc9457SAndroid Build Coastguard Worker .n(n)
590*4bdc9457SAndroid Build Coastguard Worker .k(k)
591*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
592*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
593*4bdc9457SAndroid Build Coastguard Worker }
594*4bdc9457SAndroid Build Coastguard Worker }
595*4bdc9457SAndroid Build Coastguard Worker }
596*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,n_gt_8_strided_a)597*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, n_gt_8_strided_a) {
598*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
599*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
600*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
601*4bdc9457SAndroid Build Coastguard Worker .mr(3)
602*4bdc9457SAndroid Build Coastguard Worker .nr(8)
603*4bdc9457SAndroid Build Coastguard Worker .kr(1)
604*4bdc9457SAndroid Build Coastguard Worker .sr(1)
605*4bdc9457SAndroid Build Coastguard Worker .m(3)
606*4bdc9457SAndroid Build Coastguard Worker .n(n)
607*4bdc9457SAndroid Build Coastguard Worker .k(k)
608*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
609*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
610*4bdc9457SAndroid Build Coastguard Worker }
611*4bdc9457SAndroid Build Coastguard Worker }
612*4bdc9457SAndroid Build Coastguard Worker }
613*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,n_gt_8_subtile)614*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, n_gt_8_subtile) {
615*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
616*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
617*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
618*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
619*4bdc9457SAndroid Build Coastguard Worker .mr(3)
620*4bdc9457SAndroid Build Coastguard Worker .nr(8)
621*4bdc9457SAndroid Build Coastguard Worker .kr(1)
622*4bdc9457SAndroid Build Coastguard Worker .sr(1)
623*4bdc9457SAndroid Build Coastguard Worker .m(m)
624*4bdc9457SAndroid Build Coastguard Worker .n(n)
625*4bdc9457SAndroid Build Coastguard Worker .k(k)
626*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
627*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
628*4bdc9457SAndroid Build Coastguard Worker }
629*4bdc9457SAndroid Build Coastguard Worker }
630*4bdc9457SAndroid Build Coastguard Worker }
631*4bdc9457SAndroid Build Coastguard Worker }
632*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,n_div_8)633*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, n_div_8) {
634*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
635*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
636*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
637*4bdc9457SAndroid Build Coastguard Worker .mr(3)
638*4bdc9457SAndroid Build Coastguard Worker .nr(8)
639*4bdc9457SAndroid Build Coastguard Worker .kr(1)
640*4bdc9457SAndroid Build Coastguard Worker .sr(1)
641*4bdc9457SAndroid Build Coastguard Worker .m(3)
642*4bdc9457SAndroid Build Coastguard Worker .n(n)
643*4bdc9457SAndroid Build Coastguard Worker .k(k)
644*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
645*4bdc9457SAndroid Build Coastguard Worker }
646*4bdc9457SAndroid Build Coastguard Worker }
647*4bdc9457SAndroid Build Coastguard Worker }
648*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,n_div_8_strided_cn)649*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, n_div_8_strided_cn) {
650*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
651*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
652*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
653*4bdc9457SAndroid Build Coastguard Worker .mr(3)
654*4bdc9457SAndroid Build Coastguard Worker .nr(8)
655*4bdc9457SAndroid Build Coastguard Worker .kr(1)
656*4bdc9457SAndroid Build Coastguard Worker .sr(1)
657*4bdc9457SAndroid Build Coastguard Worker .m(3)
658*4bdc9457SAndroid Build Coastguard Worker .n(n)
659*4bdc9457SAndroid Build Coastguard Worker .k(k)
660*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
661*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
662*4bdc9457SAndroid Build Coastguard Worker }
663*4bdc9457SAndroid Build Coastguard Worker }
664*4bdc9457SAndroid Build Coastguard Worker }
665*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,n_div_8_strided_a)666*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, n_div_8_strided_a) {
667*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
668*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
669*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
670*4bdc9457SAndroid Build Coastguard Worker .mr(3)
671*4bdc9457SAndroid Build Coastguard Worker .nr(8)
672*4bdc9457SAndroid Build Coastguard Worker .kr(1)
673*4bdc9457SAndroid Build Coastguard Worker .sr(1)
674*4bdc9457SAndroid Build Coastguard Worker .m(3)
675*4bdc9457SAndroid Build Coastguard Worker .n(n)
676*4bdc9457SAndroid Build Coastguard Worker .k(k)
677*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
678*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
679*4bdc9457SAndroid Build Coastguard Worker }
680*4bdc9457SAndroid Build Coastguard Worker }
681*4bdc9457SAndroid Build Coastguard Worker }
682*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,n_div_8_subtile)683*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, n_div_8_subtile) {
684*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
685*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
686*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
687*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
688*4bdc9457SAndroid Build Coastguard Worker .mr(3)
689*4bdc9457SAndroid Build Coastguard Worker .nr(8)
690*4bdc9457SAndroid Build Coastguard Worker .kr(1)
691*4bdc9457SAndroid Build Coastguard Worker .sr(1)
692*4bdc9457SAndroid Build Coastguard Worker .m(m)
693*4bdc9457SAndroid Build Coastguard Worker .n(n)
694*4bdc9457SAndroid Build Coastguard Worker .k(k)
695*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
696*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
697*4bdc9457SAndroid Build Coastguard Worker }
698*4bdc9457SAndroid Build Coastguard Worker }
699*4bdc9457SAndroid Build Coastguard Worker }
700*4bdc9457SAndroid Build Coastguard Worker }
701*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,strided_cm_subtile)702*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, strided_cm_subtile) {
703*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
704*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
705*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
706*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
707*4bdc9457SAndroid Build Coastguard Worker .mr(3)
708*4bdc9457SAndroid Build Coastguard Worker .nr(8)
709*4bdc9457SAndroid Build Coastguard Worker .kr(1)
710*4bdc9457SAndroid Build Coastguard Worker .sr(1)
711*4bdc9457SAndroid Build Coastguard Worker .m(m)
712*4bdc9457SAndroid Build Coastguard Worker .n(n)
713*4bdc9457SAndroid Build Coastguard Worker .k(k)
714*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
715*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
716*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
717*4bdc9457SAndroid Build Coastguard Worker }
718*4bdc9457SAndroid Build Coastguard Worker }
719*4bdc9457SAndroid Build Coastguard Worker }
720*4bdc9457SAndroid Build Coastguard Worker }
721*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT,strided_cm)722*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMSIMD_SPLAT, strided_cm) {
723*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
724*4bdc9457SAndroid Build Coastguard Worker .mr(3)
725*4bdc9457SAndroid Build Coastguard Worker .nr(8)
726*4bdc9457SAndroid Build Coastguard Worker .kr(1)
727*4bdc9457SAndroid Build Coastguard Worker .sr(1)
728*4bdc9457SAndroid Build Coastguard Worker .m(3)
729*4bdc9457SAndroid Build Coastguard Worker .n(8)
730*4bdc9457SAndroid Build Coastguard Worker .k(4)
731*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
732*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat);
733*4bdc9457SAndroid Build Coastguard Worker }
734*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
735*4bdc9457SAndroid Build Coastguard Worker
736*4bdc9457SAndroid Build Coastguard Worker
737*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,k_eq_4)738*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, k_eq_4) {
739*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
740*4bdc9457SAndroid Build Coastguard Worker .mr(3)
741*4bdc9457SAndroid Build Coastguard Worker .nr(8)
742*4bdc9457SAndroid Build Coastguard Worker .kr(1)
743*4bdc9457SAndroid Build Coastguard Worker .sr(4)
744*4bdc9457SAndroid Build Coastguard Worker .m(3)
745*4bdc9457SAndroid Build Coastguard Worker .n(8)
746*4bdc9457SAndroid Build Coastguard Worker .k(4)
747*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
748*4bdc9457SAndroid Build Coastguard Worker }
749*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,strided_cn)750*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, strided_cn) {
751*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
752*4bdc9457SAndroid Build Coastguard Worker .mr(3)
753*4bdc9457SAndroid Build Coastguard Worker .nr(8)
754*4bdc9457SAndroid Build Coastguard Worker .kr(1)
755*4bdc9457SAndroid Build Coastguard Worker .sr(4)
756*4bdc9457SAndroid Build Coastguard Worker .m(3)
757*4bdc9457SAndroid Build Coastguard Worker .n(8)
758*4bdc9457SAndroid Build Coastguard Worker .k(4)
759*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
760*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
761*4bdc9457SAndroid Build Coastguard Worker }
762*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,k_eq_4_strided_a)763*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, k_eq_4_strided_a) {
764*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
765*4bdc9457SAndroid Build Coastguard Worker .mr(3)
766*4bdc9457SAndroid Build Coastguard Worker .nr(8)
767*4bdc9457SAndroid Build Coastguard Worker .kr(1)
768*4bdc9457SAndroid Build Coastguard Worker .sr(4)
769*4bdc9457SAndroid Build Coastguard Worker .m(3)
770*4bdc9457SAndroid Build Coastguard Worker .n(8)
771*4bdc9457SAndroid Build Coastguard Worker .k(4)
772*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
773*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
774*4bdc9457SAndroid Build Coastguard Worker }
775*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,k_eq_4_subtile)776*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, k_eq_4_subtile) {
777*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
778*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
779*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
780*4bdc9457SAndroid Build Coastguard Worker .mr(3)
781*4bdc9457SAndroid Build Coastguard Worker .nr(8)
782*4bdc9457SAndroid Build Coastguard Worker .kr(1)
783*4bdc9457SAndroid Build Coastguard Worker .sr(4)
784*4bdc9457SAndroid Build Coastguard Worker .m(m)
785*4bdc9457SAndroid Build Coastguard Worker .n(n)
786*4bdc9457SAndroid Build Coastguard Worker .k(4)
787*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
788*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
789*4bdc9457SAndroid Build Coastguard Worker }
790*4bdc9457SAndroid Build Coastguard Worker }
791*4bdc9457SAndroid Build Coastguard Worker }
792*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,k_eq_4_subtile_m)793*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, k_eq_4_subtile_m) {
794*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
795*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
796*4bdc9457SAndroid Build Coastguard Worker .mr(3)
797*4bdc9457SAndroid Build Coastguard Worker .nr(8)
798*4bdc9457SAndroid Build Coastguard Worker .kr(1)
799*4bdc9457SAndroid Build Coastguard Worker .sr(4)
800*4bdc9457SAndroid Build Coastguard Worker .m(m)
801*4bdc9457SAndroid Build Coastguard Worker .n(8)
802*4bdc9457SAndroid Build Coastguard Worker .k(4)
803*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
804*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
805*4bdc9457SAndroid Build Coastguard Worker }
806*4bdc9457SAndroid Build Coastguard Worker }
807*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,k_eq_4_subtile_n)808*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, k_eq_4_subtile_n) {
809*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
810*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
811*4bdc9457SAndroid Build Coastguard Worker .mr(3)
812*4bdc9457SAndroid Build Coastguard Worker .nr(8)
813*4bdc9457SAndroid Build Coastguard Worker .kr(1)
814*4bdc9457SAndroid Build Coastguard Worker .sr(4)
815*4bdc9457SAndroid Build Coastguard Worker .m(3)
816*4bdc9457SAndroid Build Coastguard Worker .n(n)
817*4bdc9457SAndroid Build Coastguard Worker .k(4)
818*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
819*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
820*4bdc9457SAndroid Build Coastguard Worker }
821*4bdc9457SAndroid Build Coastguard Worker }
822*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,k_lt_4)823*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, k_lt_4) {
824*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
825*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
826*4bdc9457SAndroid Build Coastguard Worker .mr(3)
827*4bdc9457SAndroid Build Coastguard Worker .nr(8)
828*4bdc9457SAndroid Build Coastguard Worker .kr(1)
829*4bdc9457SAndroid Build Coastguard Worker .sr(4)
830*4bdc9457SAndroid Build Coastguard Worker .m(3)
831*4bdc9457SAndroid Build Coastguard Worker .n(8)
832*4bdc9457SAndroid Build Coastguard Worker .k(k)
833*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
834*4bdc9457SAndroid Build Coastguard Worker }
835*4bdc9457SAndroid Build Coastguard Worker }
836*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,k_lt_4_strided_a)837*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, k_lt_4_strided_a) {
838*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
839*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
840*4bdc9457SAndroid Build Coastguard Worker .mr(3)
841*4bdc9457SAndroid Build Coastguard Worker .nr(8)
842*4bdc9457SAndroid Build Coastguard Worker .kr(1)
843*4bdc9457SAndroid Build Coastguard Worker .sr(4)
844*4bdc9457SAndroid Build Coastguard Worker .m(3)
845*4bdc9457SAndroid Build Coastguard Worker .n(8)
846*4bdc9457SAndroid Build Coastguard Worker .k(k)
847*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
848*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
849*4bdc9457SAndroid Build Coastguard Worker }
850*4bdc9457SAndroid Build Coastguard Worker }
851*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,k_lt_4_subtile)852*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, k_lt_4_subtile) {
853*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
854*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
855*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
856*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
857*4bdc9457SAndroid Build Coastguard Worker .mr(3)
858*4bdc9457SAndroid Build Coastguard Worker .nr(8)
859*4bdc9457SAndroid Build Coastguard Worker .kr(1)
860*4bdc9457SAndroid Build Coastguard Worker .sr(4)
861*4bdc9457SAndroid Build Coastguard Worker .m(m)
862*4bdc9457SAndroid Build Coastguard Worker .n(n)
863*4bdc9457SAndroid Build Coastguard Worker .k(k)
864*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
865*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
866*4bdc9457SAndroid Build Coastguard Worker }
867*4bdc9457SAndroid Build Coastguard Worker }
868*4bdc9457SAndroid Build Coastguard Worker }
869*4bdc9457SAndroid Build Coastguard Worker }
870*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,k_gt_4)871*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, k_gt_4) {
872*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
873*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
874*4bdc9457SAndroid Build Coastguard Worker .mr(3)
875*4bdc9457SAndroid Build Coastguard Worker .nr(8)
876*4bdc9457SAndroid Build Coastguard Worker .kr(1)
877*4bdc9457SAndroid Build Coastguard Worker .sr(4)
878*4bdc9457SAndroid Build Coastguard Worker .m(3)
879*4bdc9457SAndroid Build Coastguard Worker .n(8)
880*4bdc9457SAndroid Build Coastguard Worker .k(k)
881*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
882*4bdc9457SAndroid Build Coastguard Worker }
883*4bdc9457SAndroid Build Coastguard Worker }
884*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,k_gt_4_strided_a)885*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, k_gt_4_strided_a) {
886*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
887*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
888*4bdc9457SAndroid Build Coastguard Worker .mr(3)
889*4bdc9457SAndroid Build Coastguard Worker .nr(8)
890*4bdc9457SAndroid Build Coastguard Worker .kr(1)
891*4bdc9457SAndroid Build Coastguard Worker .sr(4)
892*4bdc9457SAndroid Build Coastguard Worker .m(3)
893*4bdc9457SAndroid Build Coastguard Worker .n(8)
894*4bdc9457SAndroid Build Coastguard Worker .k(k)
895*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
896*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
897*4bdc9457SAndroid Build Coastguard Worker }
898*4bdc9457SAndroid Build Coastguard Worker }
899*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,k_gt_4_subtile)900*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, k_gt_4_subtile) {
901*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
902*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
903*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
904*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
905*4bdc9457SAndroid Build Coastguard Worker .mr(3)
906*4bdc9457SAndroid Build Coastguard Worker .nr(8)
907*4bdc9457SAndroid Build Coastguard Worker .kr(1)
908*4bdc9457SAndroid Build Coastguard Worker .sr(4)
909*4bdc9457SAndroid Build Coastguard Worker .m(m)
910*4bdc9457SAndroid Build Coastguard Worker .n(n)
911*4bdc9457SAndroid Build Coastguard Worker .k(k)
912*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
913*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
914*4bdc9457SAndroid Build Coastguard Worker }
915*4bdc9457SAndroid Build Coastguard Worker }
916*4bdc9457SAndroid Build Coastguard Worker }
917*4bdc9457SAndroid Build Coastguard Worker }
918*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,k_div_4)919*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, k_div_4) {
920*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
921*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
922*4bdc9457SAndroid Build Coastguard Worker .mr(3)
923*4bdc9457SAndroid Build Coastguard Worker .nr(8)
924*4bdc9457SAndroid Build Coastguard Worker .kr(1)
925*4bdc9457SAndroid Build Coastguard Worker .sr(4)
926*4bdc9457SAndroid Build Coastguard Worker .m(3)
927*4bdc9457SAndroid Build Coastguard Worker .n(8)
928*4bdc9457SAndroid Build Coastguard Worker .k(k)
929*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
930*4bdc9457SAndroid Build Coastguard Worker }
931*4bdc9457SAndroid Build Coastguard Worker }
932*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,k_div_4_strided_a)933*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, k_div_4_strided_a) {
934*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
935*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
936*4bdc9457SAndroid Build Coastguard Worker .mr(3)
937*4bdc9457SAndroid Build Coastguard Worker .nr(8)
938*4bdc9457SAndroid Build Coastguard Worker .kr(1)
939*4bdc9457SAndroid Build Coastguard Worker .sr(4)
940*4bdc9457SAndroid Build Coastguard Worker .m(3)
941*4bdc9457SAndroid Build Coastguard Worker .n(8)
942*4bdc9457SAndroid Build Coastguard Worker .k(k)
943*4bdc9457SAndroid Build Coastguard Worker .a_stride(43)
944*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
945*4bdc9457SAndroid Build Coastguard Worker }
946*4bdc9457SAndroid Build Coastguard Worker }
947*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,k_div_4_subtile)948*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, k_div_4_subtile) {
949*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
950*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
951*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
952*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
953*4bdc9457SAndroid Build Coastguard Worker .mr(3)
954*4bdc9457SAndroid Build Coastguard Worker .nr(8)
955*4bdc9457SAndroid Build Coastguard Worker .kr(1)
956*4bdc9457SAndroid Build Coastguard Worker .sr(4)
957*4bdc9457SAndroid Build Coastguard Worker .m(m)
958*4bdc9457SAndroid Build Coastguard Worker .n(n)
959*4bdc9457SAndroid Build Coastguard Worker .k(k)
960*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
961*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
962*4bdc9457SAndroid Build Coastguard Worker }
963*4bdc9457SAndroid Build Coastguard Worker }
964*4bdc9457SAndroid Build Coastguard Worker }
965*4bdc9457SAndroid Build Coastguard Worker }
966*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,n_gt_8)967*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, n_gt_8) {
968*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
969*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
970*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
971*4bdc9457SAndroid Build Coastguard Worker .mr(3)
972*4bdc9457SAndroid Build Coastguard Worker .nr(8)
973*4bdc9457SAndroid Build Coastguard Worker .kr(1)
974*4bdc9457SAndroid Build Coastguard Worker .sr(4)
975*4bdc9457SAndroid Build Coastguard Worker .m(3)
976*4bdc9457SAndroid Build Coastguard Worker .n(n)
977*4bdc9457SAndroid Build Coastguard Worker .k(k)
978*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
979*4bdc9457SAndroid Build Coastguard Worker }
980*4bdc9457SAndroid Build Coastguard Worker }
981*4bdc9457SAndroid Build Coastguard Worker }
982*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,n_gt_8_strided_cn)983*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, n_gt_8_strided_cn) {
984*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
985*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
986*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
987*4bdc9457SAndroid Build Coastguard Worker .mr(3)
988*4bdc9457SAndroid Build Coastguard Worker .nr(8)
989*4bdc9457SAndroid Build Coastguard Worker .kr(1)
990*4bdc9457SAndroid Build Coastguard Worker .sr(4)
991*4bdc9457SAndroid Build Coastguard Worker .m(3)
992*4bdc9457SAndroid Build Coastguard Worker .n(n)
993*4bdc9457SAndroid Build Coastguard Worker .k(k)
994*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
995*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
996*4bdc9457SAndroid Build Coastguard Worker }
997*4bdc9457SAndroid Build Coastguard Worker }
998*4bdc9457SAndroid Build Coastguard Worker }
999*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,n_gt_8_strided_a)1000*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, n_gt_8_strided_a) {
1001*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
1002*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
1003*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1004*4bdc9457SAndroid Build Coastguard Worker .mr(3)
1005*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1006*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1007*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1008*4bdc9457SAndroid Build Coastguard Worker .m(3)
1009*4bdc9457SAndroid Build Coastguard Worker .n(n)
1010*4bdc9457SAndroid Build Coastguard Worker .k(k)
1011*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
1012*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
1013*4bdc9457SAndroid Build Coastguard Worker }
1014*4bdc9457SAndroid Build Coastguard Worker }
1015*4bdc9457SAndroid Build Coastguard Worker }
1016*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,n_gt_8_subtile)1017*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, n_gt_8_subtile) {
1018*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
1019*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
1020*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
1021*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1022*4bdc9457SAndroid Build Coastguard Worker .mr(3)
1023*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1024*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1025*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1026*4bdc9457SAndroid Build Coastguard Worker .m(m)
1027*4bdc9457SAndroid Build Coastguard Worker .n(n)
1028*4bdc9457SAndroid Build Coastguard Worker .k(k)
1029*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1030*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
1031*4bdc9457SAndroid Build Coastguard Worker }
1032*4bdc9457SAndroid Build Coastguard Worker }
1033*4bdc9457SAndroid Build Coastguard Worker }
1034*4bdc9457SAndroid Build Coastguard Worker }
1035*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,n_div_8)1036*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, n_div_8) {
1037*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
1038*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
1039*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1040*4bdc9457SAndroid Build Coastguard Worker .mr(3)
1041*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1042*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1043*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1044*4bdc9457SAndroid Build Coastguard Worker .m(3)
1045*4bdc9457SAndroid Build Coastguard Worker .n(n)
1046*4bdc9457SAndroid Build Coastguard Worker .k(k)
1047*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
1048*4bdc9457SAndroid Build Coastguard Worker }
1049*4bdc9457SAndroid Build Coastguard Worker }
1050*4bdc9457SAndroid Build Coastguard Worker }
1051*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,n_div_8_strided_cn)1052*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, n_div_8_strided_cn) {
1053*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
1054*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
1055*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1056*4bdc9457SAndroid Build Coastguard Worker .mr(3)
1057*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1058*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1059*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1060*4bdc9457SAndroid Build Coastguard Worker .m(3)
1061*4bdc9457SAndroid Build Coastguard Worker .n(n)
1062*4bdc9457SAndroid Build Coastguard Worker .k(k)
1063*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
1064*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
1065*4bdc9457SAndroid Build Coastguard Worker }
1066*4bdc9457SAndroid Build Coastguard Worker }
1067*4bdc9457SAndroid Build Coastguard Worker }
1068*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,n_div_8_strided_a)1069*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, n_div_8_strided_a) {
1070*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
1071*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
1072*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1073*4bdc9457SAndroid Build Coastguard Worker .mr(3)
1074*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1075*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1076*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1077*4bdc9457SAndroid Build Coastguard Worker .m(3)
1078*4bdc9457SAndroid Build Coastguard Worker .n(n)
1079*4bdc9457SAndroid Build Coastguard Worker .k(k)
1080*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
1081*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
1082*4bdc9457SAndroid Build Coastguard Worker }
1083*4bdc9457SAndroid Build Coastguard Worker }
1084*4bdc9457SAndroid Build Coastguard Worker }
1085*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,n_div_8_subtile)1086*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, n_div_8_subtile) {
1087*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
1088*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
1089*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
1090*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1091*4bdc9457SAndroid Build Coastguard Worker .mr(3)
1092*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1093*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1094*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1095*4bdc9457SAndroid Build Coastguard Worker .m(m)
1096*4bdc9457SAndroid Build Coastguard Worker .n(n)
1097*4bdc9457SAndroid Build Coastguard Worker .k(k)
1098*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1099*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
1100*4bdc9457SAndroid Build Coastguard Worker }
1101*4bdc9457SAndroid Build Coastguard Worker }
1102*4bdc9457SAndroid Build Coastguard Worker }
1103*4bdc9457SAndroid Build Coastguard Worker }
1104*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,strided_cm_subtile)1105*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, strided_cm_subtile) {
1106*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
1107*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
1108*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
1109*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1110*4bdc9457SAndroid Build Coastguard Worker .mr(3)
1111*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1112*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1113*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1114*4bdc9457SAndroid Build Coastguard Worker .m(m)
1115*4bdc9457SAndroid Build Coastguard Worker .n(n)
1116*4bdc9457SAndroid Build Coastguard Worker .k(k)
1117*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
1118*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1119*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
1120*4bdc9457SAndroid Build Coastguard Worker }
1121*4bdc9457SAndroid Build Coastguard Worker }
1122*4bdc9457SAndroid Build Coastguard Worker }
1123*4bdc9457SAndroid Build Coastguard Worker }
1124*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8S4__WASMSIMD,strided_cm)1125*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8S4__WASMSIMD, strided_cm) {
1126*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1127*4bdc9457SAndroid Build Coastguard Worker .mr(3)
1128*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1129*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1130*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1131*4bdc9457SAndroid Build Coastguard Worker .m(3)
1132*4bdc9457SAndroid Build Coastguard Worker .n(8)
1133*4bdc9457SAndroid Build Coastguard Worker .k(4)
1134*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
1135*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmsimd);
1136*4bdc9457SAndroid Build Coastguard Worker }
1137*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
1138*4bdc9457SAndroid Build Coastguard Worker
1139*4bdc9457SAndroid Build Coastguard Worker
1140*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,k_eq_4)1141*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, k_eq_4) {
1142*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1143*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1144*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1145*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1146*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1147*4bdc9457SAndroid Build Coastguard Worker .m(4)
1148*4bdc9457SAndroid Build Coastguard Worker .n(2)
1149*4bdc9457SAndroid Build Coastguard Worker .k(4)
1150*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1151*4bdc9457SAndroid Build Coastguard Worker }
1152*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,strided_cn)1153*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, strided_cn) {
1154*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1155*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1156*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1157*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1158*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1159*4bdc9457SAndroid Build Coastguard Worker .m(4)
1160*4bdc9457SAndroid Build Coastguard Worker .n(2)
1161*4bdc9457SAndroid Build Coastguard Worker .k(4)
1162*4bdc9457SAndroid Build Coastguard Worker .cn_stride(5)
1163*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1164*4bdc9457SAndroid Build Coastguard Worker }
1165*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,k_eq_4_strided_a)1166*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, k_eq_4_strided_a) {
1167*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1168*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1169*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1170*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1171*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1172*4bdc9457SAndroid Build Coastguard Worker .m(4)
1173*4bdc9457SAndroid Build Coastguard Worker .n(2)
1174*4bdc9457SAndroid Build Coastguard Worker .k(4)
1175*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
1176*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1177*4bdc9457SAndroid Build Coastguard Worker }
1178*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,k_eq_4_subtile)1179*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, k_eq_4_subtile) {
1180*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 2; n++) {
1181*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1182*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1183*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1184*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1185*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1186*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1187*4bdc9457SAndroid Build Coastguard Worker .m(m)
1188*4bdc9457SAndroid Build Coastguard Worker .n(n)
1189*4bdc9457SAndroid Build Coastguard Worker .k(4)
1190*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1191*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1192*4bdc9457SAndroid Build Coastguard Worker }
1193*4bdc9457SAndroid Build Coastguard Worker }
1194*4bdc9457SAndroid Build Coastguard Worker }
1195*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,k_eq_4_subtile_m)1196*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, k_eq_4_subtile_m) {
1197*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1198*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1199*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1200*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1201*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1202*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1203*4bdc9457SAndroid Build Coastguard Worker .m(m)
1204*4bdc9457SAndroid Build Coastguard Worker .n(2)
1205*4bdc9457SAndroid Build Coastguard Worker .k(4)
1206*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1207*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1208*4bdc9457SAndroid Build Coastguard Worker }
1209*4bdc9457SAndroid Build Coastguard Worker }
1210*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,k_eq_4_subtile_n)1211*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, k_eq_4_subtile_n) {
1212*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 2; n++) {
1213*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1214*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1215*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1216*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1217*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1218*4bdc9457SAndroid Build Coastguard Worker .m(4)
1219*4bdc9457SAndroid Build Coastguard Worker .n(n)
1220*4bdc9457SAndroid Build Coastguard Worker .k(4)
1221*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1222*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1223*4bdc9457SAndroid Build Coastguard Worker }
1224*4bdc9457SAndroid Build Coastguard Worker }
1225*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,k_lt_4)1226*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, k_lt_4) {
1227*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
1228*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1229*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1230*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1231*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1232*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1233*4bdc9457SAndroid Build Coastguard Worker .m(4)
1234*4bdc9457SAndroid Build Coastguard Worker .n(2)
1235*4bdc9457SAndroid Build Coastguard Worker .k(k)
1236*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1237*4bdc9457SAndroid Build Coastguard Worker }
1238*4bdc9457SAndroid Build Coastguard Worker }
1239*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,k_lt_4_strided_a)1240*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, k_lt_4_strided_a) {
1241*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
1242*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1243*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1244*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1245*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1246*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1247*4bdc9457SAndroid Build Coastguard Worker .m(4)
1248*4bdc9457SAndroid Build Coastguard Worker .n(2)
1249*4bdc9457SAndroid Build Coastguard Worker .k(k)
1250*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
1251*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1252*4bdc9457SAndroid Build Coastguard Worker }
1253*4bdc9457SAndroid Build Coastguard Worker }
1254*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,k_lt_4_subtile)1255*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, k_lt_4_subtile) {
1256*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
1257*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 2; n++) {
1258*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1259*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1260*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1261*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1262*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1263*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1264*4bdc9457SAndroid Build Coastguard Worker .m(m)
1265*4bdc9457SAndroid Build Coastguard Worker .n(n)
1266*4bdc9457SAndroid Build Coastguard Worker .k(k)
1267*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1268*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1269*4bdc9457SAndroid Build Coastguard Worker }
1270*4bdc9457SAndroid Build Coastguard Worker }
1271*4bdc9457SAndroid Build Coastguard Worker }
1272*4bdc9457SAndroid Build Coastguard Worker }
1273*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,k_gt_4)1274*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, k_gt_4) {
1275*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
1276*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1277*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1278*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1279*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1280*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1281*4bdc9457SAndroid Build Coastguard Worker .m(4)
1282*4bdc9457SAndroid Build Coastguard Worker .n(2)
1283*4bdc9457SAndroid Build Coastguard Worker .k(k)
1284*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1285*4bdc9457SAndroid Build Coastguard Worker }
1286*4bdc9457SAndroid Build Coastguard Worker }
1287*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,k_gt_4_strided_a)1288*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, k_gt_4_strided_a) {
1289*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
1290*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1291*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1292*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1293*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1294*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1295*4bdc9457SAndroid Build Coastguard Worker .m(4)
1296*4bdc9457SAndroid Build Coastguard Worker .n(2)
1297*4bdc9457SAndroid Build Coastguard Worker .k(k)
1298*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
1299*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1300*4bdc9457SAndroid Build Coastguard Worker }
1301*4bdc9457SAndroid Build Coastguard Worker }
1302*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,k_gt_4_subtile)1303*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, k_gt_4_subtile) {
1304*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
1305*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 2; n++) {
1306*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1307*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1308*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1309*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1310*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1311*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1312*4bdc9457SAndroid Build Coastguard Worker .m(m)
1313*4bdc9457SAndroid Build Coastguard Worker .n(n)
1314*4bdc9457SAndroid Build Coastguard Worker .k(k)
1315*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1316*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1317*4bdc9457SAndroid Build Coastguard Worker }
1318*4bdc9457SAndroid Build Coastguard Worker }
1319*4bdc9457SAndroid Build Coastguard Worker }
1320*4bdc9457SAndroid Build Coastguard Worker }
1321*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,k_div_4)1322*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, k_div_4) {
1323*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
1324*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1325*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1326*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1327*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1328*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1329*4bdc9457SAndroid Build Coastguard Worker .m(4)
1330*4bdc9457SAndroid Build Coastguard Worker .n(2)
1331*4bdc9457SAndroid Build Coastguard Worker .k(k)
1332*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1333*4bdc9457SAndroid Build Coastguard Worker }
1334*4bdc9457SAndroid Build Coastguard Worker }
1335*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,k_div_4_strided_a)1336*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, k_div_4_strided_a) {
1337*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
1338*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1339*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1340*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1341*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1342*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1343*4bdc9457SAndroid Build Coastguard Worker .m(4)
1344*4bdc9457SAndroid Build Coastguard Worker .n(2)
1345*4bdc9457SAndroid Build Coastguard Worker .k(k)
1346*4bdc9457SAndroid Build Coastguard Worker .a_stride(43)
1347*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1348*4bdc9457SAndroid Build Coastguard Worker }
1349*4bdc9457SAndroid Build Coastguard Worker }
1350*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,k_div_4_subtile)1351*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, k_div_4_subtile) {
1352*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
1353*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 2; n++) {
1354*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1355*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1356*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1357*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1358*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1359*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1360*4bdc9457SAndroid Build Coastguard Worker .m(m)
1361*4bdc9457SAndroid Build Coastguard Worker .n(n)
1362*4bdc9457SAndroid Build Coastguard Worker .k(k)
1363*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1364*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1365*4bdc9457SAndroid Build Coastguard Worker }
1366*4bdc9457SAndroid Build Coastguard Worker }
1367*4bdc9457SAndroid Build Coastguard Worker }
1368*4bdc9457SAndroid Build Coastguard Worker }
1369*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,n_gt_2)1370*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, n_gt_2) {
1371*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 3; n < 4; n++) {
1372*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
1373*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1374*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1375*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1376*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1377*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1378*4bdc9457SAndroid Build Coastguard Worker .m(4)
1379*4bdc9457SAndroid Build Coastguard Worker .n(n)
1380*4bdc9457SAndroid Build Coastguard Worker .k(k)
1381*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1382*4bdc9457SAndroid Build Coastguard Worker }
1383*4bdc9457SAndroid Build Coastguard Worker }
1384*4bdc9457SAndroid Build Coastguard Worker }
1385*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,n_gt_2_strided_cn)1386*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, n_gt_2_strided_cn) {
1387*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 3; n < 4; n++) {
1388*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
1389*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1390*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1391*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1392*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1393*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1394*4bdc9457SAndroid Build Coastguard Worker .m(4)
1395*4bdc9457SAndroid Build Coastguard Worker .n(n)
1396*4bdc9457SAndroid Build Coastguard Worker .k(k)
1397*4bdc9457SAndroid Build Coastguard Worker .cn_stride(5)
1398*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1399*4bdc9457SAndroid Build Coastguard Worker }
1400*4bdc9457SAndroid Build Coastguard Worker }
1401*4bdc9457SAndroid Build Coastguard Worker }
1402*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,n_gt_2_strided_a)1403*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, n_gt_2_strided_a) {
1404*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 3; n < 4; n++) {
1405*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
1406*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1407*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1408*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1409*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1410*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1411*4bdc9457SAndroid Build Coastguard Worker .m(4)
1412*4bdc9457SAndroid Build Coastguard Worker .n(n)
1413*4bdc9457SAndroid Build Coastguard Worker .k(k)
1414*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
1415*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1416*4bdc9457SAndroid Build Coastguard Worker }
1417*4bdc9457SAndroid Build Coastguard Worker }
1418*4bdc9457SAndroid Build Coastguard Worker }
1419*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,n_gt_2_subtile)1420*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, n_gt_2_subtile) {
1421*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 3; n < 4; n++) {
1422*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
1423*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1424*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1425*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1426*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1427*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1428*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1429*4bdc9457SAndroid Build Coastguard Worker .m(m)
1430*4bdc9457SAndroid Build Coastguard Worker .n(n)
1431*4bdc9457SAndroid Build Coastguard Worker .k(k)
1432*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1433*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1434*4bdc9457SAndroid Build Coastguard Worker }
1435*4bdc9457SAndroid Build Coastguard Worker }
1436*4bdc9457SAndroid Build Coastguard Worker }
1437*4bdc9457SAndroid Build Coastguard Worker }
1438*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,n_div_2)1439*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, n_div_2) {
1440*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 4; n <= 6; n += 2) {
1441*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
1442*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1443*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1444*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1445*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1446*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1447*4bdc9457SAndroid Build Coastguard Worker .m(4)
1448*4bdc9457SAndroid Build Coastguard Worker .n(n)
1449*4bdc9457SAndroid Build Coastguard Worker .k(k)
1450*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1451*4bdc9457SAndroid Build Coastguard Worker }
1452*4bdc9457SAndroid Build Coastguard Worker }
1453*4bdc9457SAndroid Build Coastguard Worker }
1454*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,n_div_2_strided_cn)1455*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, n_div_2_strided_cn) {
1456*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 4; n <= 6; n += 2) {
1457*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
1458*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1459*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1460*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1461*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1462*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1463*4bdc9457SAndroid Build Coastguard Worker .m(4)
1464*4bdc9457SAndroid Build Coastguard Worker .n(n)
1465*4bdc9457SAndroid Build Coastguard Worker .k(k)
1466*4bdc9457SAndroid Build Coastguard Worker .cn_stride(5)
1467*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1468*4bdc9457SAndroid Build Coastguard Worker }
1469*4bdc9457SAndroid Build Coastguard Worker }
1470*4bdc9457SAndroid Build Coastguard Worker }
1471*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,n_div_2_strided_a)1472*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, n_div_2_strided_a) {
1473*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 4; n <= 6; n += 2) {
1474*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
1475*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1476*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1477*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1478*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1479*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1480*4bdc9457SAndroid Build Coastguard Worker .m(4)
1481*4bdc9457SAndroid Build Coastguard Worker .n(n)
1482*4bdc9457SAndroid Build Coastguard Worker .k(k)
1483*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
1484*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1485*4bdc9457SAndroid Build Coastguard Worker }
1486*4bdc9457SAndroid Build Coastguard Worker }
1487*4bdc9457SAndroid Build Coastguard Worker }
1488*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,n_div_2_subtile)1489*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, n_div_2_subtile) {
1490*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 4; n <= 6; n += 2) {
1491*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
1492*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1493*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1494*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1495*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1496*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1497*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1498*4bdc9457SAndroid Build Coastguard Worker .m(m)
1499*4bdc9457SAndroid Build Coastguard Worker .n(n)
1500*4bdc9457SAndroid Build Coastguard Worker .k(k)
1501*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1502*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1503*4bdc9457SAndroid Build Coastguard Worker }
1504*4bdc9457SAndroid Build Coastguard Worker }
1505*4bdc9457SAndroid Build Coastguard Worker }
1506*4bdc9457SAndroid Build Coastguard Worker }
1507*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,strided_cm_subtile)1508*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, strided_cm_subtile) {
1509*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
1510*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 2; n++) {
1511*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1512*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1513*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1514*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1515*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1516*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1517*4bdc9457SAndroid Build Coastguard Worker .m(m)
1518*4bdc9457SAndroid Build Coastguard Worker .n(n)
1519*4bdc9457SAndroid Build Coastguard Worker .k(k)
1520*4bdc9457SAndroid Build Coastguard Worker .cm_stride(5)
1521*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1522*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1523*4bdc9457SAndroid Build Coastguard Worker }
1524*4bdc9457SAndroid Build Coastguard Worker }
1525*4bdc9457SAndroid Build Coastguard Worker }
1526*4bdc9457SAndroid Build Coastguard Worker }
1527*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMSIMD,strided_cm)1528*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMSIMD, strided_cm) {
1529*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1530*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1531*4bdc9457SAndroid Build Coastguard Worker .nr(2)
1532*4bdc9457SAndroid Build Coastguard Worker .kr(4)
1533*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1534*4bdc9457SAndroid Build Coastguard Worker .m(4)
1535*4bdc9457SAndroid Build Coastguard Worker .n(2)
1536*4bdc9457SAndroid Build Coastguard Worker .k(4)
1537*4bdc9457SAndroid Build Coastguard Worker .cm_stride(5)
1538*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmsimd);
1539*4bdc9457SAndroid Build Coastguard Worker }
1540*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
1541*4bdc9457SAndroid Build Coastguard Worker
1542*4bdc9457SAndroid Build Coastguard Worker
1543*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,k_eq_1)1544*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, k_eq_1) {
1545*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1546*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1547*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1548*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1549*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1550*4bdc9457SAndroid Build Coastguard Worker .m(4)
1551*4bdc9457SAndroid Build Coastguard Worker .n(8)
1552*4bdc9457SAndroid Build Coastguard Worker .k(1)
1553*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1554*4bdc9457SAndroid Build Coastguard Worker }
1555*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,strided_cn)1556*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, strided_cn) {
1557*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1558*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1559*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1560*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1561*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1562*4bdc9457SAndroid Build Coastguard Worker .m(4)
1563*4bdc9457SAndroid Build Coastguard Worker .n(8)
1564*4bdc9457SAndroid Build Coastguard Worker .k(1)
1565*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
1566*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1567*4bdc9457SAndroid Build Coastguard Worker }
1568*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,k_eq_1_strided_a)1569*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, k_eq_1_strided_a) {
1570*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1571*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1572*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1573*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1574*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1575*4bdc9457SAndroid Build Coastguard Worker .m(4)
1576*4bdc9457SAndroid Build Coastguard Worker .n(8)
1577*4bdc9457SAndroid Build Coastguard Worker .k(1)
1578*4bdc9457SAndroid Build Coastguard Worker .a_stride(3)
1579*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1580*4bdc9457SAndroid Build Coastguard Worker }
1581*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile)1582*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile) {
1583*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
1584*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1585*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1586*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1587*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1588*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1589*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1590*4bdc9457SAndroid Build Coastguard Worker .m(m)
1591*4bdc9457SAndroid Build Coastguard Worker .n(n)
1592*4bdc9457SAndroid Build Coastguard Worker .k(1)
1593*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1594*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1595*4bdc9457SAndroid Build Coastguard Worker }
1596*4bdc9457SAndroid Build Coastguard Worker }
1597*4bdc9457SAndroid Build Coastguard Worker }
1598*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile_m)1599*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_m) {
1600*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1601*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1602*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1603*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1604*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1605*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1606*4bdc9457SAndroid Build Coastguard Worker .m(m)
1607*4bdc9457SAndroid Build Coastguard Worker .n(8)
1608*4bdc9457SAndroid Build Coastguard Worker .k(1)
1609*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1610*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1611*4bdc9457SAndroid Build Coastguard Worker }
1612*4bdc9457SAndroid Build Coastguard Worker }
1613*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile_n)1614*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_n) {
1615*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
1616*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1617*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1618*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1619*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1620*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1621*4bdc9457SAndroid Build Coastguard Worker .m(4)
1622*4bdc9457SAndroid Build Coastguard Worker .n(n)
1623*4bdc9457SAndroid Build Coastguard Worker .k(1)
1624*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1625*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1626*4bdc9457SAndroid Build Coastguard Worker }
1627*4bdc9457SAndroid Build Coastguard Worker }
1628*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,k_gt_1)1629*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, k_gt_1) {
1630*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
1631*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1632*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1633*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1634*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1635*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1636*4bdc9457SAndroid Build Coastguard Worker .m(4)
1637*4bdc9457SAndroid Build Coastguard Worker .n(8)
1638*4bdc9457SAndroid Build Coastguard Worker .k(k)
1639*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1640*4bdc9457SAndroid Build Coastguard Worker }
1641*4bdc9457SAndroid Build Coastguard Worker }
1642*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,k_gt_1_strided_a)1643*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, k_gt_1_strided_a) {
1644*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
1645*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1646*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1647*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1648*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1649*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1650*4bdc9457SAndroid Build Coastguard Worker .m(4)
1651*4bdc9457SAndroid Build Coastguard Worker .n(8)
1652*4bdc9457SAndroid Build Coastguard Worker .k(k)
1653*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
1654*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1655*4bdc9457SAndroid Build Coastguard Worker }
1656*4bdc9457SAndroid Build Coastguard Worker }
1657*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,k_gt_1_subtile)1658*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, k_gt_1_subtile) {
1659*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
1660*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
1661*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1662*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1663*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1664*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1665*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1666*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1667*4bdc9457SAndroid Build Coastguard Worker .m(m)
1668*4bdc9457SAndroid Build Coastguard Worker .n(n)
1669*4bdc9457SAndroid Build Coastguard Worker .k(k)
1670*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1671*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1672*4bdc9457SAndroid Build Coastguard Worker }
1673*4bdc9457SAndroid Build Coastguard Worker }
1674*4bdc9457SAndroid Build Coastguard Worker }
1675*4bdc9457SAndroid Build Coastguard Worker }
1676*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,n_gt_8)1677*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, n_gt_8) {
1678*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
1679*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
1680*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1681*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1682*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1683*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1684*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1685*4bdc9457SAndroid Build Coastguard Worker .m(4)
1686*4bdc9457SAndroid Build Coastguard Worker .n(n)
1687*4bdc9457SAndroid Build Coastguard Worker .k(k)
1688*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1689*4bdc9457SAndroid Build Coastguard Worker }
1690*4bdc9457SAndroid Build Coastguard Worker }
1691*4bdc9457SAndroid Build Coastguard Worker }
1692*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,n_gt_8_strided_cn)1693*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_cn) {
1694*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
1695*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
1696*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1697*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1698*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1699*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1700*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1701*4bdc9457SAndroid Build Coastguard Worker .m(4)
1702*4bdc9457SAndroid Build Coastguard Worker .n(n)
1703*4bdc9457SAndroid Build Coastguard Worker .k(k)
1704*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
1705*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1706*4bdc9457SAndroid Build Coastguard Worker }
1707*4bdc9457SAndroid Build Coastguard Worker }
1708*4bdc9457SAndroid Build Coastguard Worker }
1709*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,n_gt_8_strided_a)1710*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_a) {
1711*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
1712*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
1713*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1714*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1715*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1716*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1717*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1718*4bdc9457SAndroid Build Coastguard Worker .m(4)
1719*4bdc9457SAndroid Build Coastguard Worker .n(n)
1720*4bdc9457SAndroid Build Coastguard Worker .k(k)
1721*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
1722*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1723*4bdc9457SAndroid Build Coastguard Worker }
1724*4bdc9457SAndroid Build Coastguard Worker }
1725*4bdc9457SAndroid Build Coastguard Worker }
1726*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,n_gt_8_subtile)1727*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, n_gt_8_subtile) {
1728*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
1729*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
1730*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1731*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1732*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1733*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1734*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1735*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1736*4bdc9457SAndroid Build Coastguard Worker .m(m)
1737*4bdc9457SAndroid Build Coastguard Worker .n(n)
1738*4bdc9457SAndroid Build Coastguard Worker .k(k)
1739*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1740*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1741*4bdc9457SAndroid Build Coastguard Worker }
1742*4bdc9457SAndroid Build Coastguard Worker }
1743*4bdc9457SAndroid Build Coastguard Worker }
1744*4bdc9457SAndroid Build Coastguard Worker }
1745*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,n_div_8)1746*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, n_div_8) {
1747*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
1748*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
1749*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1750*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1751*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1752*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1753*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1754*4bdc9457SAndroid Build Coastguard Worker .m(4)
1755*4bdc9457SAndroid Build Coastguard Worker .n(n)
1756*4bdc9457SAndroid Build Coastguard Worker .k(k)
1757*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1758*4bdc9457SAndroid Build Coastguard Worker }
1759*4bdc9457SAndroid Build Coastguard Worker }
1760*4bdc9457SAndroid Build Coastguard Worker }
1761*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,n_div_8_strided_cn)1762*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, n_div_8_strided_cn) {
1763*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
1764*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
1765*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1766*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1767*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1768*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1769*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1770*4bdc9457SAndroid Build Coastguard Worker .m(4)
1771*4bdc9457SAndroid Build Coastguard Worker .n(n)
1772*4bdc9457SAndroid Build Coastguard Worker .k(k)
1773*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
1774*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1775*4bdc9457SAndroid Build Coastguard Worker }
1776*4bdc9457SAndroid Build Coastguard Worker }
1777*4bdc9457SAndroid Build Coastguard Worker }
1778*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,n_div_8_strided_a)1779*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, n_div_8_strided_a) {
1780*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
1781*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
1782*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1783*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1784*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1785*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1786*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1787*4bdc9457SAndroid Build Coastguard Worker .m(4)
1788*4bdc9457SAndroid Build Coastguard Worker .n(n)
1789*4bdc9457SAndroid Build Coastguard Worker .k(k)
1790*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
1791*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1792*4bdc9457SAndroid Build Coastguard Worker }
1793*4bdc9457SAndroid Build Coastguard Worker }
1794*4bdc9457SAndroid Build Coastguard Worker }
1795*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,n_div_8_subtile)1796*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, n_div_8_subtile) {
1797*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
1798*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
1799*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1800*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1801*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1802*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1803*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1804*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1805*4bdc9457SAndroid Build Coastguard Worker .m(m)
1806*4bdc9457SAndroid Build Coastguard Worker .n(n)
1807*4bdc9457SAndroid Build Coastguard Worker .k(k)
1808*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1809*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1810*4bdc9457SAndroid Build Coastguard Worker }
1811*4bdc9457SAndroid Build Coastguard Worker }
1812*4bdc9457SAndroid Build Coastguard Worker }
1813*4bdc9457SAndroid Build Coastguard Worker }
1814*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,strided_cm_subtile)1815*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, strided_cm_subtile) {
1816*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
1817*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
1818*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1819*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1820*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1821*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1822*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1823*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1824*4bdc9457SAndroid Build Coastguard Worker .m(m)
1825*4bdc9457SAndroid Build Coastguard Worker .n(n)
1826*4bdc9457SAndroid Build Coastguard Worker .k(k)
1827*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
1828*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1829*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1830*4bdc9457SAndroid Build Coastguard Worker }
1831*4bdc9457SAndroid Build Coastguard Worker }
1832*4bdc9457SAndroid Build Coastguard Worker }
1833*4bdc9457SAndroid Build Coastguard Worker }
1834*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT,strided_cm)1835*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMSIMD_LOADSPLAT, strided_cm) {
1836*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1837*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1838*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1839*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1840*4bdc9457SAndroid Build Coastguard Worker .sr(1)
1841*4bdc9457SAndroid Build Coastguard Worker .m(4)
1842*4bdc9457SAndroid Build Coastguard Worker .n(8)
1843*4bdc9457SAndroid Build Coastguard Worker .k(1)
1844*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
1845*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_loadsplat);
1846*4bdc9457SAndroid Build Coastguard Worker }
1847*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
1848*4bdc9457SAndroid Build Coastguard Worker
1849*4bdc9457SAndroid Build Coastguard Worker
1850*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,k_eq_4)1851*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, k_eq_4) {
1852*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1853*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1854*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1855*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1856*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1857*4bdc9457SAndroid Build Coastguard Worker .m(4)
1858*4bdc9457SAndroid Build Coastguard Worker .n(8)
1859*4bdc9457SAndroid Build Coastguard Worker .k(4)
1860*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
1861*4bdc9457SAndroid Build Coastguard Worker }
1862*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,strided_cn)1863*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, strided_cn) {
1864*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1865*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1866*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1867*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1868*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1869*4bdc9457SAndroid Build Coastguard Worker .m(4)
1870*4bdc9457SAndroid Build Coastguard Worker .n(8)
1871*4bdc9457SAndroid Build Coastguard Worker .k(4)
1872*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
1873*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
1874*4bdc9457SAndroid Build Coastguard Worker }
1875*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,k_eq_4_strided_a)1876*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, k_eq_4_strided_a) {
1877*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1878*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1879*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1880*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1881*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1882*4bdc9457SAndroid Build Coastguard Worker .m(4)
1883*4bdc9457SAndroid Build Coastguard Worker .n(8)
1884*4bdc9457SAndroid Build Coastguard Worker .k(4)
1885*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
1886*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
1887*4bdc9457SAndroid Build Coastguard Worker }
1888*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,k_eq_4_subtile)1889*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, k_eq_4_subtile) {
1890*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
1891*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1892*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1893*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1894*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1895*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1896*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1897*4bdc9457SAndroid Build Coastguard Worker .m(m)
1898*4bdc9457SAndroid Build Coastguard Worker .n(n)
1899*4bdc9457SAndroid Build Coastguard Worker .k(4)
1900*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1901*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
1902*4bdc9457SAndroid Build Coastguard Worker }
1903*4bdc9457SAndroid Build Coastguard Worker }
1904*4bdc9457SAndroid Build Coastguard Worker }
1905*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,k_eq_4_subtile_m)1906*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, k_eq_4_subtile_m) {
1907*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1908*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1909*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1910*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1911*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1912*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1913*4bdc9457SAndroid Build Coastguard Worker .m(m)
1914*4bdc9457SAndroid Build Coastguard Worker .n(8)
1915*4bdc9457SAndroid Build Coastguard Worker .k(4)
1916*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1917*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
1918*4bdc9457SAndroid Build Coastguard Worker }
1919*4bdc9457SAndroid Build Coastguard Worker }
1920*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,k_eq_4_subtile_n)1921*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, k_eq_4_subtile_n) {
1922*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
1923*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1924*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1925*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1926*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1927*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1928*4bdc9457SAndroid Build Coastguard Worker .m(4)
1929*4bdc9457SAndroid Build Coastguard Worker .n(n)
1930*4bdc9457SAndroid Build Coastguard Worker .k(4)
1931*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1932*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
1933*4bdc9457SAndroid Build Coastguard Worker }
1934*4bdc9457SAndroid Build Coastguard Worker }
1935*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,k_lt_4)1936*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, k_lt_4) {
1937*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
1938*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1939*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1940*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1941*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1942*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1943*4bdc9457SAndroid Build Coastguard Worker .m(4)
1944*4bdc9457SAndroid Build Coastguard Worker .n(8)
1945*4bdc9457SAndroid Build Coastguard Worker .k(k)
1946*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
1947*4bdc9457SAndroid Build Coastguard Worker }
1948*4bdc9457SAndroid Build Coastguard Worker }
1949*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,k_lt_4_strided_a)1950*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, k_lt_4_strided_a) {
1951*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
1952*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1953*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1954*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1955*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1956*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1957*4bdc9457SAndroid Build Coastguard Worker .m(4)
1958*4bdc9457SAndroid Build Coastguard Worker .n(8)
1959*4bdc9457SAndroid Build Coastguard Worker .k(k)
1960*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
1961*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
1962*4bdc9457SAndroid Build Coastguard Worker }
1963*4bdc9457SAndroid Build Coastguard Worker }
1964*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,k_lt_4_subtile)1965*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, k_lt_4_subtile) {
1966*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
1967*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
1968*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
1969*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1970*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1971*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1972*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1973*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1974*4bdc9457SAndroid Build Coastguard Worker .m(m)
1975*4bdc9457SAndroid Build Coastguard Worker .n(n)
1976*4bdc9457SAndroid Build Coastguard Worker .k(k)
1977*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
1978*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
1979*4bdc9457SAndroid Build Coastguard Worker }
1980*4bdc9457SAndroid Build Coastguard Worker }
1981*4bdc9457SAndroid Build Coastguard Worker }
1982*4bdc9457SAndroid Build Coastguard Worker }
1983*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,k_gt_4)1984*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, k_gt_4) {
1985*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
1986*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
1987*4bdc9457SAndroid Build Coastguard Worker .mr(4)
1988*4bdc9457SAndroid Build Coastguard Worker .nr(8)
1989*4bdc9457SAndroid Build Coastguard Worker .kr(1)
1990*4bdc9457SAndroid Build Coastguard Worker .sr(4)
1991*4bdc9457SAndroid Build Coastguard Worker .m(4)
1992*4bdc9457SAndroid Build Coastguard Worker .n(8)
1993*4bdc9457SAndroid Build Coastguard Worker .k(k)
1994*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
1995*4bdc9457SAndroid Build Coastguard Worker }
1996*4bdc9457SAndroid Build Coastguard Worker }
1997*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,k_gt_4_strided_a)1998*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, k_gt_4_strided_a) {
1999*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
2000*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2001*4bdc9457SAndroid Build Coastguard Worker .mr(4)
2002*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2003*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2004*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2005*4bdc9457SAndroid Build Coastguard Worker .m(4)
2006*4bdc9457SAndroid Build Coastguard Worker .n(8)
2007*4bdc9457SAndroid Build Coastguard Worker .k(k)
2008*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
2009*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
2010*4bdc9457SAndroid Build Coastguard Worker }
2011*4bdc9457SAndroid Build Coastguard Worker }
2012*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,k_gt_4_subtile)2013*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, k_gt_4_subtile) {
2014*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
2015*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
2016*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
2017*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2018*4bdc9457SAndroid Build Coastguard Worker .mr(4)
2019*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2020*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2021*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2022*4bdc9457SAndroid Build Coastguard Worker .m(m)
2023*4bdc9457SAndroid Build Coastguard Worker .n(n)
2024*4bdc9457SAndroid Build Coastguard Worker .k(k)
2025*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2026*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
2027*4bdc9457SAndroid Build Coastguard Worker }
2028*4bdc9457SAndroid Build Coastguard Worker }
2029*4bdc9457SAndroid Build Coastguard Worker }
2030*4bdc9457SAndroid Build Coastguard Worker }
2031*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,k_div_4)2032*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, k_div_4) {
2033*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
2034*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2035*4bdc9457SAndroid Build Coastguard Worker .mr(4)
2036*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2037*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2038*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2039*4bdc9457SAndroid Build Coastguard Worker .m(4)
2040*4bdc9457SAndroid Build Coastguard Worker .n(8)
2041*4bdc9457SAndroid Build Coastguard Worker .k(k)
2042*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
2043*4bdc9457SAndroid Build Coastguard Worker }
2044*4bdc9457SAndroid Build Coastguard Worker }
2045*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,k_div_4_strided_a)2046*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, k_div_4_strided_a) {
2047*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
2048*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2049*4bdc9457SAndroid Build Coastguard Worker .mr(4)
2050*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2051*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2052*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2053*4bdc9457SAndroid Build Coastguard Worker .m(4)
2054*4bdc9457SAndroid Build Coastguard Worker .n(8)
2055*4bdc9457SAndroid Build Coastguard Worker .k(k)
2056*4bdc9457SAndroid Build Coastguard Worker .a_stride(43)
2057*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
2058*4bdc9457SAndroid Build Coastguard Worker }
2059*4bdc9457SAndroid Build Coastguard Worker }
2060*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,k_div_4_subtile)2061*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, k_div_4_subtile) {
2062*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
2063*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
2064*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
2065*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2066*4bdc9457SAndroid Build Coastguard Worker .mr(4)
2067*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2068*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2069*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2070*4bdc9457SAndroid Build Coastguard Worker .m(m)
2071*4bdc9457SAndroid Build Coastguard Worker .n(n)
2072*4bdc9457SAndroid Build Coastguard Worker .k(k)
2073*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2074*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
2075*4bdc9457SAndroid Build Coastguard Worker }
2076*4bdc9457SAndroid Build Coastguard Worker }
2077*4bdc9457SAndroid Build Coastguard Worker }
2078*4bdc9457SAndroid Build Coastguard Worker }
2079*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,n_gt_8)2080*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, n_gt_8) {
2081*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
2082*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2083*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2084*4bdc9457SAndroid Build Coastguard Worker .mr(4)
2085*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2086*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2087*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2088*4bdc9457SAndroid Build Coastguard Worker .m(4)
2089*4bdc9457SAndroid Build Coastguard Worker .n(n)
2090*4bdc9457SAndroid Build Coastguard Worker .k(k)
2091*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
2092*4bdc9457SAndroid Build Coastguard Worker }
2093*4bdc9457SAndroid Build Coastguard Worker }
2094*4bdc9457SAndroid Build Coastguard Worker }
2095*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,n_gt_8_strided_cn)2096*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, n_gt_8_strided_cn) {
2097*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
2098*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2099*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2100*4bdc9457SAndroid Build Coastguard Worker .mr(4)
2101*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2102*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2103*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2104*4bdc9457SAndroid Build Coastguard Worker .m(4)
2105*4bdc9457SAndroid Build Coastguard Worker .n(n)
2106*4bdc9457SAndroid Build Coastguard Worker .k(k)
2107*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
2108*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
2109*4bdc9457SAndroid Build Coastguard Worker }
2110*4bdc9457SAndroid Build Coastguard Worker }
2111*4bdc9457SAndroid Build Coastguard Worker }
2112*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,n_gt_8_strided_a)2113*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, n_gt_8_strided_a) {
2114*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
2115*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2116*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2117*4bdc9457SAndroid Build Coastguard Worker .mr(4)
2118*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2119*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2120*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2121*4bdc9457SAndroid Build Coastguard Worker .m(4)
2122*4bdc9457SAndroid Build Coastguard Worker .n(n)
2123*4bdc9457SAndroid Build Coastguard Worker .k(k)
2124*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
2125*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
2126*4bdc9457SAndroid Build Coastguard Worker }
2127*4bdc9457SAndroid Build Coastguard Worker }
2128*4bdc9457SAndroid Build Coastguard Worker }
2129*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,n_gt_8_subtile)2130*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, n_gt_8_subtile) {
2131*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
2132*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2133*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
2134*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2135*4bdc9457SAndroid Build Coastguard Worker .mr(4)
2136*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2137*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2138*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2139*4bdc9457SAndroid Build Coastguard Worker .m(m)
2140*4bdc9457SAndroid Build Coastguard Worker .n(n)
2141*4bdc9457SAndroid Build Coastguard Worker .k(k)
2142*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2143*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
2144*4bdc9457SAndroid Build Coastguard Worker }
2145*4bdc9457SAndroid Build Coastguard Worker }
2146*4bdc9457SAndroid Build Coastguard Worker }
2147*4bdc9457SAndroid Build Coastguard Worker }
2148*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,n_div_8)2149*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, n_div_8) {
2150*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
2151*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2152*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2153*4bdc9457SAndroid Build Coastguard Worker .mr(4)
2154*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2155*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2156*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2157*4bdc9457SAndroid Build Coastguard Worker .m(4)
2158*4bdc9457SAndroid Build Coastguard Worker .n(n)
2159*4bdc9457SAndroid Build Coastguard Worker .k(k)
2160*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
2161*4bdc9457SAndroid Build Coastguard Worker }
2162*4bdc9457SAndroid Build Coastguard Worker }
2163*4bdc9457SAndroid Build Coastguard Worker }
2164*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,n_div_8_strided_cn)2165*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, n_div_8_strided_cn) {
2166*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
2167*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2168*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2169*4bdc9457SAndroid Build Coastguard Worker .mr(4)
2170*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2171*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2172*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2173*4bdc9457SAndroid Build Coastguard Worker .m(4)
2174*4bdc9457SAndroid Build Coastguard Worker .n(n)
2175*4bdc9457SAndroid Build Coastguard Worker .k(k)
2176*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
2177*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
2178*4bdc9457SAndroid Build Coastguard Worker }
2179*4bdc9457SAndroid Build Coastguard Worker }
2180*4bdc9457SAndroid Build Coastguard Worker }
2181*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,n_div_8_strided_a)2182*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, n_div_8_strided_a) {
2183*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
2184*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2185*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2186*4bdc9457SAndroid Build Coastguard Worker .mr(4)
2187*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2188*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2189*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2190*4bdc9457SAndroid Build Coastguard Worker .m(4)
2191*4bdc9457SAndroid Build Coastguard Worker .n(n)
2192*4bdc9457SAndroid Build Coastguard Worker .k(k)
2193*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
2194*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
2195*4bdc9457SAndroid Build Coastguard Worker }
2196*4bdc9457SAndroid Build Coastguard Worker }
2197*4bdc9457SAndroid Build Coastguard Worker }
2198*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,n_div_8_subtile)2199*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, n_div_8_subtile) {
2200*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
2201*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2202*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
2203*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2204*4bdc9457SAndroid Build Coastguard Worker .mr(4)
2205*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2206*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2207*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2208*4bdc9457SAndroid Build Coastguard Worker .m(m)
2209*4bdc9457SAndroid Build Coastguard Worker .n(n)
2210*4bdc9457SAndroid Build Coastguard Worker .k(k)
2211*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2212*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
2213*4bdc9457SAndroid Build Coastguard Worker }
2214*4bdc9457SAndroid Build Coastguard Worker }
2215*4bdc9457SAndroid Build Coastguard Worker }
2216*4bdc9457SAndroid Build Coastguard Worker }
2217*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,strided_cm_subtile)2218*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, strided_cm_subtile) {
2219*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2220*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
2221*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
2222*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2223*4bdc9457SAndroid Build Coastguard Worker .mr(4)
2224*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2225*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2226*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2227*4bdc9457SAndroid Build Coastguard Worker .m(m)
2228*4bdc9457SAndroid Build Coastguard Worker .n(n)
2229*4bdc9457SAndroid Build Coastguard Worker .k(k)
2230*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
2231*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2232*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
2233*4bdc9457SAndroid Build Coastguard Worker }
2234*4bdc9457SAndroid Build Coastguard Worker }
2235*4bdc9457SAndroid Build Coastguard Worker }
2236*4bdc9457SAndroid Build Coastguard Worker }
2237*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8S4__WASMSIMD,strided_cm)2238*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8S4__WASMSIMD, strided_cm) {
2239*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2240*4bdc9457SAndroid Build Coastguard Worker .mr(4)
2241*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2242*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2243*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2244*4bdc9457SAndroid Build Coastguard Worker .m(4)
2245*4bdc9457SAndroid Build Coastguard Worker .n(8)
2246*4bdc9457SAndroid Build Coastguard Worker .k(4)
2247*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
2248*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmsimd);
2249*4bdc9457SAndroid Build Coastguard Worker }
2250*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
2251*4bdc9457SAndroid Build Coastguard Worker
2252*4bdc9457SAndroid Build Coastguard Worker
2253*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,k_eq_1)2254*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, k_eq_1) {
2255*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2256*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2257*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2258*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2259*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2260*4bdc9457SAndroid Build Coastguard Worker .m(5)
2261*4bdc9457SAndroid Build Coastguard Worker .n(8)
2262*4bdc9457SAndroid Build Coastguard Worker .k(1)
2263*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2264*4bdc9457SAndroid Build Coastguard Worker }
2265*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,strided_cn)2266*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, strided_cn) {
2267*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2268*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2269*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2270*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2271*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2272*4bdc9457SAndroid Build Coastguard Worker .m(5)
2273*4bdc9457SAndroid Build Coastguard Worker .n(8)
2274*4bdc9457SAndroid Build Coastguard Worker .k(1)
2275*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
2276*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2277*4bdc9457SAndroid Build Coastguard Worker }
2278*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,k_eq_1_strided_a)2279*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, k_eq_1_strided_a) {
2280*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2281*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2282*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2283*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2284*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2285*4bdc9457SAndroid Build Coastguard Worker .m(5)
2286*4bdc9457SAndroid Build Coastguard Worker .n(8)
2287*4bdc9457SAndroid Build Coastguard Worker .k(1)
2288*4bdc9457SAndroid Build Coastguard Worker .a_stride(3)
2289*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2290*4bdc9457SAndroid Build Coastguard Worker }
2291*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile)2292*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile) {
2293*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
2294*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
2295*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2296*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2297*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2298*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2299*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2300*4bdc9457SAndroid Build Coastguard Worker .m(m)
2301*4bdc9457SAndroid Build Coastguard Worker .n(n)
2302*4bdc9457SAndroid Build Coastguard Worker .k(1)
2303*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2304*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2305*4bdc9457SAndroid Build Coastguard Worker }
2306*4bdc9457SAndroid Build Coastguard Worker }
2307*4bdc9457SAndroid Build Coastguard Worker }
2308*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile_m)2309*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_m) {
2310*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
2311*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2312*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2313*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2314*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2315*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2316*4bdc9457SAndroid Build Coastguard Worker .m(m)
2317*4bdc9457SAndroid Build Coastguard Worker .n(8)
2318*4bdc9457SAndroid Build Coastguard Worker .k(1)
2319*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2320*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2321*4bdc9457SAndroid Build Coastguard Worker }
2322*4bdc9457SAndroid Build Coastguard Worker }
2323*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,k_eq_1_subtile_n)2324*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_n) {
2325*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
2326*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2327*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2328*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2329*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2330*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2331*4bdc9457SAndroid Build Coastguard Worker .m(5)
2332*4bdc9457SAndroid Build Coastguard Worker .n(n)
2333*4bdc9457SAndroid Build Coastguard Worker .k(1)
2334*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2335*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2336*4bdc9457SAndroid Build Coastguard Worker }
2337*4bdc9457SAndroid Build Coastguard Worker }
2338*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,k_gt_1)2339*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, k_gt_1) {
2340*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
2341*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2342*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2343*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2344*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2345*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2346*4bdc9457SAndroid Build Coastguard Worker .m(5)
2347*4bdc9457SAndroid Build Coastguard Worker .n(8)
2348*4bdc9457SAndroid Build Coastguard Worker .k(k)
2349*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2350*4bdc9457SAndroid Build Coastguard Worker }
2351*4bdc9457SAndroid Build Coastguard Worker }
2352*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,k_gt_1_strided_a)2353*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, k_gt_1_strided_a) {
2354*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
2355*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2356*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2357*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2358*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2359*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2360*4bdc9457SAndroid Build Coastguard Worker .m(5)
2361*4bdc9457SAndroid Build Coastguard Worker .n(8)
2362*4bdc9457SAndroid Build Coastguard Worker .k(k)
2363*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
2364*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2365*4bdc9457SAndroid Build Coastguard Worker }
2366*4bdc9457SAndroid Build Coastguard Worker }
2367*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,k_gt_1_subtile)2368*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, k_gt_1_subtile) {
2369*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
2370*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
2371*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
2372*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2373*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2374*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2375*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2376*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2377*4bdc9457SAndroid Build Coastguard Worker .m(m)
2378*4bdc9457SAndroid Build Coastguard Worker .n(n)
2379*4bdc9457SAndroid Build Coastguard Worker .k(k)
2380*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2381*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2382*4bdc9457SAndroid Build Coastguard Worker }
2383*4bdc9457SAndroid Build Coastguard Worker }
2384*4bdc9457SAndroid Build Coastguard Worker }
2385*4bdc9457SAndroid Build Coastguard Worker }
2386*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,n_gt_8)2387*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, n_gt_8) {
2388*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
2389*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
2390*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2391*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2392*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2393*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2394*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2395*4bdc9457SAndroid Build Coastguard Worker .m(5)
2396*4bdc9457SAndroid Build Coastguard Worker .n(n)
2397*4bdc9457SAndroid Build Coastguard Worker .k(k)
2398*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2399*4bdc9457SAndroid Build Coastguard Worker }
2400*4bdc9457SAndroid Build Coastguard Worker }
2401*4bdc9457SAndroid Build Coastguard Worker }
2402*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,n_gt_8_strided_cn)2403*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_cn) {
2404*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
2405*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
2406*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2407*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2408*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2409*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2410*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2411*4bdc9457SAndroid Build Coastguard Worker .m(5)
2412*4bdc9457SAndroid Build Coastguard Worker .n(n)
2413*4bdc9457SAndroid Build Coastguard Worker .k(k)
2414*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
2415*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2416*4bdc9457SAndroid Build Coastguard Worker }
2417*4bdc9457SAndroid Build Coastguard Worker }
2418*4bdc9457SAndroid Build Coastguard Worker }
2419*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,n_gt_8_strided_a)2420*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_a) {
2421*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
2422*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
2423*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2424*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2425*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2426*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2427*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2428*4bdc9457SAndroid Build Coastguard Worker .m(5)
2429*4bdc9457SAndroid Build Coastguard Worker .n(n)
2430*4bdc9457SAndroid Build Coastguard Worker .k(k)
2431*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
2432*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2433*4bdc9457SAndroid Build Coastguard Worker }
2434*4bdc9457SAndroid Build Coastguard Worker }
2435*4bdc9457SAndroid Build Coastguard Worker }
2436*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,n_gt_8_subtile)2437*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, n_gt_8_subtile) {
2438*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
2439*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
2440*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
2441*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2442*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2443*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2444*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2445*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2446*4bdc9457SAndroid Build Coastguard Worker .m(m)
2447*4bdc9457SAndroid Build Coastguard Worker .n(n)
2448*4bdc9457SAndroid Build Coastguard Worker .k(k)
2449*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2450*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2451*4bdc9457SAndroid Build Coastguard Worker }
2452*4bdc9457SAndroid Build Coastguard Worker }
2453*4bdc9457SAndroid Build Coastguard Worker }
2454*4bdc9457SAndroid Build Coastguard Worker }
2455*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,n_div_8)2456*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, n_div_8) {
2457*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
2458*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
2459*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2460*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2461*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2462*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2463*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2464*4bdc9457SAndroid Build Coastguard Worker .m(5)
2465*4bdc9457SAndroid Build Coastguard Worker .n(n)
2466*4bdc9457SAndroid Build Coastguard Worker .k(k)
2467*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2468*4bdc9457SAndroid Build Coastguard Worker }
2469*4bdc9457SAndroid Build Coastguard Worker }
2470*4bdc9457SAndroid Build Coastguard Worker }
2471*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,n_div_8_strided_cn)2472*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, n_div_8_strided_cn) {
2473*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
2474*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
2475*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2476*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2477*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2478*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2479*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2480*4bdc9457SAndroid Build Coastguard Worker .m(5)
2481*4bdc9457SAndroid Build Coastguard Worker .n(n)
2482*4bdc9457SAndroid Build Coastguard Worker .k(k)
2483*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
2484*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2485*4bdc9457SAndroid Build Coastguard Worker }
2486*4bdc9457SAndroid Build Coastguard Worker }
2487*4bdc9457SAndroid Build Coastguard Worker }
2488*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,n_div_8_strided_a)2489*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, n_div_8_strided_a) {
2490*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
2491*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
2492*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2493*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2494*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2495*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2496*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2497*4bdc9457SAndroid Build Coastguard Worker .m(5)
2498*4bdc9457SAndroid Build Coastguard Worker .n(n)
2499*4bdc9457SAndroid Build Coastguard Worker .k(k)
2500*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
2501*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2502*4bdc9457SAndroid Build Coastguard Worker }
2503*4bdc9457SAndroid Build Coastguard Worker }
2504*4bdc9457SAndroid Build Coastguard Worker }
2505*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,n_div_8_subtile)2506*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, n_div_8_subtile) {
2507*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
2508*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
2509*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
2510*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2511*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2512*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2513*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2514*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2515*4bdc9457SAndroid Build Coastguard Worker .m(m)
2516*4bdc9457SAndroid Build Coastguard Worker .n(n)
2517*4bdc9457SAndroid Build Coastguard Worker .k(k)
2518*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2519*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2520*4bdc9457SAndroid Build Coastguard Worker }
2521*4bdc9457SAndroid Build Coastguard Worker }
2522*4bdc9457SAndroid Build Coastguard Worker }
2523*4bdc9457SAndroid Build Coastguard Worker }
2524*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,strided_cm_subtile)2525*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, strided_cm_subtile) {
2526*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
2527*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
2528*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
2529*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2530*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2531*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2532*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2533*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2534*4bdc9457SAndroid Build Coastguard Worker .m(m)
2535*4bdc9457SAndroid Build Coastguard Worker .n(n)
2536*4bdc9457SAndroid Build Coastguard Worker .k(k)
2537*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
2538*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2539*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2540*4bdc9457SAndroid Build Coastguard Worker }
2541*4bdc9457SAndroid Build Coastguard Worker }
2542*4bdc9457SAndroid Build Coastguard Worker }
2543*4bdc9457SAndroid Build Coastguard Worker }
2544*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT,strided_cm)2545*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMSIMD_LOADSPLAT, strided_cm) {
2546*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2547*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2548*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2549*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2550*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2551*4bdc9457SAndroid Build Coastguard Worker .m(5)
2552*4bdc9457SAndroid Build Coastguard Worker .n(8)
2553*4bdc9457SAndroid Build Coastguard Worker .k(1)
2554*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
2555*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_loadsplat);
2556*4bdc9457SAndroid Build Coastguard Worker }
2557*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
2558*4bdc9457SAndroid Build Coastguard Worker
2559*4bdc9457SAndroid Build Coastguard Worker
2560*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,k_eq_4)2561*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, k_eq_4) {
2562*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2563*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2564*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2565*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2566*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2567*4bdc9457SAndroid Build Coastguard Worker .m(5)
2568*4bdc9457SAndroid Build Coastguard Worker .n(8)
2569*4bdc9457SAndroid Build Coastguard Worker .k(4)
2570*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2571*4bdc9457SAndroid Build Coastguard Worker }
2572*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,strided_cn)2573*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, strided_cn) {
2574*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2575*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2576*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2577*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2578*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2579*4bdc9457SAndroid Build Coastguard Worker .m(5)
2580*4bdc9457SAndroid Build Coastguard Worker .n(8)
2581*4bdc9457SAndroid Build Coastguard Worker .k(4)
2582*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
2583*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2584*4bdc9457SAndroid Build Coastguard Worker }
2585*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,k_eq_4_strided_a)2586*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, k_eq_4_strided_a) {
2587*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2588*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2589*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2590*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2591*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2592*4bdc9457SAndroid Build Coastguard Worker .m(5)
2593*4bdc9457SAndroid Build Coastguard Worker .n(8)
2594*4bdc9457SAndroid Build Coastguard Worker .k(4)
2595*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
2596*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2597*4bdc9457SAndroid Build Coastguard Worker }
2598*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,k_eq_4_subtile)2599*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, k_eq_4_subtile) {
2600*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
2601*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
2602*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2603*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2604*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2605*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2606*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2607*4bdc9457SAndroid Build Coastguard Worker .m(m)
2608*4bdc9457SAndroid Build Coastguard Worker .n(n)
2609*4bdc9457SAndroid Build Coastguard Worker .k(4)
2610*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2611*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2612*4bdc9457SAndroid Build Coastguard Worker }
2613*4bdc9457SAndroid Build Coastguard Worker }
2614*4bdc9457SAndroid Build Coastguard Worker }
2615*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,k_eq_4_subtile_m)2616*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, k_eq_4_subtile_m) {
2617*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
2618*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2619*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2620*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2621*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2622*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2623*4bdc9457SAndroid Build Coastguard Worker .m(m)
2624*4bdc9457SAndroid Build Coastguard Worker .n(8)
2625*4bdc9457SAndroid Build Coastguard Worker .k(4)
2626*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2627*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2628*4bdc9457SAndroid Build Coastguard Worker }
2629*4bdc9457SAndroid Build Coastguard Worker }
2630*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,k_eq_4_subtile_n)2631*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, k_eq_4_subtile_n) {
2632*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
2633*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2634*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2635*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2636*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2637*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2638*4bdc9457SAndroid Build Coastguard Worker .m(5)
2639*4bdc9457SAndroid Build Coastguard Worker .n(n)
2640*4bdc9457SAndroid Build Coastguard Worker .k(4)
2641*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2642*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2643*4bdc9457SAndroid Build Coastguard Worker }
2644*4bdc9457SAndroid Build Coastguard Worker }
2645*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,k_lt_4)2646*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, k_lt_4) {
2647*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
2648*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2649*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2650*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2651*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2652*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2653*4bdc9457SAndroid Build Coastguard Worker .m(5)
2654*4bdc9457SAndroid Build Coastguard Worker .n(8)
2655*4bdc9457SAndroid Build Coastguard Worker .k(k)
2656*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2657*4bdc9457SAndroid Build Coastguard Worker }
2658*4bdc9457SAndroid Build Coastguard Worker }
2659*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,k_lt_4_strided_a)2660*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, k_lt_4_strided_a) {
2661*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
2662*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2663*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2664*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2665*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2666*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2667*4bdc9457SAndroid Build Coastguard Worker .m(5)
2668*4bdc9457SAndroid Build Coastguard Worker .n(8)
2669*4bdc9457SAndroid Build Coastguard Worker .k(k)
2670*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
2671*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2672*4bdc9457SAndroid Build Coastguard Worker }
2673*4bdc9457SAndroid Build Coastguard Worker }
2674*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,k_lt_4_subtile)2675*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, k_lt_4_subtile) {
2676*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
2677*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
2678*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
2679*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2680*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2681*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2682*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2683*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2684*4bdc9457SAndroid Build Coastguard Worker .m(m)
2685*4bdc9457SAndroid Build Coastguard Worker .n(n)
2686*4bdc9457SAndroid Build Coastguard Worker .k(k)
2687*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2688*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2689*4bdc9457SAndroid Build Coastguard Worker }
2690*4bdc9457SAndroid Build Coastguard Worker }
2691*4bdc9457SAndroid Build Coastguard Worker }
2692*4bdc9457SAndroid Build Coastguard Worker }
2693*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,k_gt_4)2694*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, k_gt_4) {
2695*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
2696*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2697*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2698*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2699*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2700*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2701*4bdc9457SAndroid Build Coastguard Worker .m(5)
2702*4bdc9457SAndroid Build Coastguard Worker .n(8)
2703*4bdc9457SAndroid Build Coastguard Worker .k(k)
2704*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2705*4bdc9457SAndroid Build Coastguard Worker }
2706*4bdc9457SAndroid Build Coastguard Worker }
2707*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,k_gt_4_strided_a)2708*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, k_gt_4_strided_a) {
2709*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
2710*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2711*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2712*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2713*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2714*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2715*4bdc9457SAndroid Build Coastguard Worker .m(5)
2716*4bdc9457SAndroid Build Coastguard Worker .n(8)
2717*4bdc9457SAndroid Build Coastguard Worker .k(k)
2718*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
2719*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2720*4bdc9457SAndroid Build Coastguard Worker }
2721*4bdc9457SAndroid Build Coastguard Worker }
2722*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,k_gt_4_subtile)2723*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, k_gt_4_subtile) {
2724*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
2725*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
2726*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
2727*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2728*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2729*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2730*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2731*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2732*4bdc9457SAndroid Build Coastguard Worker .m(m)
2733*4bdc9457SAndroid Build Coastguard Worker .n(n)
2734*4bdc9457SAndroid Build Coastguard Worker .k(k)
2735*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2736*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2737*4bdc9457SAndroid Build Coastguard Worker }
2738*4bdc9457SAndroid Build Coastguard Worker }
2739*4bdc9457SAndroid Build Coastguard Worker }
2740*4bdc9457SAndroid Build Coastguard Worker }
2741*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,k_div_4)2742*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, k_div_4) {
2743*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
2744*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2745*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2746*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2747*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2748*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2749*4bdc9457SAndroid Build Coastguard Worker .m(5)
2750*4bdc9457SAndroid Build Coastguard Worker .n(8)
2751*4bdc9457SAndroid Build Coastguard Worker .k(k)
2752*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2753*4bdc9457SAndroid Build Coastguard Worker }
2754*4bdc9457SAndroid Build Coastguard Worker }
2755*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,k_div_4_strided_a)2756*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, k_div_4_strided_a) {
2757*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
2758*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2759*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2760*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2761*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2762*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2763*4bdc9457SAndroid Build Coastguard Worker .m(5)
2764*4bdc9457SAndroid Build Coastguard Worker .n(8)
2765*4bdc9457SAndroid Build Coastguard Worker .k(k)
2766*4bdc9457SAndroid Build Coastguard Worker .a_stride(43)
2767*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2768*4bdc9457SAndroid Build Coastguard Worker }
2769*4bdc9457SAndroid Build Coastguard Worker }
2770*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,k_div_4_subtile)2771*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, k_div_4_subtile) {
2772*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
2773*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
2774*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
2775*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2776*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2777*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2778*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2779*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2780*4bdc9457SAndroid Build Coastguard Worker .m(m)
2781*4bdc9457SAndroid Build Coastguard Worker .n(n)
2782*4bdc9457SAndroid Build Coastguard Worker .k(k)
2783*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2784*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2785*4bdc9457SAndroid Build Coastguard Worker }
2786*4bdc9457SAndroid Build Coastguard Worker }
2787*4bdc9457SAndroid Build Coastguard Worker }
2788*4bdc9457SAndroid Build Coastguard Worker }
2789*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,n_gt_8)2790*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, n_gt_8) {
2791*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
2792*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2793*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2794*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2795*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2796*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2797*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2798*4bdc9457SAndroid Build Coastguard Worker .m(5)
2799*4bdc9457SAndroid Build Coastguard Worker .n(n)
2800*4bdc9457SAndroid Build Coastguard Worker .k(k)
2801*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2802*4bdc9457SAndroid Build Coastguard Worker }
2803*4bdc9457SAndroid Build Coastguard Worker }
2804*4bdc9457SAndroid Build Coastguard Worker }
2805*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,n_gt_8_strided_cn)2806*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, n_gt_8_strided_cn) {
2807*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
2808*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2809*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2810*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2811*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2812*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2813*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2814*4bdc9457SAndroid Build Coastguard Worker .m(5)
2815*4bdc9457SAndroid Build Coastguard Worker .n(n)
2816*4bdc9457SAndroid Build Coastguard Worker .k(k)
2817*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
2818*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2819*4bdc9457SAndroid Build Coastguard Worker }
2820*4bdc9457SAndroid Build Coastguard Worker }
2821*4bdc9457SAndroid Build Coastguard Worker }
2822*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,n_gt_8_strided_a)2823*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, n_gt_8_strided_a) {
2824*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
2825*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2826*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2827*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2828*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2829*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2830*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2831*4bdc9457SAndroid Build Coastguard Worker .m(5)
2832*4bdc9457SAndroid Build Coastguard Worker .n(n)
2833*4bdc9457SAndroid Build Coastguard Worker .k(k)
2834*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
2835*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2836*4bdc9457SAndroid Build Coastguard Worker }
2837*4bdc9457SAndroid Build Coastguard Worker }
2838*4bdc9457SAndroid Build Coastguard Worker }
2839*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,n_gt_8_subtile)2840*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, n_gt_8_subtile) {
2841*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
2842*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2843*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
2844*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2845*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2846*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2847*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2848*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2849*4bdc9457SAndroid Build Coastguard Worker .m(m)
2850*4bdc9457SAndroid Build Coastguard Worker .n(n)
2851*4bdc9457SAndroid Build Coastguard Worker .k(k)
2852*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2853*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2854*4bdc9457SAndroid Build Coastguard Worker }
2855*4bdc9457SAndroid Build Coastguard Worker }
2856*4bdc9457SAndroid Build Coastguard Worker }
2857*4bdc9457SAndroid Build Coastguard Worker }
2858*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,n_div_8)2859*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, n_div_8) {
2860*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
2861*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2862*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2863*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2864*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2865*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2866*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2867*4bdc9457SAndroid Build Coastguard Worker .m(5)
2868*4bdc9457SAndroid Build Coastguard Worker .n(n)
2869*4bdc9457SAndroid Build Coastguard Worker .k(k)
2870*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2871*4bdc9457SAndroid Build Coastguard Worker }
2872*4bdc9457SAndroid Build Coastguard Worker }
2873*4bdc9457SAndroid Build Coastguard Worker }
2874*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,n_div_8_strided_cn)2875*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, n_div_8_strided_cn) {
2876*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
2877*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2878*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2879*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2880*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2881*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2882*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2883*4bdc9457SAndroid Build Coastguard Worker .m(5)
2884*4bdc9457SAndroid Build Coastguard Worker .n(n)
2885*4bdc9457SAndroid Build Coastguard Worker .k(k)
2886*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
2887*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2888*4bdc9457SAndroid Build Coastguard Worker }
2889*4bdc9457SAndroid Build Coastguard Worker }
2890*4bdc9457SAndroid Build Coastguard Worker }
2891*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,n_div_8_strided_a)2892*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, n_div_8_strided_a) {
2893*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
2894*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2895*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2896*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2897*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2898*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2899*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2900*4bdc9457SAndroid Build Coastguard Worker .m(5)
2901*4bdc9457SAndroid Build Coastguard Worker .n(n)
2902*4bdc9457SAndroid Build Coastguard Worker .k(k)
2903*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
2904*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2905*4bdc9457SAndroid Build Coastguard Worker }
2906*4bdc9457SAndroid Build Coastguard Worker }
2907*4bdc9457SAndroid Build Coastguard Worker }
2908*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,n_div_8_subtile)2909*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, n_div_8_subtile) {
2910*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
2911*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2912*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
2913*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2914*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2915*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2916*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2917*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2918*4bdc9457SAndroid Build Coastguard Worker .m(m)
2919*4bdc9457SAndroid Build Coastguard Worker .n(n)
2920*4bdc9457SAndroid Build Coastguard Worker .k(k)
2921*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2922*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2923*4bdc9457SAndroid Build Coastguard Worker }
2924*4bdc9457SAndroid Build Coastguard Worker }
2925*4bdc9457SAndroid Build Coastguard Worker }
2926*4bdc9457SAndroid Build Coastguard Worker }
2927*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,strided_cm_subtile)2928*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, strided_cm_subtile) {
2929*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
2930*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
2931*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
2932*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2933*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2934*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2935*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2936*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2937*4bdc9457SAndroid Build Coastguard Worker .m(m)
2938*4bdc9457SAndroid Build Coastguard Worker .n(n)
2939*4bdc9457SAndroid Build Coastguard Worker .k(k)
2940*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
2941*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
2942*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2943*4bdc9457SAndroid Build Coastguard Worker }
2944*4bdc9457SAndroid Build Coastguard Worker }
2945*4bdc9457SAndroid Build Coastguard Worker }
2946*4bdc9457SAndroid Build Coastguard Worker }
2947*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMSIMD,strided_cm)2948*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMSIMD, strided_cm) {
2949*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2950*4bdc9457SAndroid Build Coastguard Worker .mr(5)
2951*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2952*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2953*4bdc9457SAndroid Build Coastguard Worker .sr(4)
2954*4bdc9457SAndroid Build Coastguard Worker .m(5)
2955*4bdc9457SAndroid Build Coastguard Worker .n(8)
2956*4bdc9457SAndroid Build Coastguard Worker .k(4)
2957*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
2958*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmsimd);
2959*4bdc9457SAndroid Build Coastguard Worker }
2960*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
2961*4bdc9457SAndroid Build Coastguard Worker
2962*4bdc9457SAndroid Build Coastguard Worker
2963*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,k_eq_4)2964*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, k_eq_4) {
2965*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2966*4bdc9457SAndroid Build Coastguard Worker .mr(6)
2967*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2968*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2969*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2970*4bdc9457SAndroid Build Coastguard Worker .m(6)
2971*4bdc9457SAndroid Build Coastguard Worker .n(8)
2972*4bdc9457SAndroid Build Coastguard Worker .k(4)
2973*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
2974*4bdc9457SAndroid Build Coastguard Worker }
2975*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,strided_cn)2976*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, strided_cn) {
2977*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2978*4bdc9457SAndroid Build Coastguard Worker .mr(6)
2979*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2980*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2981*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2982*4bdc9457SAndroid Build Coastguard Worker .m(6)
2983*4bdc9457SAndroid Build Coastguard Worker .n(8)
2984*4bdc9457SAndroid Build Coastguard Worker .k(4)
2985*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
2986*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
2987*4bdc9457SAndroid Build Coastguard Worker }
2988*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,k_eq_4_strided_a)2989*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, k_eq_4_strided_a) {
2990*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
2991*4bdc9457SAndroid Build Coastguard Worker .mr(6)
2992*4bdc9457SAndroid Build Coastguard Worker .nr(8)
2993*4bdc9457SAndroid Build Coastguard Worker .kr(1)
2994*4bdc9457SAndroid Build Coastguard Worker .sr(1)
2995*4bdc9457SAndroid Build Coastguard Worker .m(6)
2996*4bdc9457SAndroid Build Coastguard Worker .n(8)
2997*4bdc9457SAndroid Build Coastguard Worker .k(4)
2998*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
2999*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3000*4bdc9457SAndroid Build Coastguard Worker }
3001*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,k_eq_4_subtile)3002*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, k_eq_4_subtile) {
3003*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
3004*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
3005*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3006*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3007*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3008*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3009*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3010*4bdc9457SAndroid Build Coastguard Worker .m(m)
3011*4bdc9457SAndroid Build Coastguard Worker .n(n)
3012*4bdc9457SAndroid Build Coastguard Worker .k(4)
3013*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3014*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3015*4bdc9457SAndroid Build Coastguard Worker }
3016*4bdc9457SAndroid Build Coastguard Worker }
3017*4bdc9457SAndroid Build Coastguard Worker }
3018*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,k_eq_4_subtile_m)3019*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, k_eq_4_subtile_m) {
3020*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
3021*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3022*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3023*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3024*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3025*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3026*4bdc9457SAndroid Build Coastguard Worker .m(m)
3027*4bdc9457SAndroid Build Coastguard Worker .n(8)
3028*4bdc9457SAndroid Build Coastguard Worker .k(4)
3029*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3030*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3031*4bdc9457SAndroid Build Coastguard Worker }
3032*4bdc9457SAndroid Build Coastguard Worker }
3033*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,k_eq_4_subtile_n)3034*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, k_eq_4_subtile_n) {
3035*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
3036*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3037*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3038*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3039*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3040*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3041*4bdc9457SAndroid Build Coastguard Worker .m(6)
3042*4bdc9457SAndroid Build Coastguard Worker .n(n)
3043*4bdc9457SAndroid Build Coastguard Worker .k(4)
3044*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3045*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3046*4bdc9457SAndroid Build Coastguard Worker }
3047*4bdc9457SAndroid Build Coastguard Worker }
3048*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,k_lt_4)3049*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, k_lt_4) {
3050*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
3051*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3052*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3053*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3054*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3055*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3056*4bdc9457SAndroid Build Coastguard Worker .m(6)
3057*4bdc9457SAndroid Build Coastguard Worker .n(8)
3058*4bdc9457SAndroid Build Coastguard Worker .k(k)
3059*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3060*4bdc9457SAndroid Build Coastguard Worker }
3061*4bdc9457SAndroid Build Coastguard Worker }
3062*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,k_lt_4_strided_a)3063*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, k_lt_4_strided_a) {
3064*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
3065*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3066*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3067*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3068*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3069*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3070*4bdc9457SAndroid Build Coastguard Worker .m(6)
3071*4bdc9457SAndroid Build Coastguard Worker .n(8)
3072*4bdc9457SAndroid Build Coastguard Worker .k(k)
3073*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
3074*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3075*4bdc9457SAndroid Build Coastguard Worker }
3076*4bdc9457SAndroid Build Coastguard Worker }
3077*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,k_lt_4_subtile)3078*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, k_lt_4_subtile) {
3079*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
3080*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
3081*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
3082*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3083*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3084*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3085*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3086*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3087*4bdc9457SAndroid Build Coastguard Worker .m(m)
3088*4bdc9457SAndroid Build Coastguard Worker .n(n)
3089*4bdc9457SAndroid Build Coastguard Worker .k(k)
3090*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3091*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3092*4bdc9457SAndroid Build Coastguard Worker }
3093*4bdc9457SAndroid Build Coastguard Worker }
3094*4bdc9457SAndroid Build Coastguard Worker }
3095*4bdc9457SAndroid Build Coastguard Worker }
3096*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,k_gt_4)3097*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, k_gt_4) {
3098*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
3099*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3100*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3101*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3102*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3103*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3104*4bdc9457SAndroid Build Coastguard Worker .m(6)
3105*4bdc9457SAndroid Build Coastguard Worker .n(8)
3106*4bdc9457SAndroid Build Coastguard Worker .k(k)
3107*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3108*4bdc9457SAndroid Build Coastguard Worker }
3109*4bdc9457SAndroid Build Coastguard Worker }
3110*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,k_gt_4_strided_a)3111*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, k_gt_4_strided_a) {
3112*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
3113*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3114*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3115*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3116*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3117*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3118*4bdc9457SAndroid Build Coastguard Worker .m(6)
3119*4bdc9457SAndroid Build Coastguard Worker .n(8)
3120*4bdc9457SAndroid Build Coastguard Worker .k(k)
3121*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
3122*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3123*4bdc9457SAndroid Build Coastguard Worker }
3124*4bdc9457SAndroid Build Coastguard Worker }
3125*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,k_gt_4_subtile)3126*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, k_gt_4_subtile) {
3127*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
3128*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
3129*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
3130*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3131*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3132*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3133*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3134*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3135*4bdc9457SAndroid Build Coastguard Worker .m(m)
3136*4bdc9457SAndroid Build Coastguard Worker .n(n)
3137*4bdc9457SAndroid Build Coastguard Worker .k(k)
3138*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3139*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3140*4bdc9457SAndroid Build Coastguard Worker }
3141*4bdc9457SAndroid Build Coastguard Worker }
3142*4bdc9457SAndroid Build Coastguard Worker }
3143*4bdc9457SAndroid Build Coastguard Worker }
3144*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,k_div_4)3145*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, k_div_4) {
3146*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
3147*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3148*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3149*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3150*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3151*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3152*4bdc9457SAndroid Build Coastguard Worker .m(6)
3153*4bdc9457SAndroid Build Coastguard Worker .n(8)
3154*4bdc9457SAndroid Build Coastguard Worker .k(k)
3155*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3156*4bdc9457SAndroid Build Coastguard Worker }
3157*4bdc9457SAndroid Build Coastguard Worker }
3158*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,k_div_4_strided_a)3159*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, k_div_4_strided_a) {
3160*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
3161*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3162*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3163*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3164*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3165*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3166*4bdc9457SAndroid Build Coastguard Worker .m(6)
3167*4bdc9457SAndroid Build Coastguard Worker .n(8)
3168*4bdc9457SAndroid Build Coastguard Worker .k(k)
3169*4bdc9457SAndroid Build Coastguard Worker .a_stride(43)
3170*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3171*4bdc9457SAndroid Build Coastguard Worker }
3172*4bdc9457SAndroid Build Coastguard Worker }
3173*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,k_div_4_subtile)3174*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, k_div_4_subtile) {
3175*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
3176*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
3177*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
3178*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3179*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3180*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3181*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3182*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3183*4bdc9457SAndroid Build Coastguard Worker .m(m)
3184*4bdc9457SAndroid Build Coastguard Worker .n(n)
3185*4bdc9457SAndroid Build Coastguard Worker .k(k)
3186*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3187*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3188*4bdc9457SAndroid Build Coastguard Worker }
3189*4bdc9457SAndroid Build Coastguard Worker }
3190*4bdc9457SAndroid Build Coastguard Worker }
3191*4bdc9457SAndroid Build Coastguard Worker }
3192*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,n_gt_8)3193*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, n_gt_8) {
3194*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
3195*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
3196*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3197*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3198*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3199*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3200*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3201*4bdc9457SAndroid Build Coastguard Worker .m(6)
3202*4bdc9457SAndroid Build Coastguard Worker .n(n)
3203*4bdc9457SAndroid Build Coastguard Worker .k(k)
3204*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3205*4bdc9457SAndroid Build Coastguard Worker }
3206*4bdc9457SAndroid Build Coastguard Worker }
3207*4bdc9457SAndroid Build Coastguard Worker }
3208*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,n_gt_8_strided_cn)3209*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, n_gt_8_strided_cn) {
3210*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
3211*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
3212*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3213*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3214*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3215*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3216*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3217*4bdc9457SAndroid Build Coastguard Worker .m(6)
3218*4bdc9457SAndroid Build Coastguard Worker .n(n)
3219*4bdc9457SAndroid Build Coastguard Worker .k(k)
3220*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
3221*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3222*4bdc9457SAndroid Build Coastguard Worker }
3223*4bdc9457SAndroid Build Coastguard Worker }
3224*4bdc9457SAndroid Build Coastguard Worker }
3225*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,n_gt_8_strided_a)3226*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, n_gt_8_strided_a) {
3227*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
3228*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
3229*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3230*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3231*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3232*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3233*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3234*4bdc9457SAndroid Build Coastguard Worker .m(6)
3235*4bdc9457SAndroid Build Coastguard Worker .n(n)
3236*4bdc9457SAndroid Build Coastguard Worker .k(k)
3237*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
3238*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3239*4bdc9457SAndroid Build Coastguard Worker }
3240*4bdc9457SAndroid Build Coastguard Worker }
3241*4bdc9457SAndroid Build Coastguard Worker }
3242*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,n_gt_8_subtile)3243*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, n_gt_8_subtile) {
3244*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
3245*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
3246*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
3247*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3248*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3249*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3250*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3251*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3252*4bdc9457SAndroid Build Coastguard Worker .m(m)
3253*4bdc9457SAndroid Build Coastguard Worker .n(n)
3254*4bdc9457SAndroid Build Coastguard Worker .k(k)
3255*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3256*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3257*4bdc9457SAndroid Build Coastguard Worker }
3258*4bdc9457SAndroid Build Coastguard Worker }
3259*4bdc9457SAndroid Build Coastguard Worker }
3260*4bdc9457SAndroid Build Coastguard Worker }
3261*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,n_div_8)3262*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, n_div_8) {
3263*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
3264*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
3265*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3266*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3267*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3268*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3269*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3270*4bdc9457SAndroid Build Coastguard Worker .m(6)
3271*4bdc9457SAndroid Build Coastguard Worker .n(n)
3272*4bdc9457SAndroid Build Coastguard Worker .k(k)
3273*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3274*4bdc9457SAndroid Build Coastguard Worker }
3275*4bdc9457SAndroid Build Coastguard Worker }
3276*4bdc9457SAndroid Build Coastguard Worker }
3277*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,n_div_8_strided_cn)3278*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, n_div_8_strided_cn) {
3279*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
3280*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
3281*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3282*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3283*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3284*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3285*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3286*4bdc9457SAndroid Build Coastguard Worker .m(6)
3287*4bdc9457SAndroid Build Coastguard Worker .n(n)
3288*4bdc9457SAndroid Build Coastguard Worker .k(k)
3289*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
3290*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3291*4bdc9457SAndroid Build Coastguard Worker }
3292*4bdc9457SAndroid Build Coastguard Worker }
3293*4bdc9457SAndroid Build Coastguard Worker }
3294*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,n_div_8_strided_a)3295*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, n_div_8_strided_a) {
3296*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
3297*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
3298*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3299*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3300*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3301*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3302*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3303*4bdc9457SAndroid Build Coastguard Worker .m(6)
3304*4bdc9457SAndroid Build Coastguard Worker .n(n)
3305*4bdc9457SAndroid Build Coastguard Worker .k(k)
3306*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
3307*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3308*4bdc9457SAndroid Build Coastguard Worker }
3309*4bdc9457SAndroid Build Coastguard Worker }
3310*4bdc9457SAndroid Build Coastguard Worker }
3311*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,n_div_8_subtile)3312*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, n_div_8_subtile) {
3313*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
3314*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
3315*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
3316*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3317*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3318*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3319*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3320*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3321*4bdc9457SAndroid Build Coastguard Worker .m(m)
3322*4bdc9457SAndroid Build Coastguard Worker .n(n)
3323*4bdc9457SAndroid Build Coastguard Worker .k(k)
3324*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3325*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3326*4bdc9457SAndroid Build Coastguard Worker }
3327*4bdc9457SAndroid Build Coastguard Worker }
3328*4bdc9457SAndroid Build Coastguard Worker }
3329*4bdc9457SAndroid Build Coastguard Worker }
3330*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,strided_cm_subtile)3331*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, strided_cm_subtile) {
3332*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
3333*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
3334*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
3335*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3336*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3337*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3338*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3339*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3340*4bdc9457SAndroid Build Coastguard Worker .m(m)
3341*4bdc9457SAndroid Build Coastguard Worker .n(n)
3342*4bdc9457SAndroid Build Coastguard Worker .k(k)
3343*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
3344*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3345*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3346*4bdc9457SAndroid Build Coastguard Worker }
3347*4bdc9457SAndroid Build Coastguard Worker }
3348*4bdc9457SAndroid Build Coastguard Worker }
3349*4bdc9457SAndroid Build Coastguard Worker }
3350*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT,strided_cm)3351*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMSIMD_SPLAT, strided_cm) {
3352*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3353*4bdc9457SAndroid Build Coastguard Worker .mr(6)
3354*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3355*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3356*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3357*4bdc9457SAndroid Build Coastguard Worker .m(6)
3358*4bdc9457SAndroid Build Coastguard Worker .n(8)
3359*4bdc9457SAndroid Build Coastguard Worker .k(4)
3360*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
3361*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_splat);
3362*4bdc9457SAndroid Build Coastguard Worker }
3363*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
3364*4bdc9457SAndroid Build Coastguard Worker
3365*4bdc9457SAndroid Build Coastguard Worker
3366*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1)3367*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1) {
3368*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3369*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3370*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3371*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3372*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3373*4bdc9457SAndroid Build Coastguard Worker .m(1)
3374*4bdc9457SAndroid Build Coastguard Worker .n(8)
3375*4bdc9457SAndroid Build Coastguard Worker .k(1)
3376*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3377*4bdc9457SAndroid Build Coastguard Worker }
3378*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,strided_cn)3379*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cn) {
3380*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3381*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3382*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3383*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3384*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3385*4bdc9457SAndroid Build Coastguard Worker .m(1)
3386*4bdc9457SAndroid Build Coastguard Worker .n(8)
3387*4bdc9457SAndroid Build Coastguard Worker .k(1)
3388*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
3389*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3390*4bdc9457SAndroid Build Coastguard Worker }
3391*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_strided_a)3392*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_strided_a) {
3393*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3394*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3395*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3396*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3397*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3398*4bdc9457SAndroid Build Coastguard Worker .m(1)
3399*4bdc9457SAndroid Build Coastguard Worker .n(8)
3400*4bdc9457SAndroid Build Coastguard Worker .k(1)
3401*4bdc9457SAndroid Build Coastguard Worker .a_stride(3)
3402*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3403*4bdc9457SAndroid Build Coastguard Worker }
3404*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_subtile)3405*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile) {
3406*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
3407*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 1; m++) {
3408*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3409*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3410*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3411*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3412*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3413*4bdc9457SAndroid Build Coastguard Worker .m(m)
3414*4bdc9457SAndroid Build Coastguard Worker .n(n)
3415*4bdc9457SAndroid Build Coastguard Worker .k(1)
3416*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3417*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3418*4bdc9457SAndroid Build Coastguard Worker }
3419*4bdc9457SAndroid Build Coastguard Worker }
3420*4bdc9457SAndroid Build Coastguard Worker }
3421*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_subtile_m)3422*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_m) {
3423*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 1; m++) {
3424*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3425*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3426*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3427*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3428*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3429*4bdc9457SAndroid Build Coastguard Worker .m(m)
3430*4bdc9457SAndroid Build Coastguard Worker .n(8)
3431*4bdc9457SAndroid Build Coastguard Worker .k(1)
3432*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3433*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3434*4bdc9457SAndroid Build Coastguard Worker }
3435*4bdc9457SAndroid Build Coastguard Worker }
3436*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_subtile_n)3437*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_n) {
3438*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
3439*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3440*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3441*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3442*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3443*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3444*4bdc9457SAndroid Build Coastguard Worker .m(1)
3445*4bdc9457SAndroid Build Coastguard Worker .n(n)
3446*4bdc9457SAndroid Build Coastguard Worker .k(1)
3447*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3448*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3449*4bdc9457SAndroid Build Coastguard Worker }
3450*4bdc9457SAndroid Build Coastguard Worker }
3451*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_gt_1)3452*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1) {
3453*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
3454*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3455*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3456*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3457*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3458*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3459*4bdc9457SAndroid Build Coastguard Worker .m(1)
3460*4bdc9457SAndroid Build Coastguard Worker .n(8)
3461*4bdc9457SAndroid Build Coastguard Worker .k(k)
3462*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3463*4bdc9457SAndroid Build Coastguard Worker }
3464*4bdc9457SAndroid Build Coastguard Worker }
3465*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_gt_1_strided_a)3466*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_strided_a) {
3467*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
3468*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3469*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3470*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3471*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3472*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3473*4bdc9457SAndroid Build Coastguard Worker .m(1)
3474*4bdc9457SAndroid Build Coastguard Worker .n(8)
3475*4bdc9457SAndroid Build Coastguard Worker .k(k)
3476*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
3477*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3478*4bdc9457SAndroid Build Coastguard Worker }
3479*4bdc9457SAndroid Build Coastguard Worker }
3480*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_gt_1_subtile)3481*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_subtile) {
3482*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
3483*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
3484*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 1; m++) {
3485*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3486*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3487*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3488*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3489*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3490*4bdc9457SAndroid Build Coastguard Worker .m(m)
3491*4bdc9457SAndroid Build Coastguard Worker .n(n)
3492*4bdc9457SAndroid Build Coastguard Worker .k(k)
3493*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3494*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3495*4bdc9457SAndroid Build Coastguard Worker }
3496*4bdc9457SAndroid Build Coastguard Worker }
3497*4bdc9457SAndroid Build Coastguard Worker }
3498*4bdc9457SAndroid Build Coastguard Worker }
3499*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8)3500*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8) {
3501*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
3502*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
3503*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3504*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3505*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3506*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3507*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3508*4bdc9457SAndroid Build Coastguard Worker .m(1)
3509*4bdc9457SAndroid Build Coastguard Worker .n(n)
3510*4bdc9457SAndroid Build Coastguard Worker .k(k)
3511*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3512*4bdc9457SAndroid Build Coastguard Worker }
3513*4bdc9457SAndroid Build Coastguard Worker }
3514*4bdc9457SAndroid Build Coastguard Worker }
3515*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8_strided_cn)3516*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_cn) {
3517*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
3518*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
3519*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3520*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3521*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3522*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3523*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3524*4bdc9457SAndroid Build Coastguard Worker .m(1)
3525*4bdc9457SAndroid Build Coastguard Worker .n(n)
3526*4bdc9457SAndroid Build Coastguard Worker .k(k)
3527*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
3528*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3529*4bdc9457SAndroid Build Coastguard Worker }
3530*4bdc9457SAndroid Build Coastguard Worker }
3531*4bdc9457SAndroid Build Coastguard Worker }
3532*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8_strided_a)3533*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_a) {
3534*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
3535*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
3536*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3537*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3538*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3539*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3540*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3541*4bdc9457SAndroid Build Coastguard Worker .m(1)
3542*4bdc9457SAndroid Build Coastguard Worker .n(n)
3543*4bdc9457SAndroid Build Coastguard Worker .k(k)
3544*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
3545*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3546*4bdc9457SAndroid Build Coastguard Worker }
3547*4bdc9457SAndroid Build Coastguard Worker }
3548*4bdc9457SAndroid Build Coastguard Worker }
3549*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8_subtile)3550*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_subtile) {
3551*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
3552*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
3553*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 1; m++) {
3554*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3555*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3556*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3557*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3558*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3559*4bdc9457SAndroid Build Coastguard Worker .m(m)
3560*4bdc9457SAndroid Build Coastguard Worker .n(n)
3561*4bdc9457SAndroid Build Coastguard Worker .k(k)
3562*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3563*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3564*4bdc9457SAndroid Build Coastguard Worker }
3565*4bdc9457SAndroid Build Coastguard Worker }
3566*4bdc9457SAndroid Build Coastguard Worker }
3567*4bdc9457SAndroid Build Coastguard Worker }
3568*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8)3569*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8) {
3570*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
3571*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
3572*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3573*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3574*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3575*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3576*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3577*4bdc9457SAndroid Build Coastguard Worker .m(1)
3578*4bdc9457SAndroid Build Coastguard Worker .n(n)
3579*4bdc9457SAndroid Build Coastguard Worker .k(k)
3580*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3581*4bdc9457SAndroid Build Coastguard Worker }
3582*4bdc9457SAndroid Build Coastguard Worker }
3583*4bdc9457SAndroid Build Coastguard Worker }
3584*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8_strided_cn)3585*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_cn) {
3586*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
3587*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
3588*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3589*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3590*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3591*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3592*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3593*4bdc9457SAndroid Build Coastguard Worker .m(1)
3594*4bdc9457SAndroid Build Coastguard Worker .n(n)
3595*4bdc9457SAndroid Build Coastguard Worker .k(k)
3596*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
3597*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3598*4bdc9457SAndroid Build Coastguard Worker }
3599*4bdc9457SAndroid Build Coastguard Worker }
3600*4bdc9457SAndroid Build Coastguard Worker }
3601*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8_strided_a)3602*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_a) {
3603*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
3604*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
3605*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3606*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3607*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3608*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3609*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3610*4bdc9457SAndroid Build Coastguard Worker .m(1)
3611*4bdc9457SAndroid Build Coastguard Worker .n(n)
3612*4bdc9457SAndroid Build Coastguard Worker .k(k)
3613*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
3614*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3615*4bdc9457SAndroid Build Coastguard Worker }
3616*4bdc9457SAndroid Build Coastguard Worker }
3617*4bdc9457SAndroid Build Coastguard Worker }
3618*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8_subtile)3619*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_subtile) {
3620*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
3621*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
3622*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 1; m++) {
3623*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3624*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3625*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3626*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3627*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3628*4bdc9457SAndroid Build Coastguard Worker .m(m)
3629*4bdc9457SAndroid Build Coastguard Worker .n(n)
3630*4bdc9457SAndroid Build Coastguard Worker .k(k)
3631*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3632*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3633*4bdc9457SAndroid Build Coastguard Worker }
3634*4bdc9457SAndroid Build Coastguard Worker }
3635*4bdc9457SAndroid Build Coastguard Worker }
3636*4bdc9457SAndroid Build Coastguard Worker }
3637*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,strided_cm_subtile)3638*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm_subtile) {
3639*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
3640*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
3641*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 1; m++) {
3642*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3643*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3644*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3645*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3646*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3647*4bdc9457SAndroid Build Coastguard Worker .m(m)
3648*4bdc9457SAndroid Build Coastguard Worker .n(n)
3649*4bdc9457SAndroid Build Coastguard Worker .k(k)
3650*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
3651*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3652*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3653*4bdc9457SAndroid Build Coastguard Worker }
3654*4bdc9457SAndroid Build Coastguard Worker }
3655*4bdc9457SAndroid Build Coastguard Worker }
3656*4bdc9457SAndroid Build Coastguard Worker }
3657*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,strided_cm)3658*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm) {
3659*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3660*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3661*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3662*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3663*4bdc9457SAndroid Build Coastguard Worker .sr(1)
3664*4bdc9457SAndroid Build Coastguard Worker .m(1)
3665*4bdc9457SAndroid Build Coastguard Worker .n(8)
3666*4bdc9457SAndroid Build Coastguard Worker .k(1)
3667*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
3668*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
3669*4bdc9457SAndroid Build Coastguard Worker }
3670*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
3671*4bdc9457SAndroid Build Coastguard Worker
3672*4bdc9457SAndroid Build Coastguard Worker
3673*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_eq_4)3674*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_eq_4) {
3675*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3676*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3677*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3678*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3679*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3680*4bdc9457SAndroid Build Coastguard Worker .m(1)
3681*4bdc9457SAndroid Build Coastguard Worker .n(8)
3682*4bdc9457SAndroid Build Coastguard Worker .k(4)
3683*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3684*4bdc9457SAndroid Build Coastguard Worker }
3685*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,strided_cn)3686*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, strided_cn) {
3687*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3688*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3689*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3690*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3691*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3692*4bdc9457SAndroid Build Coastguard Worker .m(1)
3693*4bdc9457SAndroid Build Coastguard Worker .n(8)
3694*4bdc9457SAndroid Build Coastguard Worker .k(4)
3695*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
3696*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3697*4bdc9457SAndroid Build Coastguard Worker }
3698*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_strided_a)3699*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_strided_a) {
3700*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3701*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3702*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3703*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3704*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3705*4bdc9457SAndroid Build Coastguard Worker .m(1)
3706*4bdc9457SAndroid Build Coastguard Worker .n(8)
3707*4bdc9457SAndroid Build Coastguard Worker .k(4)
3708*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
3709*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3710*4bdc9457SAndroid Build Coastguard Worker }
3711*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile)3712*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile) {
3713*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
3714*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 1; m++) {
3715*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3716*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3717*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3718*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3719*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3720*4bdc9457SAndroid Build Coastguard Worker .m(m)
3721*4bdc9457SAndroid Build Coastguard Worker .n(n)
3722*4bdc9457SAndroid Build Coastguard Worker .k(4)
3723*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3724*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3725*4bdc9457SAndroid Build Coastguard Worker }
3726*4bdc9457SAndroid Build Coastguard Worker }
3727*4bdc9457SAndroid Build Coastguard Worker }
3728*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile_m)3729*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_m) {
3730*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 1; m++) {
3731*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3732*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3733*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3734*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3735*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3736*4bdc9457SAndroid Build Coastguard Worker .m(m)
3737*4bdc9457SAndroid Build Coastguard Worker .n(8)
3738*4bdc9457SAndroid Build Coastguard Worker .k(4)
3739*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3740*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3741*4bdc9457SAndroid Build Coastguard Worker }
3742*4bdc9457SAndroid Build Coastguard Worker }
3743*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile_n)3744*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_n) {
3745*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
3746*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3747*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3748*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3749*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3750*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3751*4bdc9457SAndroid Build Coastguard Worker .m(1)
3752*4bdc9457SAndroid Build Coastguard Worker .n(n)
3753*4bdc9457SAndroid Build Coastguard Worker .k(4)
3754*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3755*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3756*4bdc9457SAndroid Build Coastguard Worker }
3757*4bdc9457SAndroid Build Coastguard Worker }
3758*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_lt_4)3759*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_lt_4) {
3760*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
3761*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3762*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3763*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3764*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3765*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3766*4bdc9457SAndroid Build Coastguard Worker .m(1)
3767*4bdc9457SAndroid Build Coastguard Worker .n(8)
3768*4bdc9457SAndroid Build Coastguard Worker .k(k)
3769*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3770*4bdc9457SAndroid Build Coastguard Worker }
3771*4bdc9457SAndroid Build Coastguard Worker }
3772*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_lt_4_strided_a)3773*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_strided_a) {
3774*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
3775*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3776*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3777*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3778*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3779*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3780*4bdc9457SAndroid Build Coastguard Worker .m(1)
3781*4bdc9457SAndroid Build Coastguard Worker .n(8)
3782*4bdc9457SAndroid Build Coastguard Worker .k(k)
3783*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
3784*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3785*4bdc9457SAndroid Build Coastguard Worker }
3786*4bdc9457SAndroid Build Coastguard Worker }
3787*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_lt_4_subtile)3788*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_subtile) {
3789*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
3790*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
3791*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 1; m++) {
3792*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3793*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3794*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3795*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3796*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3797*4bdc9457SAndroid Build Coastguard Worker .m(m)
3798*4bdc9457SAndroid Build Coastguard Worker .n(n)
3799*4bdc9457SAndroid Build Coastguard Worker .k(k)
3800*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3801*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3802*4bdc9457SAndroid Build Coastguard Worker }
3803*4bdc9457SAndroid Build Coastguard Worker }
3804*4bdc9457SAndroid Build Coastguard Worker }
3805*4bdc9457SAndroid Build Coastguard Worker }
3806*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_gt_4)3807*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_gt_4) {
3808*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
3809*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3810*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3811*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3812*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3813*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3814*4bdc9457SAndroid Build Coastguard Worker .m(1)
3815*4bdc9457SAndroid Build Coastguard Worker .n(8)
3816*4bdc9457SAndroid Build Coastguard Worker .k(k)
3817*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3818*4bdc9457SAndroid Build Coastguard Worker }
3819*4bdc9457SAndroid Build Coastguard Worker }
3820*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_gt_4_strided_a)3821*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_strided_a) {
3822*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
3823*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3824*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3825*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3826*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3827*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3828*4bdc9457SAndroid Build Coastguard Worker .m(1)
3829*4bdc9457SAndroid Build Coastguard Worker .n(8)
3830*4bdc9457SAndroid Build Coastguard Worker .k(k)
3831*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
3832*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3833*4bdc9457SAndroid Build Coastguard Worker }
3834*4bdc9457SAndroid Build Coastguard Worker }
3835*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_gt_4_subtile)3836*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_subtile) {
3837*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
3838*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
3839*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 1; m++) {
3840*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3841*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3842*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3843*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3844*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3845*4bdc9457SAndroid Build Coastguard Worker .m(m)
3846*4bdc9457SAndroid Build Coastguard Worker .n(n)
3847*4bdc9457SAndroid Build Coastguard Worker .k(k)
3848*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3849*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3850*4bdc9457SAndroid Build Coastguard Worker }
3851*4bdc9457SAndroid Build Coastguard Worker }
3852*4bdc9457SAndroid Build Coastguard Worker }
3853*4bdc9457SAndroid Build Coastguard Worker }
3854*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_div_4)3855*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_div_4) {
3856*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
3857*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3858*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3859*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3860*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3861*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3862*4bdc9457SAndroid Build Coastguard Worker .m(1)
3863*4bdc9457SAndroid Build Coastguard Worker .n(8)
3864*4bdc9457SAndroid Build Coastguard Worker .k(k)
3865*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3866*4bdc9457SAndroid Build Coastguard Worker }
3867*4bdc9457SAndroid Build Coastguard Worker }
3868*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_div_4_strided_a)3869*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_div_4_strided_a) {
3870*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
3871*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3872*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3873*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3874*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3875*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3876*4bdc9457SAndroid Build Coastguard Worker .m(1)
3877*4bdc9457SAndroid Build Coastguard Worker .n(8)
3878*4bdc9457SAndroid Build Coastguard Worker .k(k)
3879*4bdc9457SAndroid Build Coastguard Worker .a_stride(43)
3880*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3881*4bdc9457SAndroid Build Coastguard Worker }
3882*4bdc9457SAndroid Build Coastguard Worker }
3883*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,k_div_4_subtile)3884*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, k_div_4_subtile) {
3885*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
3886*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
3887*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 1; m++) {
3888*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3889*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3890*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3891*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3892*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3893*4bdc9457SAndroid Build Coastguard Worker .m(m)
3894*4bdc9457SAndroid Build Coastguard Worker .n(n)
3895*4bdc9457SAndroid Build Coastguard Worker .k(k)
3896*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3897*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3898*4bdc9457SAndroid Build Coastguard Worker }
3899*4bdc9457SAndroid Build Coastguard Worker }
3900*4bdc9457SAndroid Build Coastguard Worker }
3901*4bdc9457SAndroid Build Coastguard Worker }
3902*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,n_gt_8)3903*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, n_gt_8) {
3904*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
3905*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
3906*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3907*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3908*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3909*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3910*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3911*4bdc9457SAndroid Build Coastguard Worker .m(1)
3912*4bdc9457SAndroid Build Coastguard Worker .n(n)
3913*4bdc9457SAndroid Build Coastguard Worker .k(k)
3914*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3915*4bdc9457SAndroid Build Coastguard Worker }
3916*4bdc9457SAndroid Build Coastguard Worker }
3917*4bdc9457SAndroid Build Coastguard Worker }
3918*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_strided_cn)3919*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_cn) {
3920*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
3921*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
3922*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3923*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3924*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3925*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3926*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3927*4bdc9457SAndroid Build Coastguard Worker .m(1)
3928*4bdc9457SAndroid Build Coastguard Worker .n(n)
3929*4bdc9457SAndroid Build Coastguard Worker .k(k)
3930*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
3931*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3932*4bdc9457SAndroid Build Coastguard Worker }
3933*4bdc9457SAndroid Build Coastguard Worker }
3934*4bdc9457SAndroid Build Coastguard Worker }
3935*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_strided_a)3936*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_a) {
3937*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
3938*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
3939*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3940*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3941*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3942*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3943*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3944*4bdc9457SAndroid Build Coastguard Worker .m(1)
3945*4bdc9457SAndroid Build Coastguard Worker .n(n)
3946*4bdc9457SAndroid Build Coastguard Worker .k(k)
3947*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
3948*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3949*4bdc9457SAndroid Build Coastguard Worker }
3950*4bdc9457SAndroid Build Coastguard Worker }
3951*4bdc9457SAndroid Build Coastguard Worker }
3952*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_subtile)3953*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_subtile) {
3954*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
3955*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
3956*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 1; m++) {
3957*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3958*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3959*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3960*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3961*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3962*4bdc9457SAndroid Build Coastguard Worker .m(m)
3963*4bdc9457SAndroid Build Coastguard Worker .n(n)
3964*4bdc9457SAndroid Build Coastguard Worker .k(k)
3965*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
3966*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3967*4bdc9457SAndroid Build Coastguard Worker }
3968*4bdc9457SAndroid Build Coastguard Worker }
3969*4bdc9457SAndroid Build Coastguard Worker }
3970*4bdc9457SAndroid Build Coastguard Worker }
3971*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,n_div_8)3972*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, n_div_8) {
3973*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
3974*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
3975*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3976*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3977*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3978*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3979*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3980*4bdc9457SAndroid Build Coastguard Worker .m(1)
3981*4bdc9457SAndroid Build Coastguard Worker .n(n)
3982*4bdc9457SAndroid Build Coastguard Worker .k(k)
3983*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
3984*4bdc9457SAndroid Build Coastguard Worker }
3985*4bdc9457SAndroid Build Coastguard Worker }
3986*4bdc9457SAndroid Build Coastguard Worker }
3987*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,n_div_8_strided_cn)3988*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_cn) {
3989*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
3990*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
3991*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
3992*4bdc9457SAndroid Build Coastguard Worker .mr(1)
3993*4bdc9457SAndroid Build Coastguard Worker .nr(8)
3994*4bdc9457SAndroid Build Coastguard Worker .kr(1)
3995*4bdc9457SAndroid Build Coastguard Worker .sr(4)
3996*4bdc9457SAndroid Build Coastguard Worker .m(1)
3997*4bdc9457SAndroid Build Coastguard Worker .n(n)
3998*4bdc9457SAndroid Build Coastguard Worker .k(k)
3999*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
4000*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
4001*4bdc9457SAndroid Build Coastguard Worker }
4002*4bdc9457SAndroid Build Coastguard Worker }
4003*4bdc9457SAndroid Build Coastguard Worker }
4004*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,n_div_8_strided_a)4005*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_a) {
4006*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
4007*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
4008*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4009*4bdc9457SAndroid Build Coastguard Worker .mr(1)
4010*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4011*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4012*4bdc9457SAndroid Build Coastguard Worker .sr(4)
4013*4bdc9457SAndroid Build Coastguard Worker .m(1)
4014*4bdc9457SAndroid Build Coastguard Worker .n(n)
4015*4bdc9457SAndroid Build Coastguard Worker .k(k)
4016*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
4017*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
4018*4bdc9457SAndroid Build Coastguard Worker }
4019*4bdc9457SAndroid Build Coastguard Worker }
4020*4bdc9457SAndroid Build Coastguard Worker }
4021*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,n_div_8_subtile)4022*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, n_div_8_subtile) {
4023*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
4024*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
4025*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 1; m++) {
4026*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4027*4bdc9457SAndroid Build Coastguard Worker .mr(1)
4028*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4029*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4030*4bdc9457SAndroid Build Coastguard Worker .sr(4)
4031*4bdc9457SAndroid Build Coastguard Worker .m(m)
4032*4bdc9457SAndroid Build Coastguard Worker .n(n)
4033*4bdc9457SAndroid Build Coastguard Worker .k(k)
4034*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4035*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
4036*4bdc9457SAndroid Build Coastguard Worker }
4037*4bdc9457SAndroid Build Coastguard Worker }
4038*4bdc9457SAndroid Build Coastguard Worker }
4039*4bdc9457SAndroid Build Coastguard Worker }
4040*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,strided_cm_subtile)4041*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, strided_cm_subtile) {
4042*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
4043*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
4044*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 1; m++) {
4045*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4046*4bdc9457SAndroid Build Coastguard Worker .mr(1)
4047*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4048*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4049*4bdc9457SAndroid Build Coastguard Worker .sr(4)
4050*4bdc9457SAndroid Build Coastguard Worker .m(m)
4051*4bdc9457SAndroid Build Coastguard Worker .n(n)
4052*4bdc9457SAndroid Build Coastguard Worker .k(k)
4053*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
4054*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4055*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
4056*4bdc9457SAndroid Build Coastguard Worker }
4057*4bdc9457SAndroid Build Coastguard Worker }
4058*4bdc9457SAndroid Build Coastguard Worker }
4059*4bdc9457SAndroid Build Coastguard Worker }
4060*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA,strided_cm)4061*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_1X8S4__WASMRELAXEDSIMD_FMA, strided_cm) {
4062*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4063*4bdc9457SAndroid Build Coastguard Worker .mr(1)
4064*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4065*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4066*4bdc9457SAndroid Build Coastguard Worker .sr(4)
4067*4bdc9457SAndroid Build Coastguard Worker .m(1)
4068*4bdc9457SAndroid Build Coastguard Worker .n(8)
4069*4bdc9457SAndroid Build Coastguard Worker .k(4)
4070*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
4071*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmrelaxedsimd_fma);
4072*4bdc9457SAndroid Build Coastguard Worker }
4073*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
4074*4bdc9457SAndroid Build Coastguard Worker
4075*4bdc9457SAndroid Build Coastguard Worker
4076*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1)4077*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1) {
4078*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4079*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4080*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4081*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4082*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4083*4bdc9457SAndroid Build Coastguard Worker .m(3)
4084*4bdc9457SAndroid Build Coastguard Worker .n(8)
4085*4bdc9457SAndroid Build Coastguard Worker .k(1)
4086*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4087*4bdc9457SAndroid Build Coastguard Worker }
4088*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,strided_cn)4089*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cn) {
4090*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4091*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4092*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4093*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4094*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4095*4bdc9457SAndroid Build Coastguard Worker .m(3)
4096*4bdc9457SAndroid Build Coastguard Worker .n(8)
4097*4bdc9457SAndroid Build Coastguard Worker .k(1)
4098*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
4099*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4100*4bdc9457SAndroid Build Coastguard Worker }
4101*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_strided_a)4102*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_strided_a) {
4103*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4104*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4105*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4106*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4107*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4108*4bdc9457SAndroid Build Coastguard Worker .m(3)
4109*4bdc9457SAndroid Build Coastguard Worker .n(8)
4110*4bdc9457SAndroid Build Coastguard Worker .k(1)
4111*4bdc9457SAndroid Build Coastguard Worker .a_stride(3)
4112*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4113*4bdc9457SAndroid Build Coastguard Worker }
4114*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_subtile)4115*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile) {
4116*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
4117*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
4118*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4119*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4120*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4121*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4122*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4123*4bdc9457SAndroid Build Coastguard Worker .m(m)
4124*4bdc9457SAndroid Build Coastguard Worker .n(n)
4125*4bdc9457SAndroid Build Coastguard Worker .k(1)
4126*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4127*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4128*4bdc9457SAndroid Build Coastguard Worker }
4129*4bdc9457SAndroid Build Coastguard Worker }
4130*4bdc9457SAndroid Build Coastguard Worker }
4131*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_subtile_m)4132*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_m) {
4133*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
4134*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4135*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4136*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4137*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4138*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4139*4bdc9457SAndroid Build Coastguard Worker .m(m)
4140*4bdc9457SAndroid Build Coastguard Worker .n(8)
4141*4bdc9457SAndroid Build Coastguard Worker .k(1)
4142*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4143*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4144*4bdc9457SAndroid Build Coastguard Worker }
4145*4bdc9457SAndroid Build Coastguard Worker }
4146*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_subtile_n)4147*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_n) {
4148*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
4149*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4150*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4151*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4152*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4153*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4154*4bdc9457SAndroid Build Coastguard Worker .m(3)
4155*4bdc9457SAndroid Build Coastguard Worker .n(n)
4156*4bdc9457SAndroid Build Coastguard Worker .k(1)
4157*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4158*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4159*4bdc9457SAndroid Build Coastguard Worker }
4160*4bdc9457SAndroid Build Coastguard Worker }
4161*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_gt_1)4162*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1) {
4163*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
4164*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4165*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4166*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4167*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4168*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4169*4bdc9457SAndroid Build Coastguard Worker .m(3)
4170*4bdc9457SAndroid Build Coastguard Worker .n(8)
4171*4bdc9457SAndroid Build Coastguard Worker .k(k)
4172*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4173*4bdc9457SAndroid Build Coastguard Worker }
4174*4bdc9457SAndroid Build Coastguard Worker }
4175*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_gt_1_strided_a)4176*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_strided_a) {
4177*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
4178*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4179*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4180*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4181*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4182*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4183*4bdc9457SAndroid Build Coastguard Worker .m(3)
4184*4bdc9457SAndroid Build Coastguard Worker .n(8)
4185*4bdc9457SAndroid Build Coastguard Worker .k(k)
4186*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
4187*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4188*4bdc9457SAndroid Build Coastguard Worker }
4189*4bdc9457SAndroid Build Coastguard Worker }
4190*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_gt_1_subtile)4191*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_subtile) {
4192*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
4193*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
4194*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
4195*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4196*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4197*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4198*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4199*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4200*4bdc9457SAndroid Build Coastguard Worker .m(m)
4201*4bdc9457SAndroid Build Coastguard Worker .n(n)
4202*4bdc9457SAndroid Build Coastguard Worker .k(k)
4203*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4204*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4205*4bdc9457SAndroid Build Coastguard Worker }
4206*4bdc9457SAndroid Build Coastguard Worker }
4207*4bdc9457SAndroid Build Coastguard Worker }
4208*4bdc9457SAndroid Build Coastguard Worker }
4209*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8)4210*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8) {
4211*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
4212*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
4213*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4214*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4215*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4216*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4217*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4218*4bdc9457SAndroid Build Coastguard Worker .m(3)
4219*4bdc9457SAndroid Build Coastguard Worker .n(n)
4220*4bdc9457SAndroid Build Coastguard Worker .k(k)
4221*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4222*4bdc9457SAndroid Build Coastguard Worker }
4223*4bdc9457SAndroid Build Coastguard Worker }
4224*4bdc9457SAndroid Build Coastguard Worker }
4225*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8_strided_cn)4226*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_cn) {
4227*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
4228*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
4229*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4230*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4231*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4232*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4233*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4234*4bdc9457SAndroid Build Coastguard Worker .m(3)
4235*4bdc9457SAndroid Build Coastguard Worker .n(n)
4236*4bdc9457SAndroid Build Coastguard Worker .k(k)
4237*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
4238*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4239*4bdc9457SAndroid Build Coastguard Worker }
4240*4bdc9457SAndroid Build Coastguard Worker }
4241*4bdc9457SAndroid Build Coastguard Worker }
4242*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8_strided_a)4243*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_a) {
4244*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
4245*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
4246*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4247*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4248*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4249*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4250*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4251*4bdc9457SAndroid Build Coastguard Worker .m(3)
4252*4bdc9457SAndroid Build Coastguard Worker .n(n)
4253*4bdc9457SAndroid Build Coastguard Worker .k(k)
4254*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
4255*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4256*4bdc9457SAndroid Build Coastguard Worker }
4257*4bdc9457SAndroid Build Coastguard Worker }
4258*4bdc9457SAndroid Build Coastguard Worker }
4259*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8_subtile)4260*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_subtile) {
4261*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
4262*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
4263*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
4264*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4265*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4266*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4267*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4268*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4269*4bdc9457SAndroid Build Coastguard Worker .m(m)
4270*4bdc9457SAndroid Build Coastguard Worker .n(n)
4271*4bdc9457SAndroid Build Coastguard Worker .k(k)
4272*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4273*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4274*4bdc9457SAndroid Build Coastguard Worker }
4275*4bdc9457SAndroid Build Coastguard Worker }
4276*4bdc9457SAndroid Build Coastguard Worker }
4277*4bdc9457SAndroid Build Coastguard Worker }
4278*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8)4279*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8) {
4280*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
4281*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
4282*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4283*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4284*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4285*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4286*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4287*4bdc9457SAndroid Build Coastguard Worker .m(3)
4288*4bdc9457SAndroid Build Coastguard Worker .n(n)
4289*4bdc9457SAndroid Build Coastguard Worker .k(k)
4290*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4291*4bdc9457SAndroid Build Coastguard Worker }
4292*4bdc9457SAndroid Build Coastguard Worker }
4293*4bdc9457SAndroid Build Coastguard Worker }
4294*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8_strided_cn)4295*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_cn) {
4296*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
4297*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
4298*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4299*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4300*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4301*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4302*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4303*4bdc9457SAndroid Build Coastguard Worker .m(3)
4304*4bdc9457SAndroid Build Coastguard Worker .n(n)
4305*4bdc9457SAndroid Build Coastguard Worker .k(k)
4306*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
4307*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4308*4bdc9457SAndroid Build Coastguard Worker }
4309*4bdc9457SAndroid Build Coastguard Worker }
4310*4bdc9457SAndroid Build Coastguard Worker }
4311*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8_strided_a)4312*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_a) {
4313*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
4314*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
4315*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4316*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4317*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4318*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4319*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4320*4bdc9457SAndroid Build Coastguard Worker .m(3)
4321*4bdc9457SAndroid Build Coastguard Worker .n(n)
4322*4bdc9457SAndroid Build Coastguard Worker .k(k)
4323*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
4324*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4325*4bdc9457SAndroid Build Coastguard Worker }
4326*4bdc9457SAndroid Build Coastguard Worker }
4327*4bdc9457SAndroid Build Coastguard Worker }
4328*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8_subtile)4329*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_subtile) {
4330*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
4331*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
4332*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
4333*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4334*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4335*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4336*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4337*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4338*4bdc9457SAndroid Build Coastguard Worker .m(m)
4339*4bdc9457SAndroid Build Coastguard Worker .n(n)
4340*4bdc9457SAndroid Build Coastguard Worker .k(k)
4341*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4342*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4343*4bdc9457SAndroid Build Coastguard Worker }
4344*4bdc9457SAndroid Build Coastguard Worker }
4345*4bdc9457SAndroid Build Coastguard Worker }
4346*4bdc9457SAndroid Build Coastguard Worker }
4347*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,strided_cm_subtile)4348*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm_subtile) {
4349*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
4350*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
4351*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 3; m++) {
4352*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4353*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4354*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4355*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4356*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4357*4bdc9457SAndroid Build Coastguard Worker .m(m)
4358*4bdc9457SAndroid Build Coastguard Worker .n(n)
4359*4bdc9457SAndroid Build Coastguard Worker .k(k)
4360*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
4361*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4362*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4363*4bdc9457SAndroid Build Coastguard Worker }
4364*4bdc9457SAndroid Build Coastguard Worker }
4365*4bdc9457SAndroid Build Coastguard Worker }
4366*4bdc9457SAndroid Build Coastguard Worker }
4367*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,strided_cm)4368*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm) {
4369*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4370*4bdc9457SAndroid Build Coastguard Worker .mr(3)
4371*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4372*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4373*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4374*4bdc9457SAndroid Build Coastguard Worker .m(3)
4375*4bdc9457SAndroid Build Coastguard Worker .n(8)
4376*4bdc9457SAndroid Build Coastguard Worker .k(1)
4377*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
4378*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
4379*4bdc9457SAndroid Build Coastguard Worker }
4380*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
4381*4bdc9457SAndroid Build Coastguard Worker
4382*4bdc9457SAndroid Build Coastguard Worker
4383*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_eq_4)4384*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_eq_4) {
4385*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4386*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4387*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4388*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4389*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4390*4bdc9457SAndroid Build Coastguard Worker .m(4)
4391*4bdc9457SAndroid Build Coastguard Worker .n(2)
4392*4bdc9457SAndroid Build Coastguard Worker .k(4)
4393*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4394*4bdc9457SAndroid Build Coastguard Worker }
4395*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,strided_cn)4396*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, strided_cn) {
4397*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4398*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4399*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4400*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4401*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4402*4bdc9457SAndroid Build Coastguard Worker .m(4)
4403*4bdc9457SAndroid Build Coastguard Worker .n(2)
4404*4bdc9457SAndroid Build Coastguard Worker .k(4)
4405*4bdc9457SAndroid Build Coastguard Worker .cn_stride(5)
4406*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4407*4bdc9457SAndroid Build Coastguard Worker }
4408*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_eq_4_strided_a)4409*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_eq_4_strided_a) {
4410*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4411*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4412*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4413*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4414*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4415*4bdc9457SAndroid Build Coastguard Worker .m(4)
4416*4bdc9457SAndroid Build Coastguard Worker .n(2)
4417*4bdc9457SAndroid Build Coastguard Worker .k(4)
4418*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
4419*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4420*4bdc9457SAndroid Build Coastguard Worker }
4421*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile)4422*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile) {
4423*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 2; n++) {
4424*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
4425*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4426*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4427*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4428*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4429*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4430*4bdc9457SAndroid Build Coastguard Worker .m(m)
4431*4bdc9457SAndroid Build Coastguard Worker .n(n)
4432*4bdc9457SAndroid Build Coastguard Worker .k(4)
4433*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4434*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4435*4bdc9457SAndroid Build Coastguard Worker }
4436*4bdc9457SAndroid Build Coastguard Worker }
4437*4bdc9457SAndroid Build Coastguard Worker }
4438*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile_m)4439*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_m) {
4440*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
4441*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4442*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4443*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4444*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4445*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4446*4bdc9457SAndroid Build Coastguard Worker .m(m)
4447*4bdc9457SAndroid Build Coastguard Worker .n(2)
4448*4bdc9457SAndroid Build Coastguard Worker .k(4)
4449*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4450*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4451*4bdc9457SAndroid Build Coastguard Worker }
4452*4bdc9457SAndroid Build Coastguard Worker }
4453*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile_n)4454*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_n) {
4455*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 2; n++) {
4456*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4457*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4458*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4459*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4460*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4461*4bdc9457SAndroid Build Coastguard Worker .m(4)
4462*4bdc9457SAndroid Build Coastguard Worker .n(n)
4463*4bdc9457SAndroid Build Coastguard Worker .k(4)
4464*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4465*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4466*4bdc9457SAndroid Build Coastguard Worker }
4467*4bdc9457SAndroid Build Coastguard Worker }
4468*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_lt_4)4469*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_lt_4) {
4470*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
4471*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4472*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4473*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4474*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4475*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4476*4bdc9457SAndroid Build Coastguard Worker .m(4)
4477*4bdc9457SAndroid Build Coastguard Worker .n(2)
4478*4bdc9457SAndroid Build Coastguard Worker .k(k)
4479*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4480*4bdc9457SAndroid Build Coastguard Worker }
4481*4bdc9457SAndroid Build Coastguard Worker }
4482*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_lt_4_strided_a)4483*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_lt_4_strided_a) {
4484*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
4485*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4486*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4487*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4488*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4489*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4490*4bdc9457SAndroid Build Coastguard Worker .m(4)
4491*4bdc9457SAndroid Build Coastguard Worker .n(2)
4492*4bdc9457SAndroid Build Coastguard Worker .k(k)
4493*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
4494*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4495*4bdc9457SAndroid Build Coastguard Worker }
4496*4bdc9457SAndroid Build Coastguard Worker }
4497*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_lt_4_subtile)4498*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_lt_4_subtile) {
4499*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
4500*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 2; n++) {
4501*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
4502*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4503*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4504*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4505*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4506*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4507*4bdc9457SAndroid Build Coastguard Worker .m(m)
4508*4bdc9457SAndroid Build Coastguard Worker .n(n)
4509*4bdc9457SAndroid Build Coastguard Worker .k(k)
4510*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4511*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4512*4bdc9457SAndroid Build Coastguard Worker }
4513*4bdc9457SAndroid Build Coastguard Worker }
4514*4bdc9457SAndroid Build Coastguard Worker }
4515*4bdc9457SAndroid Build Coastguard Worker }
4516*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_gt_4)4517*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_gt_4) {
4518*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
4519*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4520*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4521*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4522*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4523*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4524*4bdc9457SAndroid Build Coastguard Worker .m(4)
4525*4bdc9457SAndroid Build Coastguard Worker .n(2)
4526*4bdc9457SAndroid Build Coastguard Worker .k(k)
4527*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4528*4bdc9457SAndroid Build Coastguard Worker }
4529*4bdc9457SAndroid Build Coastguard Worker }
4530*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_gt_4_strided_a)4531*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_gt_4_strided_a) {
4532*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
4533*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4534*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4535*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4536*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4537*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4538*4bdc9457SAndroid Build Coastguard Worker .m(4)
4539*4bdc9457SAndroid Build Coastguard Worker .n(2)
4540*4bdc9457SAndroid Build Coastguard Worker .k(k)
4541*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
4542*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4543*4bdc9457SAndroid Build Coastguard Worker }
4544*4bdc9457SAndroid Build Coastguard Worker }
4545*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_gt_4_subtile)4546*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_gt_4_subtile) {
4547*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
4548*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 2; n++) {
4549*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
4550*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4551*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4552*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4553*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4554*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4555*4bdc9457SAndroid Build Coastguard Worker .m(m)
4556*4bdc9457SAndroid Build Coastguard Worker .n(n)
4557*4bdc9457SAndroid Build Coastguard Worker .k(k)
4558*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4559*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4560*4bdc9457SAndroid Build Coastguard Worker }
4561*4bdc9457SAndroid Build Coastguard Worker }
4562*4bdc9457SAndroid Build Coastguard Worker }
4563*4bdc9457SAndroid Build Coastguard Worker }
4564*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_div_4)4565*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_div_4) {
4566*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
4567*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4568*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4569*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4570*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4571*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4572*4bdc9457SAndroid Build Coastguard Worker .m(4)
4573*4bdc9457SAndroid Build Coastguard Worker .n(2)
4574*4bdc9457SAndroid Build Coastguard Worker .k(k)
4575*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4576*4bdc9457SAndroid Build Coastguard Worker }
4577*4bdc9457SAndroid Build Coastguard Worker }
4578*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_div_4_strided_a)4579*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_div_4_strided_a) {
4580*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
4581*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4582*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4583*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4584*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4585*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4586*4bdc9457SAndroid Build Coastguard Worker .m(4)
4587*4bdc9457SAndroid Build Coastguard Worker .n(2)
4588*4bdc9457SAndroid Build Coastguard Worker .k(k)
4589*4bdc9457SAndroid Build Coastguard Worker .a_stride(43)
4590*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4591*4bdc9457SAndroid Build Coastguard Worker }
4592*4bdc9457SAndroid Build Coastguard Worker }
4593*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,k_div_4_subtile)4594*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, k_div_4_subtile) {
4595*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
4596*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 2; n++) {
4597*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
4598*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4599*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4600*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4601*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4602*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4603*4bdc9457SAndroid Build Coastguard Worker .m(m)
4604*4bdc9457SAndroid Build Coastguard Worker .n(n)
4605*4bdc9457SAndroid Build Coastguard Worker .k(k)
4606*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4607*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4608*4bdc9457SAndroid Build Coastguard Worker }
4609*4bdc9457SAndroid Build Coastguard Worker }
4610*4bdc9457SAndroid Build Coastguard Worker }
4611*4bdc9457SAndroid Build Coastguard Worker }
4612*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,n_gt_2)4613*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, n_gt_2) {
4614*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 3; n < 4; n++) {
4615*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
4616*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4617*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4618*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4619*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4620*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4621*4bdc9457SAndroid Build Coastguard Worker .m(4)
4622*4bdc9457SAndroid Build Coastguard Worker .n(n)
4623*4bdc9457SAndroid Build Coastguard Worker .k(k)
4624*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4625*4bdc9457SAndroid Build Coastguard Worker }
4626*4bdc9457SAndroid Build Coastguard Worker }
4627*4bdc9457SAndroid Build Coastguard Worker }
4628*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,n_gt_2_strided_cn)4629*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, n_gt_2_strided_cn) {
4630*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 3; n < 4; n++) {
4631*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
4632*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4633*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4634*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4635*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4636*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4637*4bdc9457SAndroid Build Coastguard Worker .m(4)
4638*4bdc9457SAndroid Build Coastguard Worker .n(n)
4639*4bdc9457SAndroid Build Coastguard Worker .k(k)
4640*4bdc9457SAndroid Build Coastguard Worker .cn_stride(5)
4641*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4642*4bdc9457SAndroid Build Coastguard Worker }
4643*4bdc9457SAndroid Build Coastguard Worker }
4644*4bdc9457SAndroid Build Coastguard Worker }
4645*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,n_gt_2_strided_a)4646*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, n_gt_2_strided_a) {
4647*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 3; n < 4; n++) {
4648*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
4649*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4650*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4651*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4652*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4653*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4654*4bdc9457SAndroid Build Coastguard Worker .m(4)
4655*4bdc9457SAndroid Build Coastguard Worker .n(n)
4656*4bdc9457SAndroid Build Coastguard Worker .k(k)
4657*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
4658*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4659*4bdc9457SAndroid Build Coastguard Worker }
4660*4bdc9457SAndroid Build Coastguard Worker }
4661*4bdc9457SAndroid Build Coastguard Worker }
4662*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,n_gt_2_subtile)4663*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, n_gt_2_subtile) {
4664*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 3; n < 4; n++) {
4665*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
4666*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
4667*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4668*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4669*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4670*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4671*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4672*4bdc9457SAndroid Build Coastguard Worker .m(m)
4673*4bdc9457SAndroid Build Coastguard Worker .n(n)
4674*4bdc9457SAndroid Build Coastguard Worker .k(k)
4675*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4676*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4677*4bdc9457SAndroid Build Coastguard Worker }
4678*4bdc9457SAndroid Build Coastguard Worker }
4679*4bdc9457SAndroid Build Coastguard Worker }
4680*4bdc9457SAndroid Build Coastguard Worker }
4681*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,n_div_2)4682*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, n_div_2) {
4683*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 4; n <= 6; n += 2) {
4684*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
4685*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4686*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4687*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4688*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4689*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4690*4bdc9457SAndroid Build Coastguard Worker .m(4)
4691*4bdc9457SAndroid Build Coastguard Worker .n(n)
4692*4bdc9457SAndroid Build Coastguard Worker .k(k)
4693*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4694*4bdc9457SAndroid Build Coastguard Worker }
4695*4bdc9457SAndroid Build Coastguard Worker }
4696*4bdc9457SAndroid Build Coastguard Worker }
4697*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,n_div_2_strided_cn)4698*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, n_div_2_strided_cn) {
4699*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 4; n <= 6; n += 2) {
4700*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
4701*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4702*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4703*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4704*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4705*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4706*4bdc9457SAndroid Build Coastguard Worker .m(4)
4707*4bdc9457SAndroid Build Coastguard Worker .n(n)
4708*4bdc9457SAndroid Build Coastguard Worker .k(k)
4709*4bdc9457SAndroid Build Coastguard Worker .cn_stride(5)
4710*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4711*4bdc9457SAndroid Build Coastguard Worker }
4712*4bdc9457SAndroid Build Coastguard Worker }
4713*4bdc9457SAndroid Build Coastguard Worker }
4714*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,n_div_2_strided_a)4715*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, n_div_2_strided_a) {
4716*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 4; n <= 6; n += 2) {
4717*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
4718*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4719*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4720*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4721*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4722*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4723*4bdc9457SAndroid Build Coastguard Worker .m(4)
4724*4bdc9457SAndroid Build Coastguard Worker .n(n)
4725*4bdc9457SAndroid Build Coastguard Worker .k(k)
4726*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
4727*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4728*4bdc9457SAndroid Build Coastguard Worker }
4729*4bdc9457SAndroid Build Coastguard Worker }
4730*4bdc9457SAndroid Build Coastguard Worker }
4731*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,n_div_2_subtile)4732*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, n_div_2_subtile) {
4733*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 4; n <= 6; n += 2) {
4734*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
4735*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
4736*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4737*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4738*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4739*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4740*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4741*4bdc9457SAndroid Build Coastguard Worker .m(m)
4742*4bdc9457SAndroid Build Coastguard Worker .n(n)
4743*4bdc9457SAndroid Build Coastguard Worker .k(k)
4744*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4745*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4746*4bdc9457SAndroid Build Coastguard Worker }
4747*4bdc9457SAndroid Build Coastguard Worker }
4748*4bdc9457SAndroid Build Coastguard Worker }
4749*4bdc9457SAndroid Build Coastguard Worker }
4750*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,strided_cm_subtile)4751*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, strided_cm_subtile) {
4752*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
4753*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 2; n++) {
4754*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
4755*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4756*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4757*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4758*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4759*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4760*4bdc9457SAndroid Build Coastguard Worker .m(m)
4761*4bdc9457SAndroid Build Coastguard Worker .n(n)
4762*4bdc9457SAndroid Build Coastguard Worker .k(k)
4763*4bdc9457SAndroid Build Coastguard Worker .cm_stride(5)
4764*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4765*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4766*4bdc9457SAndroid Build Coastguard Worker }
4767*4bdc9457SAndroid Build Coastguard Worker }
4768*4bdc9457SAndroid Build Coastguard Worker }
4769*4bdc9457SAndroid Build Coastguard Worker }
4770*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA,strided_cm)4771*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2C4__WASMRELAXEDSIMD_FMA, strided_cm) {
4772*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4773*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4774*4bdc9457SAndroid Build Coastguard Worker .nr(2)
4775*4bdc9457SAndroid Build Coastguard Worker .kr(4)
4776*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4777*4bdc9457SAndroid Build Coastguard Worker .m(4)
4778*4bdc9457SAndroid Build Coastguard Worker .n(2)
4779*4bdc9457SAndroid Build Coastguard Worker .k(4)
4780*4bdc9457SAndroid Build Coastguard Worker .cm_stride(5)
4781*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2c4__wasmrelaxedsimd_fma);
4782*4bdc9457SAndroid Build Coastguard Worker }
4783*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
4784*4bdc9457SAndroid Build Coastguard Worker
4785*4bdc9457SAndroid Build Coastguard Worker
4786*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1)4787*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1) {
4788*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4789*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4790*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4791*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4792*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4793*4bdc9457SAndroid Build Coastguard Worker .m(4)
4794*4bdc9457SAndroid Build Coastguard Worker .n(8)
4795*4bdc9457SAndroid Build Coastguard Worker .k(1)
4796*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
4797*4bdc9457SAndroid Build Coastguard Worker }
4798*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,strided_cn)4799*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cn) {
4800*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4801*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4802*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4803*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4804*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4805*4bdc9457SAndroid Build Coastguard Worker .m(4)
4806*4bdc9457SAndroid Build Coastguard Worker .n(8)
4807*4bdc9457SAndroid Build Coastguard Worker .k(1)
4808*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
4809*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
4810*4bdc9457SAndroid Build Coastguard Worker }
4811*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_strided_a)4812*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_strided_a) {
4813*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4814*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4815*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4816*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4817*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4818*4bdc9457SAndroid Build Coastguard Worker .m(4)
4819*4bdc9457SAndroid Build Coastguard Worker .n(8)
4820*4bdc9457SAndroid Build Coastguard Worker .k(1)
4821*4bdc9457SAndroid Build Coastguard Worker .a_stride(3)
4822*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
4823*4bdc9457SAndroid Build Coastguard Worker }
4824*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_subtile)4825*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile) {
4826*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
4827*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
4828*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4829*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4830*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4831*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4832*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4833*4bdc9457SAndroid Build Coastguard Worker .m(m)
4834*4bdc9457SAndroid Build Coastguard Worker .n(n)
4835*4bdc9457SAndroid Build Coastguard Worker .k(1)
4836*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4837*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
4838*4bdc9457SAndroid Build Coastguard Worker }
4839*4bdc9457SAndroid Build Coastguard Worker }
4840*4bdc9457SAndroid Build Coastguard Worker }
4841*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_subtile_m)4842*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_m) {
4843*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
4844*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4845*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4846*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4847*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4848*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4849*4bdc9457SAndroid Build Coastguard Worker .m(m)
4850*4bdc9457SAndroid Build Coastguard Worker .n(8)
4851*4bdc9457SAndroid Build Coastguard Worker .k(1)
4852*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4853*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
4854*4bdc9457SAndroid Build Coastguard Worker }
4855*4bdc9457SAndroid Build Coastguard Worker }
4856*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_subtile_n)4857*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_n) {
4858*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
4859*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4860*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4861*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4862*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4863*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4864*4bdc9457SAndroid Build Coastguard Worker .m(4)
4865*4bdc9457SAndroid Build Coastguard Worker .n(n)
4866*4bdc9457SAndroid Build Coastguard Worker .k(1)
4867*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4868*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
4869*4bdc9457SAndroid Build Coastguard Worker }
4870*4bdc9457SAndroid Build Coastguard Worker }
4871*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_gt_1)4872*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1) {
4873*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
4874*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4875*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4876*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4877*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4878*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4879*4bdc9457SAndroid Build Coastguard Worker .m(4)
4880*4bdc9457SAndroid Build Coastguard Worker .n(8)
4881*4bdc9457SAndroid Build Coastguard Worker .k(k)
4882*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
4883*4bdc9457SAndroid Build Coastguard Worker }
4884*4bdc9457SAndroid Build Coastguard Worker }
4885*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_gt_1_strided_a)4886*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_strided_a) {
4887*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
4888*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4889*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4890*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4891*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4892*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4893*4bdc9457SAndroid Build Coastguard Worker .m(4)
4894*4bdc9457SAndroid Build Coastguard Worker .n(8)
4895*4bdc9457SAndroid Build Coastguard Worker .k(k)
4896*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
4897*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
4898*4bdc9457SAndroid Build Coastguard Worker }
4899*4bdc9457SAndroid Build Coastguard Worker }
4900*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_gt_1_subtile)4901*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_subtile) {
4902*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
4903*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
4904*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
4905*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4906*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4907*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4908*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4909*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4910*4bdc9457SAndroid Build Coastguard Worker .m(m)
4911*4bdc9457SAndroid Build Coastguard Worker .n(n)
4912*4bdc9457SAndroid Build Coastguard Worker .k(k)
4913*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4914*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
4915*4bdc9457SAndroid Build Coastguard Worker }
4916*4bdc9457SAndroid Build Coastguard Worker }
4917*4bdc9457SAndroid Build Coastguard Worker }
4918*4bdc9457SAndroid Build Coastguard Worker }
4919*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8)4920*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8) {
4921*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
4922*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
4923*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4924*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4925*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4926*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4927*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4928*4bdc9457SAndroid Build Coastguard Worker .m(4)
4929*4bdc9457SAndroid Build Coastguard Worker .n(n)
4930*4bdc9457SAndroid Build Coastguard Worker .k(k)
4931*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
4932*4bdc9457SAndroid Build Coastguard Worker }
4933*4bdc9457SAndroid Build Coastguard Worker }
4934*4bdc9457SAndroid Build Coastguard Worker }
4935*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8_strided_cn)4936*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_cn) {
4937*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
4938*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
4939*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4940*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4941*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4942*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4943*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4944*4bdc9457SAndroid Build Coastguard Worker .m(4)
4945*4bdc9457SAndroid Build Coastguard Worker .n(n)
4946*4bdc9457SAndroid Build Coastguard Worker .k(k)
4947*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
4948*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
4949*4bdc9457SAndroid Build Coastguard Worker }
4950*4bdc9457SAndroid Build Coastguard Worker }
4951*4bdc9457SAndroid Build Coastguard Worker }
4952*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8_strided_a)4953*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_a) {
4954*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
4955*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
4956*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4957*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4958*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4959*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4960*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4961*4bdc9457SAndroid Build Coastguard Worker .m(4)
4962*4bdc9457SAndroid Build Coastguard Worker .n(n)
4963*4bdc9457SAndroid Build Coastguard Worker .k(k)
4964*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
4965*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
4966*4bdc9457SAndroid Build Coastguard Worker }
4967*4bdc9457SAndroid Build Coastguard Worker }
4968*4bdc9457SAndroid Build Coastguard Worker }
4969*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8_subtile)4970*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_subtile) {
4971*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
4972*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
4973*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
4974*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4975*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4976*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4977*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4978*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4979*4bdc9457SAndroid Build Coastguard Worker .m(m)
4980*4bdc9457SAndroid Build Coastguard Worker .n(n)
4981*4bdc9457SAndroid Build Coastguard Worker .k(k)
4982*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
4983*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
4984*4bdc9457SAndroid Build Coastguard Worker }
4985*4bdc9457SAndroid Build Coastguard Worker }
4986*4bdc9457SAndroid Build Coastguard Worker }
4987*4bdc9457SAndroid Build Coastguard Worker }
4988*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8)4989*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8) {
4990*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
4991*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
4992*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
4993*4bdc9457SAndroid Build Coastguard Worker .mr(4)
4994*4bdc9457SAndroid Build Coastguard Worker .nr(8)
4995*4bdc9457SAndroid Build Coastguard Worker .kr(1)
4996*4bdc9457SAndroid Build Coastguard Worker .sr(1)
4997*4bdc9457SAndroid Build Coastguard Worker .m(4)
4998*4bdc9457SAndroid Build Coastguard Worker .n(n)
4999*4bdc9457SAndroid Build Coastguard Worker .k(k)
5000*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
5001*4bdc9457SAndroid Build Coastguard Worker }
5002*4bdc9457SAndroid Build Coastguard Worker }
5003*4bdc9457SAndroid Build Coastguard Worker }
5004*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8_strided_cn)5005*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_cn) {
5006*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
5007*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5008*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5009*4bdc9457SAndroid Build Coastguard Worker .mr(4)
5010*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5011*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5012*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5013*4bdc9457SAndroid Build Coastguard Worker .m(4)
5014*4bdc9457SAndroid Build Coastguard Worker .n(n)
5015*4bdc9457SAndroid Build Coastguard Worker .k(k)
5016*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
5017*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
5018*4bdc9457SAndroid Build Coastguard Worker }
5019*4bdc9457SAndroid Build Coastguard Worker }
5020*4bdc9457SAndroid Build Coastguard Worker }
5021*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8_strided_a)5022*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_a) {
5023*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
5024*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5025*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5026*4bdc9457SAndroid Build Coastguard Worker .mr(4)
5027*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5028*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5029*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5030*4bdc9457SAndroid Build Coastguard Worker .m(4)
5031*4bdc9457SAndroid Build Coastguard Worker .n(n)
5032*4bdc9457SAndroid Build Coastguard Worker .k(k)
5033*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
5034*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
5035*4bdc9457SAndroid Build Coastguard Worker }
5036*4bdc9457SAndroid Build Coastguard Worker }
5037*4bdc9457SAndroid Build Coastguard Worker }
5038*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8_subtile)5039*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_subtile) {
5040*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
5041*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5042*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
5043*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5044*4bdc9457SAndroid Build Coastguard Worker .mr(4)
5045*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5046*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5047*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5048*4bdc9457SAndroid Build Coastguard Worker .m(m)
5049*4bdc9457SAndroid Build Coastguard Worker .n(n)
5050*4bdc9457SAndroid Build Coastguard Worker .k(k)
5051*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5052*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
5053*4bdc9457SAndroid Build Coastguard Worker }
5054*4bdc9457SAndroid Build Coastguard Worker }
5055*4bdc9457SAndroid Build Coastguard Worker }
5056*4bdc9457SAndroid Build Coastguard Worker }
5057*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,strided_cm_subtile)5058*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm_subtile) {
5059*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5060*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
5061*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
5062*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5063*4bdc9457SAndroid Build Coastguard Worker .mr(4)
5064*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5065*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5066*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5067*4bdc9457SAndroid Build Coastguard Worker .m(m)
5068*4bdc9457SAndroid Build Coastguard Worker .n(n)
5069*4bdc9457SAndroid Build Coastguard Worker .k(k)
5070*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
5071*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5072*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
5073*4bdc9457SAndroid Build Coastguard Worker }
5074*4bdc9457SAndroid Build Coastguard Worker }
5075*4bdc9457SAndroid Build Coastguard Worker }
5076*4bdc9457SAndroid Build Coastguard Worker }
5077*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,strided_cm)5078*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm) {
5079*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5080*4bdc9457SAndroid Build Coastguard Worker .mr(4)
5081*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5082*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5083*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5084*4bdc9457SAndroid Build Coastguard Worker .m(4)
5085*4bdc9457SAndroid Build Coastguard Worker .n(8)
5086*4bdc9457SAndroid Build Coastguard Worker .k(1)
5087*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
5088*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
5089*4bdc9457SAndroid Build Coastguard Worker }
5090*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
5091*4bdc9457SAndroid Build Coastguard Worker
5092*4bdc9457SAndroid Build Coastguard Worker
5093*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1)5094*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1) {
5095*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5096*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5097*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5098*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5099*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5100*4bdc9457SAndroid Build Coastguard Worker .m(5)
5101*4bdc9457SAndroid Build Coastguard Worker .n(8)
5102*4bdc9457SAndroid Build Coastguard Worker .k(1)
5103*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5104*4bdc9457SAndroid Build Coastguard Worker }
5105*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,strided_cn)5106*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cn) {
5107*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5108*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5109*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5110*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5111*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5112*4bdc9457SAndroid Build Coastguard Worker .m(5)
5113*4bdc9457SAndroid Build Coastguard Worker .n(8)
5114*4bdc9457SAndroid Build Coastguard Worker .k(1)
5115*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
5116*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5117*4bdc9457SAndroid Build Coastguard Worker }
5118*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_strided_a)5119*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_strided_a) {
5120*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5121*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5122*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5123*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5124*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5125*4bdc9457SAndroid Build Coastguard Worker .m(5)
5126*4bdc9457SAndroid Build Coastguard Worker .n(8)
5127*4bdc9457SAndroid Build Coastguard Worker .k(1)
5128*4bdc9457SAndroid Build Coastguard Worker .a_stride(3)
5129*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5130*4bdc9457SAndroid Build Coastguard Worker }
5131*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_subtile)5132*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile) {
5133*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
5134*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
5135*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5136*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5137*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5138*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5139*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5140*4bdc9457SAndroid Build Coastguard Worker .m(m)
5141*4bdc9457SAndroid Build Coastguard Worker .n(n)
5142*4bdc9457SAndroid Build Coastguard Worker .k(1)
5143*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5144*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5145*4bdc9457SAndroid Build Coastguard Worker }
5146*4bdc9457SAndroid Build Coastguard Worker }
5147*4bdc9457SAndroid Build Coastguard Worker }
5148*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_subtile_m)5149*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_m) {
5150*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
5151*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5152*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5153*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5154*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5155*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5156*4bdc9457SAndroid Build Coastguard Worker .m(m)
5157*4bdc9457SAndroid Build Coastguard Worker .n(8)
5158*4bdc9457SAndroid Build Coastguard Worker .k(1)
5159*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5160*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5161*4bdc9457SAndroid Build Coastguard Worker }
5162*4bdc9457SAndroid Build Coastguard Worker }
5163*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_subtile_n)5164*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_n) {
5165*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
5166*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5167*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5168*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5169*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5170*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5171*4bdc9457SAndroid Build Coastguard Worker .m(5)
5172*4bdc9457SAndroid Build Coastguard Worker .n(n)
5173*4bdc9457SAndroid Build Coastguard Worker .k(1)
5174*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5175*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5176*4bdc9457SAndroid Build Coastguard Worker }
5177*4bdc9457SAndroid Build Coastguard Worker }
5178*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_gt_1)5179*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1) {
5180*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
5181*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5182*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5183*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5184*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5185*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5186*4bdc9457SAndroid Build Coastguard Worker .m(5)
5187*4bdc9457SAndroid Build Coastguard Worker .n(8)
5188*4bdc9457SAndroid Build Coastguard Worker .k(k)
5189*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5190*4bdc9457SAndroid Build Coastguard Worker }
5191*4bdc9457SAndroid Build Coastguard Worker }
5192*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_gt_1_strided_a)5193*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_strided_a) {
5194*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
5195*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5196*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5197*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5198*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5199*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5200*4bdc9457SAndroid Build Coastguard Worker .m(5)
5201*4bdc9457SAndroid Build Coastguard Worker .n(8)
5202*4bdc9457SAndroid Build Coastguard Worker .k(k)
5203*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
5204*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5205*4bdc9457SAndroid Build Coastguard Worker }
5206*4bdc9457SAndroid Build Coastguard Worker }
5207*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_gt_1_subtile)5208*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_subtile) {
5209*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
5210*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
5211*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
5212*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5213*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5214*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5215*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5216*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5217*4bdc9457SAndroid Build Coastguard Worker .m(m)
5218*4bdc9457SAndroid Build Coastguard Worker .n(n)
5219*4bdc9457SAndroid Build Coastguard Worker .k(k)
5220*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5221*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5222*4bdc9457SAndroid Build Coastguard Worker }
5223*4bdc9457SAndroid Build Coastguard Worker }
5224*4bdc9457SAndroid Build Coastguard Worker }
5225*4bdc9457SAndroid Build Coastguard Worker }
5226*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8)5227*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8) {
5228*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
5229*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5230*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5231*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5232*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5233*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5234*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5235*4bdc9457SAndroid Build Coastguard Worker .m(5)
5236*4bdc9457SAndroid Build Coastguard Worker .n(n)
5237*4bdc9457SAndroid Build Coastguard Worker .k(k)
5238*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5239*4bdc9457SAndroid Build Coastguard Worker }
5240*4bdc9457SAndroid Build Coastguard Worker }
5241*4bdc9457SAndroid Build Coastguard Worker }
5242*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8_strided_cn)5243*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_cn) {
5244*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
5245*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5246*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5247*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5248*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5249*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5250*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5251*4bdc9457SAndroid Build Coastguard Worker .m(5)
5252*4bdc9457SAndroid Build Coastguard Worker .n(n)
5253*4bdc9457SAndroid Build Coastguard Worker .k(k)
5254*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
5255*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5256*4bdc9457SAndroid Build Coastguard Worker }
5257*4bdc9457SAndroid Build Coastguard Worker }
5258*4bdc9457SAndroid Build Coastguard Worker }
5259*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8_strided_a)5260*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_a) {
5261*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
5262*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5263*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5264*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5265*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5266*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5267*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5268*4bdc9457SAndroid Build Coastguard Worker .m(5)
5269*4bdc9457SAndroid Build Coastguard Worker .n(n)
5270*4bdc9457SAndroid Build Coastguard Worker .k(k)
5271*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
5272*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5273*4bdc9457SAndroid Build Coastguard Worker }
5274*4bdc9457SAndroid Build Coastguard Worker }
5275*4bdc9457SAndroid Build Coastguard Worker }
5276*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8_subtile)5277*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_subtile) {
5278*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
5279*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5280*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
5281*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5282*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5283*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5284*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5285*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5286*4bdc9457SAndroid Build Coastguard Worker .m(m)
5287*4bdc9457SAndroid Build Coastguard Worker .n(n)
5288*4bdc9457SAndroid Build Coastguard Worker .k(k)
5289*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5290*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5291*4bdc9457SAndroid Build Coastguard Worker }
5292*4bdc9457SAndroid Build Coastguard Worker }
5293*4bdc9457SAndroid Build Coastguard Worker }
5294*4bdc9457SAndroid Build Coastguard Worker }
5295*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8)5296*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8) {
5297*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
5298*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5299*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5300*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5301*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5302*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5303*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5304*4bdc9457SAndroid Build Coastguard Worker .m(5)
5305*4bdc9457SAndroid Build Coastguard Worker .n(n)
5306*4bdc9457SAndroid Build Coastguard Worker .k(k)
5307*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5308*4bdc9457SAndroid Build Coastguard Worker }
5309*4bdc9457SAndroid Build Coastguard Worker }
5310*4bdc9457SAndroid Build Coastguard Worker }
5311*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8_strided_cn)5312*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_cn) {
5313*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
5314*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5315*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5316*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5317*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5318*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5319*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5320*4bdc9457SAndroid Build Coastguard Worker .m(5)
5321*4bdc9457SAndroid Build Coastguard Worker .n(n)
5322*4bdc9457SAndroid Build Coastguard Worker .k(k)
5323*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
5324*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5325*4bdc9457SAndroid Build Coastguard Worker }
5326*4bdc9457SAndroid Build Coastguard Worker }
5327*4bdc9457SAndroid Build Coastguard Worker }
5328*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8_strided_a)5329*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_a) {
5330*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
5331*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5332*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5333*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5334*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5335*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5336*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5337*4bdc9457SAndroid Build Coastguard Worker .m(5)
5338*4bdc9457SAndroid Build Coastguard Worker .n(n)
5339*4bdc9457SAndroid Build Coastguard Worker .k(k)
5340*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
5341*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5342*4bdc9457SAndroid Build Coastguard Worker }
5343*4bdc9457SAndroid Build Coastguard Worker }
5344*4bdc9457SAndroid Build Coastguard Worker }
5345*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8_subtile)5346*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_subtile) {
5347*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
5348*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5349*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
5350*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5351*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5352*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5353*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5354*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5355*4bdc9457SAndroid Build Coastguard Worker .m(m)
5356*4bdc9457SAndroid Build Coastguard Worker .n(n)
5357*4bdc9457SAndroid Build Coastguard Worker .k(k)
5358*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5359*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5360*4bdc9457SAndroid Build Coastguard Worker }
5361*4bdc9457SAndroid Build Coastguard Worker }
5362*4bdc9457SAndroid Build Coastguard Worker }
5363*4bdc9457SAndroid Build Coastguard Worker }
5364*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,strided_cm_subtile)5365*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm_subtile) {
5366*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5367*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
5368*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
5369*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5370*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5371*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5372*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5373*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5374*4bdc9457SAndroid Build Coastguard Worker .m(m)
5375*4bdc9457SAndroid Build Coastguard Worker .n(n)
5376*4bdc9457SAndroid Build Coastguard Worker .k(k)
5377*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
5378*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5379*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5380*4bdc9457SAndroid Build Coastguard Worker }
5381*4bdc9457SAndroid Build Coastguard Worker }
5382*4bdc9457SAndroid Build Coastguard Worker }
5383*4bdc9457SAndroid Build Coastguard Worker }
5384*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,strided_cm)5385*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm) {
5386*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5387*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5388*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5389*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5390*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5391*4bdc9457SAndroid Build Coastguard Worker .m(5)
5392*4bdc9457SAndroid Build Coastguard Worker .n(8)
5393*4bdc9457SAndroid Build Coastguard Worker .k(1)
5394*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
5395*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
5396*4bdc9457SAndroid Build Coastguard Worker }
5397*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
5398*4bdc9457SAndroid Build Coastguard Worker
5399*4bdc9457SAndroid Build Coastguard Worker
5400*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_eq_4)5401*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_eq_4) {
5402*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5403*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5404*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5405*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5406*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5407*4bdc9457SAndroid Build Coastguard Worker .m(5)
5408*4bdc9457SAndroid Build Coastguard Worker .n(8)
5409*4bdc9457SAndroid Build Coastguard Worker .k(4)
5410*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5411*4bdc9457SAndroid Build Coastguard Worker }
5412*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,strided_cn)5413*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, strided_cn) {
5414*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5415*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5416*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5417*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5418*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5419*4bdc9457SAndroid Build Coastguard Worker .m(5)
5420*4bdc9457SAndroid Build Coastguard Worker .n(8)
5421*4bdc9457SAndroid Build Coastguard Worker .k(4)
5422*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
5423*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5424*4bdc9457SAndroid Build Coastguard Worker }
5425*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_strided_a)5426*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_strided_a) {
5427*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5428*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5429*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5430*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5431*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5432*4bdc9457SAndroid Build Coastguard Worker .m(5)
5433*4bdc9457SAndroid Build Coastguard Worker .n(8)
5434*4bdc9457SAndroid Build Coastguard Worker .k(4)
5435*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
5436*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5437*4bdc9457SAndroid Build Coastguard Worker }
5438*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile)5439*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile) {
5440*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
5441*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
5442*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5443*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5444*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5445*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5446*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5447*4bdc9457SAndroid Build Coastguard Worker .m(m)
5448*4bdc9457SAndroid Build Coastguard Worker .n(n)
5449*4bdc9457SAndroid Build Coastguard Worker .k(4)
5450*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5451*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5452*4bdc9457SAndroid Build Coastguard Worker }
5453*4bdc9457SAndroid Build Coastguard Worker }
5454*4bdc9457SAndroid Build Coastguard Worker }
5455*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile_m)5456*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_m) {
5457*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
5458*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5459*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5460*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5461*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5462*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5463*4bdc9457SAndroid Build Coastguard Worker .m(m)
5464*4bdc9457SAndroid Build Coastguard Worker .n(8)
5465*4bdc9457SAndroid Build Coastguard Worker .k(4)
5466*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5467*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5468*4bdc9457SAndroid Build Coastguard Worker }
5469*4bdc9457SAndroid Build Coastguard Worker }
5470*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile_n)5471*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_n) {
5472*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
5473*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5474*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5475*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5476*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5477*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5478*4bdc9457SAndroid Build Coastguard Worker .m(5)
5479*4bdc9457SAndroid Build Coastguard Worker .n(n)
5480*4bdc9457SAndroid Build Coastguard Worker .k(4)
5481*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5482*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5483*4bdc9457SAndroid Build Coastguard Worker }
5484*4bdc9457SAndroid Build Coastguard Worker }
5485*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_lt_4)5486*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_lt_4) {
5487*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
5488*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5489*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5490*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5491*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5492*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5493*4bdc9457SAndroid Build Coastguard Worker .m(5)
5494*4bdc9457SAndroid Build Coastguard Worker .n(8)
5495*4bdc9457SAndroid Build Coastguard Worker .k(k)
5496*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5497*4bdc9457SAndroid Build Coastguard Worker }
5498*4bdc9457SAndroid Build Coastguard Worker }
5499*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_lt_4_strided_a)5500*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_strided_a) {
5501*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
5502*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5503*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5504*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5505*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5506*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5507*4bdc9457SAndroid Build Coastguard Worker .m(5)
5508*4bdc9457SAndroid Build Coastguard Worker .n(8)
5509*4bdc9457SAndroid Build Coastguard Worker .k(k)
5510*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
5511*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5512*4bdc9457SAndroid Build Coastguard Worker }
5513*4bdc9457SAndroid Build Coastguard Worker }
5514*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_lt_4_subtile)5515*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_subtile) {
5516*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
5517*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
5518*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
5519*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5520*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5521*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5522*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5523*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5524*4bdc9457SAndroid Build Coastguard Worker .m(m)
5525*4bdc9457SAndroid Build Coastguard Worker .n(n)
5526*4bdc9457SAndroid Build Coastguard Worker .k(k)
5527*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5528*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5529*4bdc9457SAndroid Build Coastguard Worker }
5530*4bdc9457SAndroid Build Coastguard Worker }
5531*4bdc9457SAndroid Build Coastguard Worker }
5532*4bdc9457SAndroid Build Coastguard Worker }
5533*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_gt_4)5534*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_gt_4) {
5535*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
5536*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5537*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5538*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5539*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5540*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5541*4bdc9457SAndroid Build Coastguard Worker .m(5)
5542*4bdc9457SAndroid Build Coastguard Worker .n(8)
5543*4bdc9457SAndroid Build Coastguard Worker .k(k)
5544*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5545*4bdc9457SAndroid Build Coastguard Worker }
5546*4bdc9457SAndroid Build Coastguard Worker }
5547*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_gt_4_strided_a)5548*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_strided_a) {
5549*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
5550*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5551*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5552*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5553*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5554*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5555*4bdc9457SAndroid Build Coastguard Worker .m(5)
5556*4bdc9457SAndroid Build Coastguard Worker .n(8)
5557*4bdc9457SAndroid Build Coastguard Worker .k(k)
5558*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
5559*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5560*4bdc9457SAndroid Build Coastguard Worker }
5561*4bdc9457SAndroid Build Coastguard Worker }
5562*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_gt_4_subtile)5563*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_subtile) {
5564*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
5565*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
5566*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
5567*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5568*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5569*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5570*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5571*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5572*4bdc9457SAndroid Build Coastguard Worker .m(m)
5573*4bdc9457SAndroid Build Coastguard Worker .n(n)
5574*4bdc9457SAndroid Build Coastguard Worker .k(k)
5575*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5576*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5577*4bdc9457SAndroid Build Coastguard Worker }
5578*4bdc9457SAndroid Build Coastguard Worker }
5579*4bdc9457SAndroid Build Coastguard Worker }
5580*4bdc9457SAndroid Build Coastguard Worker }
5581*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_div_4)5582*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_div_4) {
5583*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
5584*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5585*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5586*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5587*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5588*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5589*4bdc9457SAndroid Build Coastguard Worker .m(5)
5590*4bdc9457SAndroid Build Coastguard Worker .n(8)
5591*4bdc9457SAndroid Build Coastguard Worker .k(k)
5592*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5593*4bdc9457SAndroid Build Coastguard Worker }
5594*4bdc9457SAndroid Build Coastguard Worker }
5595*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_div_4_strided_a)5596*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_div_4_strided_a) {
5597*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
5598*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5599*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5600*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5601*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5602*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5603*4bdc9457SAndroid Build Coastguard Worker .m(5)
5604*4bdc9457SAndroid Build Coastguard Worker .n(8)
5605*4bdc9457SAndroid Build Coastguard Worker .k(k)
5606*4bdc9457SAndroid Build Coastguard Worker .a_stride(43)
5607*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5608*4bdc9457SAndroid Build Coastguard Worker }
5609*4bdc9457SAndroid Build Coastguard Worker }
5610*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,k_div_4_subtile)5611*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, k_div_4_subtile) {
5612*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
5613*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
5614*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
5615*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5616*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5617*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5618*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5619*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5620*4bdc9457SAndroid Build Coastguard Worker .m(m)
5621*4bdc9457SAndroid Build Coastguard Worker .n(n)
5622*4bdc9457SAndroid Build Coastguard Worker .k(k)
5623*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5624*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5625*4bdc9457SAndroid Build Coastguard Worker }
5626*4bdc9457SAndroid Build Coastguard Worker }
5627*4bdc9457SAndroid Build Coastguard Worker }
5628*4bdc9457SAndroid Build Coastguard Worker }
5629*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,n_gt_8)5630*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, n_gt_8) {
5631*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
5632*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
5633*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5634*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5635*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5636*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5637*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5638*4bdc9457SAndroid Build Coastguard Worker .m(5)
5639*4bdc9457SAndroid Build Coastguard Worker .n(n)
5640*4bdc9457SAndroid Build Coastguard Worker .k(k)
5641*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5642*4bdc9457SAndroid Build Coastguard Worker }
5643*4bdc9457SAndroid Build Coastguard Worker }
5644*4bdc9457SAndroid Build Coastguard Worker }
5645*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_strided_cn)5646*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_cn) {
5647*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
5648*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
5649*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5650*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5651*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5652*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5653*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5654*4bdc9457SAndroid Build Coastguard Worker .m(5)
5655*4bdc9457SAndroid Build Coastguard Worker .n(n)
5656*4bdc9457SAndroid Build Coastguard Worker .k(k)
5657*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
5658*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5659*4bdc9457SAndroid Build Coastguard Worker }
5660*4bdc9457SAndroid Build Coastguard Worker }
5661*4bdc9457SAndroid Build Coastguard Worker }
5662*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_strided_a)5663*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_a) {
5664*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
5665*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
5666*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5667*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5668*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5669*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5670*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5671*4bdc9457SAndroid Build Coastguard Worker .m(5)
5672*4bdc9457SAndroid Build Coastguard Worker .n(n)
5673*4bdc9457SAndroid Build Coastguard Worker .k(k)
5674*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
5675*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5676*4bdc9457SAndroid Build Coastguard Worker }
5677*4bdc9457SAndroid Build Coastguard Worker }
5678*4bdc9457SAndroid Build Coastguard Worker }
5679*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_subtile)5680*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_subtile) {
5681*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
5682*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
5683*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
5684*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5685*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5686*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5687*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5688*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5689*4bdc9457SAndroid Build Coastguard Worker .m(m)
5690*4bdc9457SAndroid Build Coastguard Worker .n(n)
5691*4bdc9457SAndroid Build Coastguard Worker .k(k)
5692*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5693*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5694*4bdc9457SAndroid Build Coastguard Worker }
5695*4bdc9457SAndroid Build Coastguard Worker }
5696*4bdc9457SAndroid Build Coastguard Worker }
5697*4bdc9457SAndroid Build Coastguard Worker }
5698*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,n_div_8)5699*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, n_div_8) {
5700*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
5701*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
5702*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5703*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5704*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5705*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5706*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5707*4bdc9457SAndroid Build Coastguard Worker .m(5)
5708*4bdc9457SAndroid Build Coastguard Worker .n(n)
5709*4bdc9457SAndroid Build Coastguard Worker .k(k)
5710*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5711*4bdc9457SAndroid Build Coastguard Worker }
5712*4bdc9457SAndroid Build Coastguard Worker }
5713*4bdc9457SAndroid Build Coastguard Worker }
5714*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,n_div_8_strided_cn)5715*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_cn) {
5716*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
5717*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
5718*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5719*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5720*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5721*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5722*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5723*4bdc9457SAndroid Build Coastguard Worker .m(5)
5724*4bdc9457SAndroid Build Coastguard Worker .n(n)
5725*4bdc9457SAndroid Build Coastguard Worker .k(k)
5726*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
5727*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5728*4bdc9457SAndroid Build Coastguard Worker }
5729*4bdc9457SAndroid Build Coastguard Worker }
5730*4bdc9457SAndroid Build Coastguard Worker }
5731*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,n_div_8_strided_a)5732*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_a) {
5733*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
5734*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
5735*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5736*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5737*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5738*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5739*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5740*4bdc9457SAndroid Build Coastguard Worker .m(5)
5741*4bdc9457SAndroid Build Coastguard Worker .n(n)
5742*4bdc9457SAndroid Build Coastguard Worker .k(k)
5743*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
5744*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5745*4bdc9457SAndroid Build Coastguard Worker }
5746*4bdc9457SAndroid Build Coastguard Worker }
5747*4bdc9457SAndroid Build Coastguard Worker }
5748*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,n_div_8_subtile)5749*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, n_div_8_subtile) {
5750*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
5751*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
5752*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
5753*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5754*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5755*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5756*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5757*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5758*4bdc9457SAndroid Build Coastguard Worker .m(m)
5759*4bdc9457SAndroid Build Coastguard Worker .n(n)
5760*4bdc9457SAndroid Build Coastguard Worker .k(k)
5761*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5762*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5763*4bdc9457SAndroid Build Coastguard Worker }
5764*4bdc9457SAndroid Build Coastguard Worker }
5765*4bdc9457SAndroid Build Coastguard Worker }
5766*4bdc9457SAndroid Build Coastguard Worker }
5767*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,strided_cm_subtile)5768*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, strided_cm_subtile) {
5769*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
5770*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
5771*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 5; m++) {
5772*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5773*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5774*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5775*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5776*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5777*4bdc9457SAndroid Build Coastguard Worker .m(m)
5778*4bdc9457SAndroid Build Coastguard Worker .n(n)
5779*4bdc9457SAndroid Build Coastguard Worker .k(k)
5780*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
5781*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5782*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5783*4bdc9457SAndroid Build Coastguard Worker }
5784*4bdc9457SAndroid Build Coastguard Worker }
5785*4bdc9457SAndroid Build Coastguard Worker }
5786*4bdc9457SAndroid Build Coastguard Worker }
5787*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA,strided_cm)5788*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_5X8S4__WASMRELAXEDSIMD_FMA, strided_cm) {
5789*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5790*4bdc9457SAndroid Build Coastguard Worker .mr(5)
5791*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5792*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5793*4bdc9457SAndroid Build Coastguard Worker .sr(4)
5794*4bdc9457SAndroid Build Coastguard Worker .m(5)
5795*4bdc9457SAndroid Build Coastguard Worker .n(8)
5796*4bdc9457SAndroid Build Coastguard Worker .k(4)
5797*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
5798*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_5x8s4__wasmrelaxedsimd_fma);
5799*4bdc9457SAndroid Build Coastguard Worker }
5800*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
5801*4bdc9457SAndroid Build Coastguard Worker
5802*4bdc9457SAndroid Build Coastguard Worker
5803*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1)5804*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1) {
5805*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5806*4bdc9457SAndroid Build Coastguard Worker .mr(6)
5807*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5808*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5809*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5810*4bdc9457SAndroid Build Coastguard Worker .m(6)
5811*4bdc9457SAndroid Build Coastguard Worker .n(8)
5812*4bdc9457SAndroid Build Coastguard Worker .k(1)
5813*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
5814*4bdc9457SAndroid Build Coastguard Worker }
5815*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,strided_cn)5816*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cn) {
5817*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5818*4bdc9457SAndroid Build Coastguard Worker .mr(6)
5819*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5820*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5821*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5822*4bdc9457SAndroid Build Coastguard Worker .m(6)
5823*4bdc9457SAndroid Build Coastguard Worker .n(8)
5824*4bdc9457SAndroid Build Coastguard Worker .k(1)
5825*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
5826*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
5827*4bdc9457SAndroid Build Coastguard Worker }
5828*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_strided_a)5829*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_strided_a) {
5830*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5831*4bdc9457SAndroid Build Coastguard Worker .mr(6)
5832*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5833*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5834*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5835*4bdc9457SAndroid Build Coastguard Worker .m(6)
5836*4bdc9457SAndroid Build Coastguard Worker .n(8)
5837*4bdc9457SAndroid Build Coastguard Worker .k(1)
5838*4bdc9457SAndroid Build Coastguard Worker .a_stride(3)
5839*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
5840*4bdc9457SAndroid Build Coastguard Worker }
5841*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_subtile)5842*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile) {
5843*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
5844*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
5845*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5846*4bdc9457SAndroid Build Coastguard Worker .mr(6)
5847*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5848*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5849*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5850*4bdc9457SAndroid Build Coastguard Worker .m(m)
5851*4bdc9457SAndroid Build Coastguard Worker .n(n)
5852*4bdc9457SAndroid Build Coastguard Worker .k(1)
5853*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5854*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
5855*4bdc9457SAndroid Build Coastguard Worker }
5856*4bdc9457SAndroid Build Coastguard Worker }
5857*4bdc9457SAndroid Build Coastguard Worker }
5858*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_subtile_m)5859*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_m) {
5860*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
5861*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5862*4bdc9457SAndroid Build Coastguard Worker .mr(6)
5863*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5864*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5865*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5866*4bdc9457SAndroid Build Coastguard Worker .m(m)
5867*4bdc9457SAndroid Build Coastguard Worker .n(8)
5868*4bdc9457SAndroid Build Coastguard Worker .k(1)
5869*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5870*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
5871*4bdc9457SAndroid Build Coastguard Worker }
5872*4bdc9457SAndroid Build Coastguard Worker }
5873*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_eq_1_subtile_n)5874*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_n) {
5875*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
5876*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5877*4bdc9457SAndroid Build Coastguard Worker .mr(6)
5878*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5879*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5880*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5881*4bdc9457SAndroid Build Coastguard Worker .m(6)
5882*4bdc9457SAndroid Build Coastguard Worker .n(n)
5883*4bdc9457SAndroid Build Coastguard Worker .k(1)
5884*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5885*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
5886*4bdc9457SAndroid Build Coastguard Worker }
5887*4bdc9457SAndroid Build Coastguard Worker }
5888*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_gt_1)5889*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1) {
5890*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
5891*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5892*4bdc9457SAndroid Build Coastguard Worker .mr(6)
5893*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5894*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5895*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5896*4bdc9457SAndroid Build Coastguard Worker .m(6)
5897*4bdc9457SAndroid Build Coastguard Worker .n(8)
5898*4bdc9457SAndroid Build Coastguard Worker .k(k)
5899*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
5900*4bdc9457SAndroid Build Coastguard Worker }
5901*4bdc9457SAndroid Build Coastguard Worker }
5902*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_gt_1_strided_a)5903*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_strided_a) {
5904*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
5905*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5906*4bdc9457SAndroid Build Coastguard Worker .mr(6)
5907*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5908*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5909*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5910*4bdc9457SAndroid Build Coastguard Worker .m(6)
5911*4bdc9457SAndroid Build Coastguard Worker .n(8)
5912*4bdc9457SAndroid Build Coastguard Worker .k(k)
5913*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
5914*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
5915*4bdc9457SAndroid Build Coastguard Worker }
5916*4bdc9457SAndroid Build Coastguard Worker }
5917*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,k_gt_1_subtile)5918*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_subtile) {
5919*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
5920*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
5921*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
5922*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5923*4bdc9457SAndroid Build Coastguard Worker .mr(6)
5924*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5925*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5926*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5927*4bdc9457SAndroid Build Coastguard Worker .m(m)
5928*4bdc9457SAndroid Build Coastguard Worker .n(n)
5929*4bdc9457SAndroid Build Coastguard Worker .k(k)
5930*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
5931*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
5932*4bdc9457SAndroid Build Coastguard Worker }
5933*4bdc9457SAndroid Build Coastguard Worker }
5934*4bdc9457SAndroid Build Coastguard Worker }
5935*4bdc9457SAndroid Build Coastguard Worker }
5936*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8)5937*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8) {
5938*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
5939*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5940*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5941*4bdc9457SAndroid Build Coastguard Worker .mr(6)
5942*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5943*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5944*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5945*4bdc9457SAndroid Build Coastguard Worker .m(6)
5946*4bdc9457SAndroid Build Coastguard Worker .n(n)
5947*4bdc9457SAndroid Build Coastguard Worker .k(k)
5948*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
5949*4bdc9457SAndroid Build Coastguard Worker }
5950*4bdc9457SAndroid Build Coastguard Worker }
5951*4bdc9457SAndroid Build Coastguard Worker }
5952*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8_strided_cn)5953*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_cn) {
5954*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
5955*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5956*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5957*4bdc9457SAndroid Build Coastguard Worker .mr(6)
5958*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5959*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5960*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5961*4bdc9457SAndroid Build Coastguard Worker .m(6)
5962*4bdc9457SAndroid Build Coastguard Worker .n(n)
5963*4bdc9457SAndroid Build Coastguard Worker .k(k)
5964*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
5965*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
5966*4bdc9457SAndroid Build Coastguard Worker }
5967*4bdc9457SAndroid Build Coastguard Worker }
5968*4bdc9457SAndroid Build Coastguard Worker }
5969*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8_strided_a)5970*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_a) {
5971*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
5972*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5973*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5974*4bdc9457SAndroid Build Coastguard Worker .mr(6)
5975*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5976*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5977*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5978*4bdc9457SAndroid Build Coastguard Worker .m(6)
5979*4bdc9457SAndroid Build Coastguard Worker .n(n)
5980*4bdc9457SAndroid Build Coastguard Worker .k(k)
5981*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
5982*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
5983*4bdc9457SAndroid Build Coastguard Worker }
5984*4bdc9457SAndroid Build Coastguard Worker }
5985*4bdc9457SAndroid Build Coastguard Worker }
5986*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_gt_8_subtile)5987*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_subtile) {
5988*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
5989*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
5990*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
5991*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
5992*4bdc9457SAndroid Build Coastguard Worker .mr(6)
5993*4bdc9457SAndroid Build Coastguard Worker .nr(8)
5994*4bdc9457SAndroid Build Coastguard Worker .kr(1)
5995*4bdc9457SAndroid Build Coastguard Worker .sr(1)
5996*4bdc9457SAndroid Build Coastguard Worker .m(m)
5997*4bdc9457SAndroid Build Coastguard Worker .n(n)
5998*4bdc9457SAndroid Build Coastguard Worker .k(k)
5999*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6000*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
6001*4bdc9457SAndroid Build Coastguard Worker }
6002*4bdc9457SAndroid Build Coastguard Worker }
6003*4bdc9457SAndroid Build Coastguard Worker }
6004*4bdc9457SAndroid Build Coastguard Worker }
6005*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8)6006*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8) {
6007*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
6008*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6009*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6010*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6011*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6012*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6013*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6014*4bdc9457SAndroid Build Coastguard Worker .m(6)
6015*4bdc9457SAndroid Build Coastguard Worker .n(n)
6016*4bdc9457SAndroid Build Coastguard Worker .k(k)
6017*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
6018*4bdc9457SAndroid Build Coastguard Worker }
6019*4bdc9457SAndroid Build Coastguard Worker }
6020*4bdc9457SAndroid Build Coastguard Worker }
6021*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8_strided_cn)6022*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_cn) {
6023*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
6024*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6025*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6026*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6027*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6028*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6029*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6030*4bdc9457SAndroid Build Coastguard Worker .m(6)
6031*4bdc9457SAndroid Build Coastguard Worker .n(n)
6032*4bdc9457SAndroid Build Coastguard Worker .k(k)
6033*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
6034*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
6035*4bdc9457SAndroid Build Coastguard Worker }
6036*4bdc9457SAndroid Build Coastguard Worker }
6037*4bdc9457SAndroid Build Coastguard Worker }
6038*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8_strided_a)6039*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_a) {
6040*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
6041*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6042*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6043*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6044*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6045*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6046*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6047*4bdc9457SAndroid Build Coastguard Worker .m(6)
6048*4bdc9457SAndroid Build Coastguard Worker .n(n)
6049*4bdc9457SAndroid Build Coastguard Worker .k(k)
6050*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
6051*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
6052*4bdc9457SAndroid Build Coastguard Worker }
6053*4bdc9457SAndroid Build Coastguard Worker }
6054*4bdc9457SAndroid Build Coastguard Worker }
6055*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,n_div_8_subtile)6056*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_subtile) {
6057*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
6058*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6059*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
6060*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6061*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6062*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6063*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6064*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6065*4bdc9457SAndroid Build Coastguard Worker .m(m)
6066*4bdc9457SAndroid Build Coastguard Worker .n(n)
6067*4bdc9457SAndroid Build Coastguard Worker .k(k)
6068*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6069*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
6070*4bdc9457SAndroid Build Coastguard Worker }
6071*4bdc9457SAndroid Build Coastguard Worker }
6072*4bdc9457SAndroid Build Coastguard Worker }
6073*4bdc9457SAndroid Build Coastguard Worker }
6074*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,strided_cm_subtile)6075*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm_subtile) {
6076*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6077*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
6078*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
6079*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6080*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6081*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6082*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6083*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6084*4bdc9457SAndroid Build Coastguard Worker .m(m)
6085*4bdc9457SAndroid Build Coastguard Worker .n(n)
6086*4bdc9457SAndroid Build Coastguard Worker .k(k)
6087*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
6088*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6089*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
6090*4bdc9457SAndroid Build Coastguard Worker }
6091*4bdc9457SAndroid Build Coastguard Worker }
6092*4bdc9457SAndroid Build Coastguard Worker }
6093*4bdc9457SAndroid Build Coastguard Worker }
6094*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT,strided_cm)6095*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm) {
6096*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6097*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6098*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6099*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6100*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6101*4bdc9457SAndroid Build Coastguard Worker .m(6)
6102*4bdc9457SAndroid Build Coastguard Worker .n(8)
6103*4bdc9457SAndroid Build Coastguard Worker .k(1)
6104*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
6105*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
6106*4bdc9457SAndroid Build Coastguard Worker }
6107*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
6108*4bdc9457SAndroid Build Coastguard Worker
6109*4bdc9457SAndroid Build Coastguard Worker
6110*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_eq_4)6111*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_eq_4) {
6112*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6113*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6114*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6115*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6116*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6117*4bdc9457SAndroid Build Coastguard Worker .m(6)
6118*4bdc9457SAndroid Build Coastguard Worker .n(8)
6119*4bdc9457SAndroid Build Coastguard Worker .k(4)
6120*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6121*4bdc9457SAndroid Build Coastguard Worker }
6122*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,strided_cn)6123*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, strided_cn) {
6124*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6125*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6126*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6127*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6128*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6129*4bdc9457SAndroid Build Coastguard Worker .m(6)
6130*4bdc9457SAndroid Build Coastguard Worker .n(8)
6131*4bdc9457SAndroid Build Coastguard Worker .k(4)
6132*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
6133*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6134*4bdc9457SAndroid Build Coastguard Worker }
6135*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_strided_a)6136*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_strided_a) {
6137*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6138*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6139*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6140*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6141*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6142*4bdc9457SAndroid Build Coastguard Worker .m(6)
6143*4bdc9457SAndroid Build Coastguard Worker .n(8)
6144*4bdc9457SAndroid Build Coastguard Worker .k(4)
6145*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
6146*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6147*4bdc9457SAndroid Build Coastguard Worker }
6148*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile)6149*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile) {
6150*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
6151*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
6152*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6153*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6154*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6155*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6156*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6157*4bdc9457SAndroid Build Coastguard Worker .m(m)
6158*4bdc9457SAndroid Build Coastguard Worker .n(n)
6159*4bdc9457SAndroid Build Coastguard Worker .k(4)
6160*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6161*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6162*4bdc9457SAndroid Build Coastguard Worker }
6163*4bdc9457SAndroid Build Coastguard Worker }
6164*4bdc9457SAndroid Build Coastguard Worker }
6165*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile_m)6166*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_m) {
6167*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
6168*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6169*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6170*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6171*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6172*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6173*4bdc9457SAndroid Build Coastguard Worker .m(m)
6174*4bdc9457SAndroid Build Coastguard Worker .n(8)
6175*4bdc9457SAndroid Build Coastguard Worker .k(4)
6176*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6177*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6178*4bdc9457SAndroid Build Coastguard Worker }
6179*4bdc9457SAndroid Build Coastguard Worker }
6180*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_eq_4_subtile_n)6181*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_n) {
6182*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
6183*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6184*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6185*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6186*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6187*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6188*4bdc9457SAndroid Build Coastguard Worker .m(6)
6189*4bdc9457SAndroid Build Coastguard Worker .n(n)
6190*4bdc9457SAndroid Build Coastguard Worker .k(4)
6191*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6192*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6193*4bdc9457SAndroid Build Coastguard Worker }
6194*4bdc9457SAndroid Build Coastguard Worker }
6195*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_lt_4)6196*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_lt_4) {
6197*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
6198*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6199*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6200*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6201*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6202*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6203*4bdc9457SAndroid Build Coastguard Worker .m(6)
6204*4bdc9457SAndroid Build Coastguard Worker .n(8)
6205*4bdc9457SAndroid Build Coastguard Worker .k(k)
6206*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6207*4bdc9457SAndroid Build Coastguard Worker }
6208*4bdc9457SAndroid Build Coastguard Worker }
6209*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_lt_4_strided_a)6210*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_strided_a) {
6211*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
6212*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6213*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6214*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6215*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6216*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6217*4bdc9457SAndroid Build Coastguard Worker .m(6)
6218*4bdc9457SAndroid Build Coastguard Worker .n(8)
6219*4bdc9457SAndroid Build Coastguard Worker .k(k)
6220*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
6221*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6222*4bdc9457SAndroid Build Coastguard Worker }
6223*4bdc9457SAndroid Build Coastguard Worker }
6224*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_lt_4_subtile)6225*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_subtile) {
6226*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k < 4; k++) {
6227*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
6228*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
6229*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6230*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6231*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6232*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6233*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6234*4bdc9457SAndroid Build Coastguard Worker .m(m)
6235*4bdc9457SAndroid Build Coastguard Worker .n(n)
6236*4bdc9457SAndroid Build Coastguard Worker .k(k)
6237*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6238*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6239*4bdc9457SAndroid Build Coastguard Worker }
6240*4bdc9457SAndroid Build Coastguard Worker }
6241*4bdc9457SAndroid Build Coastguard Worker }
6242*4bdc9457SAndroid Build Coastguard Worker }
6243*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_gt_4)6244*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_gt_4) {
6245*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
6246*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6247*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6248*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6249*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6250*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6251*4bdc9457SAndroid Build Coastguard Worker .m(6)
6252*4bdc9457SAndroid Build Coastguard Worker .n(8)
6253*4bdc9457SAndroid Build Coastguard Worker .k(k)
6254*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6255*4bdc9457SAndroid Build Coastguard Worker }
6256*4bdc9457SAndroid Build Coastguard Worker }
6257*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_gt_4_strided_a)6258*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_strided_a) {
6259*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
6260*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6261*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6262*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6263*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6264*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6265*4bdc9457SAndroid Build Coastguard Worker .m(6)
6266*4bdc9457SAndroid Build Coastguard Worker .n(8)
6267*4bdc9457SAndroid Build Coastguard Worker .k(k)
6268*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
6269*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6270*4bdc9457SAndroid Build Coastguard Worker }
6271*4bdc9457SAndroid Build Coastguard Worker }
6272*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_gt_4_subtile)6273*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_subtile) {
6274*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 5; k < 8; k++) {
6275*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
6276*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
6277*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6278*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6279*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6280*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6281*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6282*4bdc9457SAndroid Build Coastguard Worker .m(m)
6283*4bdc9457SAndroid Build Coastguard Worker .n(n)
6284*4bdc9457SAndroid Build Coastguard Worker .k(k)
6285*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6286*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6287*4bdc9457SAndroid Build Coastguard Worker }
6288*4bdc9457SAndroid Build Coastguard Worker }
6289*4bdc9457SAndroid Build Coastguard Worker }
6290*4bdc9457SAndroid Build Coastguard Worker }
6291*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_div_4)6292*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_div_4) {
6293*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
6294*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6295*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6296*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6297*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6298*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6299*4bdc9457SAndroid Build Coastguard Worker .m(6)
6300*4bdc9457SAndroid Build Coastguard Worker .n(8)
6301*4bdc9457SAndroid Build Coastguard Worker .k(k)
6302*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6303*4bdc9457SAndroid Build Coastguard Worker }
6304*4bdc9457SAndroid Build Coastguard Worker }
6305*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_div_4_strided_a)6306*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_div_4_strided_a) {
6307*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
6308*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6309*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6310*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6311*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6312*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6313*4bdc9457SAndroid Build Coastguard Worker .m(6)
6314*4bdc9457SAndroid Build Coastguard Worker .n(8)
6315*4bdc9457SAndroid Build Coastguard Worker .k(k)
6316*4bdc9457SAndroid Build Coastguard Worker .a_stride(43)
6317*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6318*4bdc9457SAndroid Build Coastguard Worker }
6319*4bdc9457SAndroid Build Coastguard Worker }
6320*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,k_div_4_subtile)6321*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, k_div_4_subtile) {
6322*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 8; k <= 40; k += 4) {
6323*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
6324*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
6325*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6326*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6327*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6328*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6329*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6330*4bdc9457SAndroid Build Coastguard Worker .m(m)
6331*4bdc9457SAndroid Build Coastguard Worker .n(n)
6332*4bdc9457SAndroid Build Coastguard Worker .k(k)
6333*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6334*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6335*4bdc9457SAndroid Build Coastguard Worker }
6336*4bdc9457SAndroid Build Coastguard Worker }
6337*4bdc9457SAndroid Build Coastguard Worker }
6338*4bdc9457SAndroid Build Coastguard Worker }
6339*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,n_gt_8)6340*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, n_gt_8) {
6341*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
6342*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
6343*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6344*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6345*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6346*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6347*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6348*4bdc9457SAndroid Build Coastguard Worker .m(6)
6349*4bdc9457SAndroid Build Coastguard Worker .n(n)
6350*4bdc9457SAndroid Build Coastguard Worker .k(k)
6351*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6352*4bdc9457SAndroid Build Coastguard Worker }
6353*4bdc9457SAndroid Build Coastguard Worker }
6354*4bdc9457SAndroid Build Coastguard Worker }
6355*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_strided_cn)6356*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_cn) {
6357*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
6358*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
6359*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6360*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6361*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6362*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6363*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6364*4bdc9457SAndroid Build Coastguard Worker .m(6)
6365*4bdc9457SAndroid Build Coastguard Worker .n(n)
6366*4bdc9457SAndroid Build Coastguard Worker .k(k)
6367*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
6368*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6369*4bdc9457SAndroid Build Coastguard Worker }
6370*4bdc9457SAndroid Build Coastguard Worker }
6371*4bdc9457SAndroid Build Coastguard Worker }
6372*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_strided_a)6373*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_a) {
6374*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
6375*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
6376*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6377*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6378*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6379*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6380*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6381*4bdc9457SAndroid Build Coastguard Worker .m(6)
6382*4bdc9457SAndroid Build Coastguard Worker .n(n)
6383*4bdc9457SAndroid Build Coastguard Worker .k(k)
6384*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
6385*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6386*4bdc9457SAndroid Build Coastguard Worker }
6387*4bdc9457SAndroid Build Coastguard Worker }
6388*4bdc9457SAndroid Build Coastguard Worker }
6389*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,n_gt_8_subtile)6390*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_subtile) {
6391*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 9; n < 16; n++) {
6392*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
6393*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
6394*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6395*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6396*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6397*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6398*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6399*4bdc9457SAndroid Build Coastguard Worker .m(m)
6400*4bdc9457SAndroid Build Coastguard Worker .n(n)
6401*4bdc9457SAndroid Build Coastguard Worker .k(k)
6402*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6403*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6404*4bdc9457SAndroid Build Coastguard Worker }
6405*4bdc9457SAndroid Build Coastguard Worker }
6406*4bdc9457SAndroid Build Coastguard Worker }
6407*4bdc9457SAndroid Build Coastguard Worker }
6408*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,n_div_8)6409*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, n_div_8) {
6410*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
6411*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
6412*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6413*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6414*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6415*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6416*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6417*4bdc9457SAndroid Build Coastguard Worker .m(6)
6418*4bdc9457SAndroid Build Coastguard Worker .n(n)
6419*4bdc9457SAndroid Build Coastguard Worker .k(k)
6420*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6421*4bdc9457SAndroid Build Coastguard Worker }
6422*4bdc9457SAndroid Build Coastguard Worker }
6423*4bdc9457SAndroid Build Coastguard Worker }
6424*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,n_div_8_strided_cn)6425*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_cn) {
6426*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
6427*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
6428*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6429*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6430*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6431*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6432*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6433*4bdc9457SAndroid Build Coastguard Worker .m(6)
6434*4bdc9457SAndroid Build Coastguard Worker .n(n)
6435*4bdc9457SAndroid Build Coastguard Worker .k(k)
6436*4bdc9457SAndroid Build Coastguard Worker .cn_stride(11)
6437*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6438*4bdc9457SAndroid Build Coastguard Worker }
6439*4bdc9457SAndroid Build Coastguard Worker }
6440*4bdc9457SAndroid Build Coastguard Worker }
6441*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,n_div_8_strided_a)6442*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_a) {
6443*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
6444*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
6445*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6446*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6447*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6448*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6449*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6450*4bdc9457SAndroid Build Coastguard Worker .m(6)
6451*4bdc9457SAndroid Build Coastguard Worker .n(n)
6452*4bdc9457SAndroid Build Coastguard Worker .k(k)
6453*4bdc9457SAndroid Build Coastguard Worker .a_stride(23)
6454*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6455*4bdc9457SAndroid Build Coastguard Worker }
6456*4bdc9457SAndroid Build Coastguard Worker }
6457*4bdc9457SAndroid Build Coastguard Worker }
6458*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,n_div_8_subtile)6459*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, n_div_8_subtile) {
6460*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 16; n <= 24; n += 8) {
6461*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
6462*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
6463*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6464*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6465*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6466*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6467*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6468*4bdc9457SAndroid Build Coastguard Worker .m(m)
6469*4bdc9457SAndroid Build Coastguard Worker .n(n)
6470*4bdc9457SAndroid Build Coastguard Worker .k(k)
6471*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6472*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6473*4bdc9457SAndroid Build Coastguard Worker }
6474*4bdc9457SAndroid Build Coastguard Worker }
6475*4bdc9457SAndroid Build Coastguard Worker }
6476*4bdc9457SAndroid Build Coastguard Worker }
6477*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,strided_cm_subtile)6478*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, strided_cm_subtile) {
6479*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 20; k += 5) {
6480*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 8; n++) {
6481*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 6; m++) {
6482*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6483*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6484*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6485*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6486*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6487*4bdc9457SAndroid Build Coastguard Worker .m(m)
6488*4bdc9457SAndroid Build Coastguard Worker .n(n)
6489*4bdc9457SAndroid Build Coastguard Worker .k(k)
6490*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
6491*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6492*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6493*4bdc9457SAndroid Build Coastguard Worker }
6494*4bdc9457SAndroid Build Coastguard Worker }
6495*4bdc9457SAndroid Build Coastguard Worker }
6496*4bdc9457SAndroid Build Coastguard Worker }
6497*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA,strided_cm)6498*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_6X8S4__WASMRELAXEDSIMD_FMA, strided_cm) {
6499*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6500*4bdc9457SAndroid Build Coastguard Worker .mr(6)
6501*4bdc9457SAndroid Build Coastguard Worker .nr(8)
6502*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6503*4bdc9457SAndroid Build Coastguard Worker .sr(4)
6504*4bdc9457SAndroid Build Coastguard Worker .m(6)
6505*4bdc9457SAndroid Build Coastguard Worker .n(8)
6506*4bdc9457SAndroid Build Coastguard Worker .k(4)
6507*4bdc9457SAndroid Build Coastguard Worker .cm_stride(11)
6508*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmrelaxedsimd_fma);
6509*4bdc9457SAndroid Build Coastguard Worker }
6510*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
6511*4bdc9457SAndroid Build Coastguard Worker
6512*4bdc9457SAndroid Build Coastguard Worker
6513*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_2X4__WASM,k_eq_1)6514*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, k_eq_1) {
6515*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6516*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6517*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6518*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6519*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6520*4bdc9457SAndroid Build Coastguard Worker .m(2)
6521*4bdc9457SAndroid Build Coastguard Worker .n(4)
6522*4bdc9457SAndroid Build Coastguard Worker .k(1)
6523*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6524*4bdc9457SAndroid Build Coastguard Worker }
6525*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,strided_cn)6526*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, strided_cn) {
6527*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6528*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6529*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6530*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6531*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6532*4bdc9457SAndroid Build Coastguard Worker .m(2)
6533*4bdc9457SAndroid Build Coastguard Worker .n(4)
6534*4bdc9457SAndroid Build Coastguard Worker .k(1)
6535*4bdc9457SAndroid Build Coastguard Worker .cn_stride(7)
6536*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6537*4bdc9457SAndroid Build Coastguard Worker }
6538*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,k_eq_1_strided_a)6539*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, k_eq_1_strided_a) {
6540*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6541*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6542*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6543*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6544*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6545*4bdc9457SAndroid Build Coastguard Worker .m(2)
6546*4bdc9457SAndroid Build Coastguard Worker .n(4)
6547*4bdc9457SAndroid Build Coastguard Worker .k(1)
6548*4bdc9457SAndroid Build Coastguard Worker .a_stride(3)
6549*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6550*4bdc9457SAndroid Build Coastguard Worker }
6551*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,k_eq_1_subtile)6552*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, k_eq_1_subtile) {
6553*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 4; n++) {
6554*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 2; m++) {
6555*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6556*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6557*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6558*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6559*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6560*4bdc9457SAndroid Build Coastguard Worker .m(m)
6561*4bdc9457SAndroid Build Coastguard Worker .n(n)
6562*4bdc9457SAndroid Build Coastguard Worker .k(1)
6563*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6564*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6565*4bdc9457SAndroid Build Coastguard Worker }
6566*4bdc9457SAndroid Build Coastguard Worker }
6567*4bdc9457SAndroid Build Coastguard Worker }
6568*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,k_eq_1_subtile_m)6569*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, k_eq_1_subtile_m) {
6570*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 2; m++) {
6571*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6572*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6573*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6574*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6575*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6576*4bdc9457SAndroid Build Coastguard Worker .m(m)
6577*4bdc9457SAndroid Build Coastguard Worker .n(4)
6578*4bdc9457SAndroid Build Coastguard Worker .k(1)
6579*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6580*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6581*4bdc9457SAndroid Build Coastguard Worker }
6582*4bdc9457SAndroid Build Coastguard Worker }
6583*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,k_eq_1_subtile_n)6584*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, k_eq_1_subtile_n) {
6585*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 4; n++) {
6586*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6587*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6588*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6589*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6590*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6591*4bdc9457SAndroid Build Coastguard Worker .m(2)
6592*4bdc9457SAndroid Build Coastguard Worker .n(n)
6593*4bdc9457SAndroid Build Coastguard Worker .k(1)
6594*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6595*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6596*4bdc9457SAndroid Build Coastguard Worker }
6597*4bdc9457SAndroid Build Coastguard Worker }
6598*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,k_gt_1)6599*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, k_gt_1) {
6600*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
6601*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6602*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6603*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6604*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6605*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6606*4bdc9457SAndroid Build Coastguard Worker .m(2)
6607*4bdc9457SAndroid Build Coastguard Worker .n(4)
6608*4bdc9457SAndroid Build Coastguard Worker .k(k)
6609*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6610*4bdc9457SAndroid Build Coastguard Worker }
6611*4bdc9457SAndroid Build Coastguard Worker }
6612*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,k_gt_1_strided_a)6613*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, k_gt_1_strided_a) {
6614*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
6615*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6616*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6617*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6618*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6619*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6620*4bdc9457SAndroid Build Coastguard Worker .m(2)
6621*4bdc9457SAndroid Build Coastguard Worker .n(4)
6622*4bdc9457SAndroid Build Coastguard Worker .k(k)
6623*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
6624*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6625*4bdc9457SAndroid Build Coastguard Worker }
6626*4bdc9457SAndroid Build Coastguard Worker }
6627*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,k_gt_1_subtile)6628*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, k_gt_1_subtile) {
6629*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
6630*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 4; n++) {
6631*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 2; m++) {
6632*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6633*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6634*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6635*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6636*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6637*4bdc9457SAndroid Build Coastguard Worker .m(m)
6638*4bdc9457SAndroid Build Coastguard Worker .n(n)
6639*4bdc9457SAndroid Build Coastguard Worker .k(k)
6640*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6641*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6642*4bdc9457SAndroid Build Coastguard Worker }
6643*4bdc9457SAndroid Build Coastguard Worker }
6644*4bdc9457SAndroid Build Coastguard Worker }
6645*4bdc9457SAndroid Build Coastguard Worker }
6646*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,n_gt_4)6647*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, n_gt_4) {
6648*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 5; n < 8; n++) {
6649*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6650*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6651*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6652*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6653*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6654*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6655*4bdc9457SAndroid Build Coastguard Worker .m(2)
6656*4bdc9457SAndroid Build Coastguard Worker .n(n)
6657*4bdc9457SAndroid Build Coastguard Worker .k(k)
6658*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6659*4bdc9457SAndroid Build Coastguard Worker }
6660*4bdc9457SAndroid Build Coastguard Worker }
6661*4bdc9457SAndroid Build Coastguard Worker }
6662*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,n_gt_4_strided_cn)6663*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, n_gt_4_strided_cn) {
6664*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 5; n < 8; n++) {
6665*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6666*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6667*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6668*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6669*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6670*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6671*4bdc9457SAndroid Build Coastguard Worker .m(2)
6672*4bdc9457SAndroid Build Coastguard Worker .n(n)
6673*4bdc9457SAndroid Build Coastguard Worker .k(k)
6674*4bdc9457SAndroid Build Coastguard Worker .cn_stride(7)
6675*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6676*4bdc9457SAndroid Build Coastguard Worker }
6677*4bdc9457SAndroid Build Coastguard Worker }
6678*4bdc9457SAndroid Build Coastguard Worker }
6679*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,n_gt_4_strided_a)6680*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, n_gt_4_strided_a) {
6681*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 5; n < 8; n++) {
6682*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6683*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6684*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6685*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6686*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6687*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6688*4bdc9457SAndroid Build Coastguard Worker .m(2)
6689*4bdc9457SAndroid Build Coastguard Worker .n(n)
6690*4bdc9457SAndroid Build Coastguard Worker .k(k)
6691*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
6692*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6693*4bdc9457SAndroid Build Coastguard Worker }
6694*4bdc9457SAndroid Build Coastguard Worker }
6695*4bdc9457SAndroid Build Coastguard Worker }
6696*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,n_gt_4_subtile)6697*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, n_gt_4_subtile) {
6698*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 5; n < 8; n++) {
6699*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6700*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 2; m++) {
6701*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6702*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6703*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6704*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6705*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6706*4bdc9457SAndroid Build Coastguard Worker .m(m)
6707*4bdc9457SAndroid Build Coastguard Worker .n(n)
6708*4bdc9457SAndroid Build Coastguard Worker .k(k)
6709*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6710*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6711*4bdc9457SAndroid Build Coastguard Worker }
6712*4bdc9457SAndroid Build Coastguard Worker }
6713*4bdc9457SAndroid Build Coastguard Worker }
6714*4bdc9457SAndroid Build Coastguard Worker }
6715*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,n_div_4)6716*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, n_div_4) {
6717*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 8; n <= 12; n += 4) {
6718*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6719*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6720*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6721*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6722*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6723*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6724*4bdc9457SAndroid Build Coastguard Worker .m(2)
6725*4bdc9457SAndroid Build Coastguard Worker .n(n)
6726*4bdc9457SAndroid Build Coastguard Worker .k(k)
6727*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6728*4bdc9457SAndroid Build Coastguard Worker }
6729*4bdc9457SAndroid Build Coastguard Worker }
6730*4bdc9457SAndroid Build Coastguard Worker }
6731*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,n_div_4_strided_cn)6732*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, n_div_4_strided_cn) {
6733*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 8; n <= 12; n += 4) {
6734*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6735*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6736*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6737*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6738*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6739*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6740*4bdc9457SAndroid Build Coastguard Worker .m(2)
6741*4bdc9457SAndroid Build Coastguard Worker .n(n)
6742*4bdc9457SAndroid Build Coastguard Worker .k(k)
6743*4bdc9457SAndroid Build Coastguard Worker .cn_stride(7)
6744*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6745*4bdc9457SAndroid Build Coastguard Worker }
6746*4bdc9457SAndroid Build Coastguard Worker }
6747*4bdc9457SAndroid Build Coastguard Worker }
6748*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,n_div_4_strided_a)6749*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, n_div_4_strided_a) {
6750*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 8; n <= 12; n += 4) {
6751*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6752*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6753*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6754*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6755*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6756*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6757*4bdc9457SAndroid Build Coastguard Worker .m(2)
6758*4bdc9457SAndroid Build Coastguard Worker .n(n)
6759*4bdc9457SAndroid Build Coastguard Worker .k(k)
6760*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
6761*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6762*4bdc9457SAndroid Build Coastguard Worker }
6763*4bdc9457SAndroid Build Coastguard Worker }
6764*4bdc9457SAndroid Build Coastguard Worker }
6765*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,n_div_4_subtile)6766*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, n_div_4_subtile) {
6767*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 8; n <= 12; n += 4) {
6768*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6769*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 2; m++) {
6770*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6771*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6772*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6773*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6774*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6775*4bdc9457SAndroid Build Coastguard Worker .m(m)
6776*4bdc9457SAndroid Build Coastguard Worker .n(n)
6777*4bdc9457SAndroid Build Coastguard Worker .k(k)
6778*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6779*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6780*4bdc9457SAndroid Build Coastguard Worker }
6781*4bdc9457SAndroid Build Coastguard Worker }
6782*4bdc9457SAndroid Build Coastguard Worker }
6783*4bdc9457SAndroid Build Coastguard Worker }
6784*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,strided_cm_subtile)6785*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, strided_cm_subtile) {
6786*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6787*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 4; n++) {
6788*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 2; m++) {
6789*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6790*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6791*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6792*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6793*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6794*4bdc9457SAndroid Build Coastguard Worker .m(m)
6795*4bdc9457SAndroid Build Coastguard Worker .n(n)
6796*4bdc9457SAndroid Build Coastguard Worker .k(k)
6797*4bdc9457SAndroid Build Coastguard Worker .cm_stride(7)
6798*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6799*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6800*4bdc9457SAndroid Build Coastguard Worker }
6801*4bdc9457SAndroid Build Coastguard Worker }
6802*4bdc9457SAndroid Build Coastguard Worker }
6803*4bdc9457SAndroid Build Coastguard Worker }
6804*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__WASM,strided_cm)6805*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__WASM, strided_cm) {
6806*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6807*4bdc9457SAndroid Build Coastguard Worker .mr(2)
6808*4bdc9457SAndroid Build Coastguard Worker .nr(4)
6809*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6810*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6811*4bdc9457SAndroid Build Coastguard Worker .m(2)
6812*4bdc9457SAndroid Build Coastguard Worker .n(4)
6813*4bdc9457SAndroid Build Coastguard Worker .k(1)
6814*4bdc9457SAndroid Build Coastguard Worker .cm_stride(7)
6815*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__wasm);
6816*4bdc9457SAndroid Build Coastguard Worker }
6817*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
6818*4bdc9457SAndroid Build Coastguard Worker
6819*4bdc9457SAndroid Build Coastguard Worker
6820*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_4X2__WASM,k_eq_1)6821*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, k_eq_1) {
6822*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6823*4bdc9457SAndroid Build Coastguard Worker .mr(4)
6824*4bdc9457SAndroid Build Coastguard Worker .nr(2)
6825*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6826*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6827*4bdc9457SAndroid Build Coastguard Worker .m(4)
6828*4bdc9457SAndroid Build Coastguard Worker .n(2)
6829*4bdc9457SAndroid Build Coastguard Worker .k(1)
6830*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
6831*4bdc9457SAndroid Build Coastguard Worker }
6832*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,strided_cn)6833*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, strided_cn) {
6834*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6835*4bdc9457SAndroid Build Coastguard Worker .mr(4)
6836*4bdc9457SAndroid Build Coastguard Worker .nr(2)
6837*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6838*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6839*4bdc9457SAndroid Build Coastguard Worker .m(4)
6840*4bdc9457SAndroid Build Coastguard Worker .n(2)
6841*4bdc9457SAndroid Build Coastguard Worker .k(1)
6842*4bdc9457SAndroid Build Coastguard Worker .cn_stride(5)
6843*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
6844*4bdc9457SAndroid Build Coastguard Worker }
6845*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,k_eq_1_strided_a)6846*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, k_eq_1_strided_a) {
6847*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6848*4bdc9457SAndroid Build Coastguard Worker .mr(4)
6849*4bdc9457SAndroid Build Coastguard Worker .nr(2)
6850*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6851*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6852*4bdc9457SAndroid Build Coastguard Worker .m(4)
6853*4bdc9457SAndroid Build Coastguard Worker .n(2)
6854*4bdc9457SAndroid Build Coastguard Worker .k(1)
6855*4bdc9457SAndroid Build Coastguard Worker .a_stride(3)
6856*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
6857*4bdc9457SAndroid Build Coastguard Worker }
6858*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,k_eq_1_subtile)6859*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, k_eq_1_subtile) {
6860*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 2; n++) {
6861*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
6862*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6863*4bdc9457SAndroid Build Coastguard Worker .mr(4)
6864*4bdc9457SAndroid Build Coastguard Worker .nr(2)
6865*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6866*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6867*4bdc9457SAndroid Build Coastguard Worker .m(m)
6868*4bdc9457SAndroid Build Coastguard Worker .n(n)
6869*4bdc9457SAndroid Build Coastguard Worker .k(1)
6870*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6871*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
6872*4bdc9457SAndroid Build Coastguard Worker }
6873*4bdc9457SAndroid Build Coastguard Worker }
6874*4bdc9457SAndroid Build Coastguard Worker }
6875*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,k_eq_1_subtile_m)6876*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, k_eq_1_subtile_m) {
6877*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
6878*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6879*4bdc9457SAndroid Build Coastguard Worker .mr(4)
6880*4bdc9457SAndroid Build Coastguard Worker .nr(2)
6881*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6882*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6883*4bdc9457SAndroid Build Coastguard Worker .m(m)
6884*4bdc9457SAndroid Build Coastguard Worker .n(2)
6885*4bdc9457SAndroid Build Coastguard Worker .k(1)
6886*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6887*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
6888*4bdc9457SAndroid Build Coastguard Worker }
6889*4bdc9457SAndroid Build Coastguard Worker }
6890*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,k_eq_1_subtile_n)6891*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, k_eq_1_subtile_n) {
6892*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 2; n++) {
6893*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6894*4bdc9457SAndroid Build Coastguard Worker .mr(4)
6895*4bdc9457SAndroid Build Coastguard Worker .nr(2)
6896*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6897*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6898*4bdc9457SAndroid Build Coastguard Worker .m(4)
6899*4bdc9457SAndroid Build Coastguard Worker .n(n)
6900*4bdc9457SAndroid Build Coastguard Worker .k(1)
6901*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6902*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
6903*4bdc9457SAndroid Build Coastguard Worker }
6904*4bdc9457SAndroid Build Coastguard Worker }
6905*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,k_gt_1)6906*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, k_gt_1) {
6907*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
6908*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6909*4bdc9457SAndroid Build Coastguard Worker .mr(4)
6910*4bdc9457SAndroid Build Coastguard Worker .nr(2)
6911*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6912*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6913*4bdc9457SAndroid Build Coastguard Worker .m(4)
6914*4bdc9457SAndroid Build Coastguard Worker .n(2)
6915*4bdc9457SAndroid Build Coastguard Worker .k(k)
6916*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
6917*4bdc9457SAndroid Build Coastguard Worker }
6918*4bdc9457SAndroid Build Coastguard Worker }
6919*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,k_gt_1_strided_a)6920*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, k_gt_1_strided_a) {
6921*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
6922*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6923*4bdc9457SAndroid Build Coastguard Worker .mr(4)
6924*4bdc9457SAndroid Build Coastguard Worker .nr(2)
6925*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6926*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6927*4bdc9457SAndroid Build Coastguard Worker .m(4)
6928*4bdc9457SAndroid Build Coastguard Worker .n(2)
6929*4bdc9457SAndroid Build Coastguard Worker .k(k)
6930*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
6931*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
6932*4bdc9457SAndroid Build Coastguard Worker }
6933*4bdc9457SAndroid Build Coastguard Worker }
6934*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,k_gt_1_subtile)6935*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, k_gt_1_subtile) {
6936*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
6937*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 2; n++) {
6938*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
6939*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6940*4bdc9457SAndroid Build Coastguard Worker .mr(4)
6941*4bdc9457SAndroid Build Coastguard Worker .nr(2)
6942*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6943*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6944*4bdc9457SAndroid Build Coastguard Worker .m(m)
6945*4bdc9457SAndroid Build Coastguard Worker .n(n)
6946*4bdc9457SAndroid Build Coastguard Worker .k(k)
6947*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
6948*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
6949*4bdc9457SAndroid Build Coastguard Worker }
6950*4bdc9457SAndroid Build Coastguard Worker }
6951*4bdc9457SAndroid Build Coastguard Worker }
6952*4bdc9457SAndroid Build Coastguard Worker }
6953*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,n_gt_2)6954*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, n_gt_2) {
6955*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 3; n < 4; n++) {
6956*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6957*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6958*4bdc9457SAndroid Build Coastguard Worker .mr(4)
6959*4bdc9457SAndroid Build Coastguard Worker .nr(2)
6960*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6961*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6962*4bdc9457SAndroid Build Coastguard Worker .m(4)
6963*4bdc9457SAndroid Build Coastguard Worker .n(n)
6964*4bdc9457SAndroid Build Coastguard Worker .k(k)
6965*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
6966*4bdc9457SAndroid Build Coastguard Worker }
6967*4bdc9457SAndroid Build Coastguard Worker }
6968*4bdc9457SAndroid Build Coastguard Worker }
6969*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,n_gt_2_strided_cn)6970*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, n_gt_2_strided_cn) {
6971*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 3; n < 4; n++) {
6972*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6973*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6974*4bdc9457SAndroid Build Coastguard Worker .mr(4)
6975*4bdc9457SAndroid Build Coastguard Worker .nr(2)
6976*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6977*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6978*4bdc9457SAndroid Build Coastguard Worker .m(4)
6979*4bdc9457SAndroid Build Coastguard Worker .n(n)
6980*4bdc9457SAndroid Build Coastguard Worker .k(k)
6981*4bdc9457SAndroid Build Coastguard Worker .cn_stride(5)
6982*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
6983*4bdc9457SAndroid Build Coastguard Worker }
6984*4bdc9457SAndroid Build Coastguard Worker }
6985*4bdc9457SAndroid Build Coastguard Worker }
6986*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,n_gt_2_strided_a)6987*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, n_gt_2_strided_a) {
6988*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 3; n < 4; n++) {
6989*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
6990*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
6991*4bdc9457SAndroid Build Coastguard Worker .mr(4)
6992*4bdc9457SAndroid Build Coastguard Worker .nr(2)
6993*4bdc9457SAndroid Build Coastguard Worker .kr(1)
6994*4bdc9457SAndroid Build Coastguard Worker .sr(1)
6995*4bdc9457SAndroid Build Coastguard Worker .m(4)
6996*4bdc9457SAndroid Build Coastguard Worker .n(n)
6997*4bdc9457SAndroid Build Coastguard Worker .k(k)
6998*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
6999*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
7000*4bdc9457SAndroid Build Coastguard Worker }
7001*4bdc9457SAndroid Build Coastguard Worker }
7002*4bdc9457SAndroid Build Coastguard Worker }
7003*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,n_gt_2_subtile)7004*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, n_gt_2_subtile) {
7005*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 3; n < 4; n++) {
7006*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7007*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
7008*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7009*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7010*4bdc9457SAndroid Build Coastguard Worker .nr(2)
7011*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7012*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7013*4bdc9457SAndroid Build Coastguard Worker .m(m)
7014*4bdc9457SAndroid Build Coastguard Worker .n(n)
7015*4bdc9457SAndroid Build Coastguard Worker .k(k)
7016*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7017*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
7018*4bdc9457SAndroid Build Coastguard Worker }
7019*4bdc9457SAndroid Build Coastguard Worker }
7020*4bdc9457SAndroid Build Coastguard Worker }
7021*4bdc9457SAndroid Build Coastguard Worker }
7022*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,n_div_2)7023*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, n_div_2) {
7024*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 4; n <= 6; n += 2) {
7025*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7026*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7027*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7028*4bdc9457SAndroid Build Coastguard Worker .nr(2)
7029*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7030*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7031*4bdc9457SAndroid Build Coastguard Worker .m(4)
7032*4bdc9457SAndroid Build Coastguard Worker .n(n)
7033*4bdc9457SAndroid Build Coastguard Worker .k(k)
7034*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
7035*4bdc9457SAndroid Build Coastguard Worker }
7036*4bdc9457SAndroid Build Coastguard Worker }
7037*4bdc9457SAndroid Build Coastguard Worker }
7038*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,n_div_2_strided_cn)7039*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, n_div_2_strided_cn) {
7040*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 4; n <= 6; n += 2) {
7041*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7042*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7043*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7044*4bdc9457SAndroid Build Coastguard Worker .nr(2)
7045*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7046*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7047*4bdc9457SAndroid Build Coastguard Worker .m(4)
7048*4bdc9457SAndroid Build Coastguard Worker .n(n)
7049*4bdc9457SAndroid Build Coastguard Worker .k(k)
7050*4bdc9457SAndroid Build Coastguard Worker .cn_stride(5)
7051*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
7052*4bdc9457SAndroid Build Coastguard Worker }
7053*4bdc9457SAndroid Build Coastguard Worker }
7054*4bdc9457SAndroid Build Coastguard Worker }
7055*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,n_div_2_strided_a)7056*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, n_div_2_strided_a) {
7057*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 4; n <= 6; n += 2) {
7058*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7059*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7060*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7061*4bdc9457SAndroid Build Coastguard Worker .nr(2)
7062*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7063*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7064*4bdc9457SAndroid Build Coastguard Worker .m(4)
7065*4bdc9457SAndroid Build Coastguard Worker .n(n)
7066*4bdc9457SAndroid Build Coastguard Worker .k(k)
7067*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
7068*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
7069*4bdc9457SAndroid Build Coastguard Worker }
7070*4bdc9457SAndroid Build Coastguard Worker }
7071*4bdc9457SAndroid Build Coastguard Worker }
7072*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,n_div_2_subtile)7073*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, n_div_2_subtile) {
7074*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 4; n <= 6; n += 2) {
7075*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7076*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
7077*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7078*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7079*4bdc9457SAndroid Build Coastguard Worker .nr(2)
7080*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7081*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7082*4bdc9457SAndroid Build Coastguard Worker .m(m)
7083*4bdc9457SAndroid Build Coastguard Worker .n(n)
7084*4bdc9457SAndroid Build Coastguard Worker .k(k)
7085*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7086*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
7087*4bdc9457SAndroid Build Coastguard Worker }
7088*4bdc9457SAndroid Build Coastguard Worker }
7089*4bdc9457SAndroid Build Coastguard Worker }
7090*4bdc9457SAndroid Build Coastguard Worker }
7091*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,strided_cm_subtile)7092*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, strided_cm_subtile) {
7093*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7094*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 2; n++) {
7095*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
7096*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7097*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7098*4bdc9457SAndroid Build Coastguard Worker .nr(2)
7099*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7100*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7101*4bdc9457SAndroid Build Coastguard Worker .m(m)
7102*4bdc9457SAndroid Build Coastguard Worker .n(n)
7103*4bdc9457SAndroid Build Coastguard Worker .k(k)
7104*4bdc9457SAndroid Build Coastguard Worker .cm_stride(5)
7105*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7106*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
7107*4bdc9457SAndroid Build Coastguard Worker }
7108*4bdc9457SAndroid Build Coastguard Worker }
7109*4bdc9457SAndroid Build Coastguard Worker }
7110*4bdc9457SAndroid Build Coastguard Worker }
7111*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X2__WASM,strided_cm)7112*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X2__WASM, strided_cm) {
7113*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7114*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7115*4bdc9457SAndroid Build Coastguard Worker .nr(2)
7116*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7117*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7118*4bdc9457SAndroid Build Coastguard Worker .m(4)
7119*4bdc9457SAndroid Build Coastguard Worker .n(2)
7120*4bdc9457SAndroid Build Coastguard Worker .k(1)
7121*4bdc9457SAndroid Build Coastguard Worker .cm_stride(5)
7122*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x2__wasm);
7123*4bdc9457SAndroid Build Coastguard Worker }
7124*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
7125*4bdc9457SAndroid Build Coastguard Worker
7126*4bdc9457SAndroid Build Coastguard Worker
7127*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_RELU_4X4__WASM,k_eq_1)7128*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, k_eq_1) {
7129*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7130*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7131*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7132*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7133*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7134*4bdc9457SAndroid Build Coastguard Worker .m(4)
7135*4bdc9457SAndroid Build Coastguard Worker .n(4)
7136*4bdc9457SAndroid Build Coastguard Worker .k(1)
7137*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7138*4bdc9457SAndroid Build Coastguard Worker }
7139*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,strided_cn)7140*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, strided_cn) {
7141*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7142*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7143*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7144*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7145*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7146*4bdc9457SAndroid Build Coastguard Worker .m(4)
7147*4bdc9457SAndroid Build Coastguard Worker .n(4)
7148*4bdc9457SAndroid Build Coastguard Worker .k(1)
7149*4bdc9457SAndroid Build Coastguard Worker .cn_stride(7)
7150*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7151*4bdc9457SAndroid Build Coastguard Worker }
7152*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,k_eq_1_strided_a)7153*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, k_eq_1_strided_a) {
7154*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7155*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7156*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7157*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7158*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7159*4bdc9457SAndroid Build Coastguard Worker .m(4)
7160*4bdc9457SAndroid Build Coastguard Worker .n(4)
7161*4bdc9457SAndroid Build Coastguard Worker .k(1)
7162*4bdc9457SAndroid Build Coastguard Worker .a_stride(3)
7163*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7164*4bdc9457SAndroid Build Coastguard Worker }
7165*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,k_eq_1_subtile)7166*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, k_eq_1_subtile) {
7167*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 4; n++) {
7168*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
7169*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7170*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7171*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7172*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7173*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7174*4bdc9457SAndroid Build Coastguard Worker .m(m)
7175*4bdc9457SAndroid Build Coastguard Worker .n(n)
7176*4bdc9457SAndroid Build Coastguard Worker .k(1)
7177*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7178*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7179*4bdc9457SAndroid Build Coastguard Worker }
7180*4bdc9457SAndroid Build Coastguard Worker }
7181*4bdc9457SAndroid Build Coastguard Worker }
7182*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,k_eq_1_subtile_m)7183*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, k_eq_1_subtile_m) {
7184*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
7185*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7186*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7187*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7188*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7189*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7190*4bdc9457SAndroid Build Coastguard Worker .m(m)
7191*4bdc9457SAndroid Build Coastguard Worker .n(4)
7192*4bdc9457SAndroid Build Coastguard Worker .k(1)
7193*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7194*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7195*4bdc9457SAndroid Build Coastguard Worker }
7196*4bdc9457SAndroid Build Coastguard Worker }
7197*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,k_eq_1_subtile_n)7198*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, k_eq_1_subtile_n) {
7199*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 4; n++) {
7200*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7201*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7202*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7203*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7204*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7205*4bdc9457SAndroid Build Coastguard Worker .m(4)
7206*4bdc9457SAndroid Build Coastguard Worker .n(n)
7207*4bdc9457SAndroid Build Coastguard Worker .k(1)
7208*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7209*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7210*4bdc9457SAndroid Build Coastguard Worker }
7211*4bdc9457SAndroid Build Coastguard Worker }
7212*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,k_gt_1)7213*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, k_gt_1) {
7214*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
7215*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7216*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7217*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7218*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7219*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7220*4bdc9457SAndroid Build Coastguard Worker .m(4)
7221*4bdc9457SAndroid Build Coastguard Worker .n(4)
7222*4bdc9457SAndroid Build Coastguard Worker .k(k)
7223*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7224*4bdc9457SAndroid Build Coastguard Worker }
7225*4bdc9457SAndroid Build Coastguard Worker }
7226*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,k_gt_1_strided_a)7227*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, k_gt_1_strided_a) {
7228*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
7229*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7230*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7231*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7232*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7233*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7234*4bdc9457SAndroid Build Coastguard Worker .m(4)
7235*4bdc9457SAndroid Build Coastguard Worker .n(4)
7236*4bdc9457SAndroid Build Coastguard Worker .k(k)
7237*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
7238*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7239*4bdc9457SAndroid Build Coastguard Worker }
7240*4bdc9457SAndroid Build Coastguard Worker }
7241*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,k_gt_1_subtile)7242*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, k_gt_1_subtile) {
7243*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
7244*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 4; n++) {
7245*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
7246*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7247*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7248*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7249*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7250*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7251*4bdc9457SAndroid Build Coastguard Worker .m(m)
7252*4bdc9457SAndroid Build Coastguard Worker .n(n)
7253*4bdc9457SAndroid Build Coastguard Worker .k(k)
7254*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7255*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7256*4bdc9457SAndroid Build Coastguard Worker }
7257*4bdc9457SAndroid Build Coastguard Worker }
7258*4bdc9457SAndroid Build Coastguard Worker }
7259*4bdc9457SAndroid Build Coastguard Worker }
7260*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,n_gt_4)7261*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, n_gt_4) {
7262*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 5; n < 8; n++) {
7263*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7264*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7265*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7266*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7267*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7268*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7269*4bdc9457SAndroid Build Coastguard Worker .m(4)
7270*4bdc9457SAndroid Build Coastguard Worker .n(n)
7271*4bdc9457SAndroid Build Coastguard Worker .k(k)
7272*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7273*4bdc9457SAndroid Build Coastguard Worker }
7274*4bdc9457SAndroid Build Coastguard Worker }
7275*4bdc9457SAndroid Build Coastguard Worker }
7276*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,n_gt_4_strided_cn)7277*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, n_gt_4_strided_cn) {
7278*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 5; n < 8; n++) {
7279*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7280*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7281*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7282*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7283*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7284*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7285*4bdc9457SAndroid Build Coastguard Worker .m(4)
7286*4bdc9457SAndroid Build Coastguard Worker .n(n)
7287*4bdc9457SAndroid Build Coastguard Worker .k(k)
7288*4bdc9457SAndroid Build Coastguard Worker .cn_stride(7)
7289*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7290*4bdc9457SAndroid Build Coastguard Worker }
7291*4bdc9457SAndroid Build Coastguard Worker }
7292*4bdc9457SAndroid Build Coastguard Worker }
7293*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,n_gt_4_strided_a)7294*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, n_gt_4_strided_a) {
7295*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 5; n < 8; n++) {
7296*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7297*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7298*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7299*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7300*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7301*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7302*4bdc9457SAndroid Build Coastguard Worker .m(4)
7303*4bdc9457SAndroid Build Coastguard Worker .n(n)
7304*4bdc9457SAndroid Build Coastguard Worker .k(k)
7305*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
7306*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7307*4bdc9457SAndroid Build Coastguard Worker }
7308*4bdc9457SAndroid Build Coastguard Worker }
7309*4bdc9457SAndroid Build Coastguard Worker }
7310*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,n_gt_4_subtile)7311*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, n_gt_4_subtile) {
7312*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 5; n < 8; n++) {
7313*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7314*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
7315*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7316*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7317*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7318*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7319*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7320*4bdc9457SAndroid Build Coastguard Worker .m(m)
7321*4bdc9457SAndroid Build Coastguard Worker .n(n)
7322*4bdc9457SAndroid Build Coastguard Worker .k(k)
7323*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7324*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7325*4bdc9457SAndroid Build Coastguard Worker }
7326*4bdc9457SAndroid Build Coastguard Worker }
7327*4bdc9457SAndroid Build Coastguard Worker }
7328*4bdc9457SAndroid Build Coastguard Worker }
7329*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,n_div_4)7330*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, n_div_4) {
7331*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 8; n <= 12; n += 4) {
7332*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7333*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7334*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7335*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7336*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7337*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7338*4bdc9457SAndroid Build Coastguard Worker .m(4)
7339*4bdc9457SAndroid Build Coastguard Worker .n(n)
7340*4bdc9457SAndroid Build Coastguard Worker .k(k)
7341*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7342*4bdc9457SAndroid Build Coastguard Worker }
7343*4bdc9457SAndroid Build Coastguard Worker }
7344*4bdc9457SAndroid Build Coastguard Worker }
7345*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,n_div_4_strided_cn)7346*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, n_div_4_strided_cn) {
7347*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 8; n <= 12; n += 4) {
7348*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7349*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7350*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7351*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7352*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7353*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7354*4bdc9457SAndroid Build Coastguard Worker .m(4)
7355*4bdc9457SAndroid Build Coastguard Worker .n(n)
7356*4bdc9457SAndroid Build Coastguard Worker .k(k)
7357*4bdc9457SAndroid Build Coastguard Worker .cn_stride(7)
7358*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7359*4bdc9457SAndroid Build Coastguard Worker }
7360*4bdc9457SAndroid Build Coastguard Worker }
7361*4bdc9457SAndroid Build Coastguard Worker }
7362*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,n_div_4_strided_a)7363*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, n_div_4_strided_a) {
7364*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 8; n <= 12; n += 4) {
7365*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7366*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7367*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7368*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7369*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7370*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7371*4bdc9457SAndroid Build Coastguard Worker .m(4)
7372*4bdc9457SAndroid Build Coastguard Worker .n(n)
7373*4bdc9457SAndroid Build Coastguard Worker .k(k)
7374*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
7375*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7376*4bdc9457SAndroid Build Coastguard Worker }
7377*4bdc9457SAndroid Build Coastguard Worker }
7378*4bdc9457SAndroid Build Coastguard Worker }
7379*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,n_div_4_subtile)7380*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, n_div_4_subtile) {
7381*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 8; n <= 12; n += 4) {
7382*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7383*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
7384*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7385*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7386*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7387*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7388*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7389*4bdc9457SAndroid Build Coastguard Worker .m(m)
7390*4bdc9457SAndroid Build Coastguard Worker .n(n)
7391*4bdc9457SAndroid Build Coastguard Worker .k(k)
7392*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7393*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7394*4bdc9457SAndroid Build Coastguard Worker }
7395*4bdc9457SAndroid Build Coastguard Worker }
7396*4bdc9457SAndroid Build Coastguard Worker }
7397*4bdc9457SAndroid Build Coastguard Worker }
7398*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,strided_cm_subtile)7399*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, strided_cm_subtile) {
7400*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7401*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 4; n++) {
7402*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 4; m++) {
7403*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7404*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7405*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7406*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7407*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7408*4bdc9457SAndroid Build Coastguard Worker .m(m)
7409*4bdc9457SAndroid Build Coastguard Worker .n(n)
7410*4bdc9457SAndroid Build Coastguard Worker .k(k)
7411*4bdc9457SAndroid Build Coastguard Worker .cm_stride(7)
7412*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7413*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7414*4bdc9457SAndroid Build Coastguard Worker }
7415*4bdc9457SAndroid Build Coastguard Worker }
7416*4bdc9457SAndroid Build Coastguard Worker }
7417*4bdc9457SAndroid Build Coastguard Worker }
7418*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_4X4__WASM,strided_cm)7419*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_4X4__WASM, strided_cm) {
7420*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7421*4bdc9457SAndroid Build Coastguard Worker .mr(4)
7422*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7423*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7424*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7425*4bdc9457SAndroid Build Coastguard Worker .m(4)
7426*4bdc9457SAndroid Build Coastguard Worker .n(4)
7427*4bdc9457SAndroid Build Coastguard Worker .k(1)
7428*4bdc9457SAndroid Build Coastguard Worker .cm_stride(7)
7429*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_4x4__wasm);
7430*4bdc9457SAndroid Build Coastguard Worker }
7431*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
7432*4bdc9457SAndroid Build Coastguard Worker
7433*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,k_eq_1)7434*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, k_eq_1) {
7435*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7436*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7437*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7438*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7439*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7440*4bdc9457SAndroid Build Coastguard Worker .m(2)
7441*4bdc9457SAndroid Build Coastguard Worker .n(4)
7442*4bdc9457SAndroid Build Coastguard Worker .k(1)
7443*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7444*4bdc9457SAndroid Build Coastguard Worker }
7445*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,strided_cn)7446*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, strided_cn) {
7447*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7448*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7449*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7450*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7451*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7452*4bdc9457SAndroid Build Coastguard Worker .m(2)
7453*4bdc9457SAndroid Build Coastguard Worker .n(4)
7454*4bdc9457SAndroid Build Coastguard Worker .k(1)
7455*4bdc9457SAndroid Build Coastguard Worker .cn_stride(7)
7456*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7457*4bdc9457SAndroid Build Coastguard Worker }
7458*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,k_eq_1_strided_a)7459*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, k_eq_1_strided_a) {
7460*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7461*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7462*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7463*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7464*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7465*4bdc9457SAndroid Build Coastguard Worker .m(2)
7466*4bdc9457SAndroid Build Coastguard Worker .n(4)
7467*4bdc9457SAndroid Build Coastguard Worker .k(1)
7468*4bdc9457SAndroid Build Coastguard Worker .a_stride(3)
7469*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7470*4bdc9457SAndroid Build Coastguard Worker }
7471*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,k_eq_1_subtile)7472*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, k_eq_1_subtile) {
7473*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 4; n++) {
7474*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 2; m++) {
7475*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7476*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7477*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7478*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7479*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7480*4bdc9457SAndroid Build Coastguard Worker .m(m)
7481*4bdc9457SAndroid Build Coastguard Worker .n(n)
7482*4bdc9457SAndroid Build Coastguard Worker .k(1)
7483*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7484*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7485*4bdc9457SAndroid Build Coastguard Worker }
7486*4bdc9457SAndroid Build Coastguard Worker }
7487*4bdc9457SAndroid Build Coastguard Worker }
7488*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,k_eq_1_subtile_m)7489*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, k_eq_1_subtile_m) {
7490*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 2; m++) {
7491*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7492*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7493*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7494*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7495*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7496*4bdc9457SAndroid Build Coastguard Worker .m(m)
7497*4bdc9457SAndroid Build Coastguard Worker .n(4)
7498*4bdc9457SAndroid Build Coastguard Worker .k(1)
7499*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7500*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7501*4bdc9457SAndroid Build Coastguard Worker }
7502*4bdc9457SAndroid Build Coastguard Worker }
7503*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,k_eq_1_subtile_n)7504*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, k_eq_1_subtile_n) {
7505*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 4; n++) {
7506*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7507*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7508*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7509*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7510*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7511*4bdc9457SAndroid Build Coastguard Worker .m(2)
7512*4bdc9457SAndroid Build Coastguard Worker .n(n)
7513*4bdc9457SAndroid Build Coastguard Worker .k(1)
7514*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7515*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7516*4bdc9457SAndroid Build Coastguard Worker }
7517*4bdc9457SAndroid Build Coastguard Worker }
7518*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,k_gt_1)7519*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, k_gt_1) {
7520*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
7521*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7522*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7523*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7524*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7525*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7526*4bdc9457SAndroid Build Coastguard Worker .m(2)
7527*4bdc9457SAndroid Build Coastguard Worker .n(4)
7528*4bdc9457SAndroid Build Coastguard Worker .k(k)
7529*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7530*4bdc9457SAndroid Build Coastguard Worker }
7531*4bdc9457SAndroid Build Coastguard Worker }
7532*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,k_gt_1_strided_a)7533*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, k_gt_1_strided_a) {
7534*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
7535*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7536*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7537*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7538*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7539*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7540*4bdc9457SAndroid Build Coastguard Worker .m(2)
7541*4bdc9457SAndroid Build Coastguard Worker .n(4)
7542*4bdc9457SAndroid Build Coastguard Worker .k(k)
7543*4bdc9457SAndroid Build Coastguard Worker .a_stride(11)
7544*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7545*4bdc9457SAndroid Build Coastguard Worker }
7546*4bdc9457SAndroid Build Coastguard Worker }
7547*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,k_gt_1_subtile)7548*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, k_gt_1_subtile) {
7549*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 2; k < 10; k++) {
7550*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 4; n++) {
7551*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 2; m++) {
7552*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7553*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7554*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7555*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7556*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7557*4bdc9457SAndroid Build Coastguard Worker .m(m)
7558*4bdc9457SAndroid Build Coastguard Worker .n(n)
7559*4bdc9457SAndroid Build Coastguard Worker .k(k)
7560*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7561*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7562*4bdc9457SAndroid Build Coastguard Worker }
7563*4bdc9457SAndroid Build Coastguard Worker }
7564*4bdc9457SAndroid Build Coastguard Worker }
7565*4bdc9457SAndroid Build Coastguard Worker }
7566*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,n_gt_4)7567*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, n_gt_4) {
7568*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 5; n < 8; n++) {
7569*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7570*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7571*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7572*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7573*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7574*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7575*4bdc9457SAndroid Build Coastguard Worker .m(2)
7576*4bdc9457SAndroid Build Coastguard Worker .n(n)
7577*4bdc9457SAndroid Build Coastguard Worker .k(k)
7578*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7579*4bdc9457SAndroid Build Coastguard Worker }
7580*4bdc9457SAndroid Build Coastguard Worker }
7581*4bdc9457SAndroid Build Coastguard Worker }
7582*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,n_gt_4_strided_cn)7583*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, n_gt_4_strided_cn) {
7584*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 5; n < 8; n++) {
7585*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7586*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7587*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7588*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7589*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7590*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7591*4bdc9457SAndroid Build Coastguard Worker .m(2)
7592*4bdc9457SAndroid Build Coastguard Worker .n(n)
7593*4bdc9457SAndroid Build Coastguard Worker .k(k)
7594*4bdc9457SAndroid Build Coastguard Worker .cn_stride(7)
7595*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7596*4bdc9457SAndroid Build Coastguard Worker }
7597*4bdc9457SAndroid Build Coastguard Worker }
7598*4bdc9457SAndroid Build Coastguard Worker }
7599*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,n_gt_4_strided_a)7600*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, n_gt_4_strided_a) {
7601*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 5; n < 8; n++) {
7602*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7603*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7604*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7605*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7606*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7607*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7608*4bdc9457SAndroid Build Coastguard Worker .m(2)
7609*4bdc9457SAndroid Build Coastguard Worker .n(n)
7610*4bdc9457SAndroid Build Coastguard Worker .k(k)
7611*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
7612*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7613*4bdc9457SAndroid Build Coastguard Worker }
7614*4bdc9457SAndroid Build Coastguard Worker }
7615*4bdc9457SAndroid Build Coastguard Worker }
7616*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,n_gt_4_subtile)7617*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, n_gt_4_subtile) {
7618*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 5; n < 8; n++) {
7619*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7620*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 2; m++) {
7621*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7622*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7623*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7624*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7625*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7626*4bdc9457SAndroid Build Coastguard Worker .m(m)
7627*4bdc9457SAndroid Build Coastguard Worker .n(n)
7628*4bdc9457SAndroid Build Coastguard Worker .k(k)
7629*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7630*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7631*4bdc9457SAndroid Build Coastguard Worker }
7632*4bdc9457SAndroid Build Coastguard Worker }
7633*4bdc9457SAndroid Build Coastguard Worker }
7634*4bdc9457SAndroid Build Coastguard Worker }
7635*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,n_div_4)7636*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, n_div_4) {
7637*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 8; n <= 12; n += 4) {
7638*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7639*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7640*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7641*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7642*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7643*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7644*4bdc9457SAndroid Build Coastguard Worker .m(2)
7645*4bdc9457SAndroid Build Coastguard Worker .n(n)
7646*4bdc9457SAndroid Build Coastguard Worker .k(k)
7647*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7648*4bdc9457SAndroid Build Coastguard Worker }
7649*4bdc9457SAndroid Build Coastguard Worker }
7650*4bdc9457SAndroid Build Coastguard Worker }
7651*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,n_div_4_strided_cn)7652*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, n_div_4_strided_cn) {
7653*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 8; n <= 12; n += 4) {
7654*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7655*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7656*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7657*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7658*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7659*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7660*4bdc9457SAndroid Build Coastguard Worker .m(2)
7661*4bdc9457SAndroid Build Coastguard Worker .n(n)
7662*4bdc9457SAndroid Build Coastguard Worker .k(k)
7663*4bdc9457SAndroid Build Coastguard Worker .cn_stride(7)
7664*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7665*4bdc9457SAndroid Build Coastguard Worker }
7666*4bdc9457SAndroid Build Coastguard Worker }
7667*4bdc9457SAndroid Build Coastguard Worker }
7668*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,n_div_4_strided_a)7669*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, n_div_4_strided_a) {
7670*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 8; n <= 12; n += 4) {
7671*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7672*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7673*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7674*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7675*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7676*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7677*4bdc9457SAndroid Build Coastguard Worker .m(2)
7678*4bdc9457SAndroid Build Coastguard Worker .n(n)
7679*4bdc9457SAndroid Build Coastguard Worker .k(k)
7680*4bdc9457SAndroid Build Coastguard Worker .a_stride(7)
7681*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7682*4bdc9457SAndroid Build Coastguard Worker }
7683*4bdc9457SAndroid Build Coastguard Worker }
7684*4bdc9457SAndroid Build Coastguard Worker }
7685*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,n_div_4_subtile)7686*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, n_div_4_subtile) {
7687*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 8; n <= 12; n += 4) {
7688*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7689*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 2; m++) {
7690*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7691*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7692*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7693*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7694*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7695*4bdc9457SAndroid Build Coastguard Worker .m(m)
7696*4bdc9457SAndroid Build Coastguard Worker .n(n)
7697*4bdc9457SAndroid Build Coastguard Worker .k(k)
7698*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7699*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7700*4bdc9457SAndroid Build Coastguard Worker }
7701*4bdc9457SAndroid Build Coastguard Worker }
7702*4bdc9457SAndroid Build Coastguard Worker }
7703*4bdc9457SAndroid Build Coastguard Worker }
7704*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,strided_cm_subtile)7705*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, strided_cm_subtile) {
7706*4bdc9457SAndroid Build Coastguard Worker for (size_t k = 1; k <= 5; k += 2) {
7707*4bdc9457SAndroid Build Coastguard Worker for (uint32_t n = 1; n <= 4; n++) {
7708*4bdc9457SAndroid Build Coastguard Worker for (uint32_t m = 1; m <= 2; m++) {
7709*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7710*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7711*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7712*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7713*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7714*4bdc9457SAndroid Build Coastguard Worker .m(m)
7715*4bdc9457SAndroid Build Coastguard Worker .n(n)
7716*4bdc9457SAndroid Build Coastguard Worker .k(k)
7717*4bdc9457SAndroid Build Coastguard Worker .cm_stride(7)
7718*4bdc9457SAndroid Build Coastguard Worker .iterations(1)
7719*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7720*4bdc9457SAndroid Build Coastguard Worker }
7721*4bdc9457SAndroid Build Coastguard Worker }
7722*4bdc9457SAndroid Build Coastguard Worker }
7723*4bdc9457SAndroid Build Coastguard Worker }
7724*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_RELU_2X4__SCALAR,strided_cm)7725*4bdc9457SAndroid Build Coastguard Worker TEST(F32_GEMM_RELU_2X4__SCALAR, strided_cm) {
7726*4bdc9457SAndroid Build Coastguard Worker GemmMicrokernelTester()
7727*4bdc9457SAndroid Build Coastguard Worker .mr(2)
7728*4bdc9457SAndroid Build Coastguard Worker .nr(4)
7729*4bdc9457SAndroid Build Coastguard Worker .kr(1)
7730*4bdc9457SAndroid Build Coastguard Worker .sr(1)
7731*4bdc9457SAndroid Build Coastguard Worker .m(2)
7732*4bdc9457SAndroid Build Coastguard Worker .n(4)
7733*4bdc9457SAndroid Build Coastguard Worker .k(1)
7734*4bdc9457SAndroid Build Coastguard Worker .cm_stride(7)
7735*4bdc9457SAndroid Build Coastguard Worker .Test(xnn_f32_gemm_relu_ukernel_2x4__scalar);
7736*4bdc9457SAndroid Build Coastguard Worker }
7737