// Copyright (c) Facebook, Inc. and its affiliates.
// All rights reserved.
//
// Copyright 2019 Google LLC
//
// This source code is licensed under the BSD-style license found in the
// LICENSE file in the root directory of this source tree.
//
// Auto-generated file. Do not edit!
// Specification: test/f32-gemm-relu.yaml
// Generator: tools/generate-gemm-test.py


#include <gtest/gtest.h>

#include <xnnpack/allocator.h>
#include <xnnpack/common.h>
#include <xnnpack/isa-checks.h>
#include <xnnpack/microparams-init.h>

#include <xnnpack/gemm.h>
#include <xnnpack/igemm.h>
#include <xnnpack/ppmm.h>
#include "gemm-microkernel-tester.h"


#if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Runs the 1x8 wasmsimd loadsplat RELU GEMM microkernel on a full tile
// (m = 1, n = 8) with k = 1.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, k_eq_1) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(1)
    .n(8)
    .k(1)
    .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
}

// Full tile (m = 1, n = 8, k = 1) with cn_stride set to 11.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(1)
    .n(8)
    .k(1)
    .cn_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
}

// Full tile (m = 1, n = 8, k = 1) with a_stride set to 3.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, k_eq_1_strided_a) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(1)
    .n(8)
    .k(1)
    .a_stride(3)
    .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
}

// Sweeps every (m, n) with n in 1..8 at k = 1, using iterations(1) per shape.
// The m loop visits only m = 1 because its bounds are 1..1.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 1; m++) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
    }
  }
}

// Sweeps m over 1..1 (a single value) with n = 8 and k = 1, using
// iterations(1).
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_m) {
  for (uint32_t m = 1; m <= 1; m++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(m)
      .n(8)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
  }
}

// Sweeps n over 1..8 with m = 1 and k = 1, using iterations(1) per shape.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(n)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
  }
}

// Full tile (m = 1, n = 8) for every k in 2..9.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, k_gt_1) {
  for (size_t k = 2; k < 10; k++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
  }
}

// Full tile (m = 1, n = 8) for every k in 2..9, with a_stride set to 11.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, k_gt_1_strided_a) {
  for (size_t k = 2; k < 10; k++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(8)
      .k(k)
      .a_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
  }
}

// Sweeps k in 2..9 and n in 1..8 (m loop visits only m = 1), using
// iterations(1) per shape.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, k_gt_1_subtile) {
  for (size_t k = 2; k < 10; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
      }
    }
  }
}

// Sweeps n in 9..15 (above nr = 8) and k in {1, 3, 5} with m = 1.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
    }
  }
}

// Sweeps n in 9..15 and k in {1, 3, 5} with m = 1 and cn_stride set to 11.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
    }
  }
}

// Sweeps n in 9..15 and k in {1, 3, 5} with m = 1 and a_stride set to 7.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_a) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .a_stride(7)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
    }
  }
}

// Sweeps n in 9..15 and k in {1, 3, 5} (m loop visits only m = 1), using
// iterations(1) per shape.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
      }
    }
  }
}

// Sweeps n in {16, 24} (multiples of nr = 8) and k in {1, 3, 5} with m = 1.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
    }
  }
}

// Sweeps n in {16, 24} and k in {1, 3, 5} with m = 1 and cn_stride set to 11.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
    }
  }
}

// Sweeps n in {16, 24} and k in {1, 3, 5} with m = 1 and a_stride set to 7.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .a_stride(7)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
    }
  }
}

// Sweeps n in {16, 24} and k in {1, 3, 5} (m loop visits only m = 1), using
// iterations(1) per shape.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
      }
    }
  }
}

// Sweeps k in {1, 3, 5} and n in 1..8 (m loop visits only m = 1) with
// cm_stride set to 11, using iterations(1) per shape.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, strided_cm_subtile) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
      }
    }
  }
}

// Full tile (m = 1, n = 8, k = 1) with cm_stride set to 11.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_LOADSPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(1)
    .n(8)
    .k(1)
    .cm_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat);
}
#endif  // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD


#if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Runs the 1x8 wasmsimd splat RELU GEMM microkernel on a full tile
// (m = 1, n = 8) with k = 4.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, k_eq_4) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(1)
    .n(8)
    .k(4)
    .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
}

// Full tile (m = 1, n = 8, k = 4) with cn_stride set to 11.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(1)
    .n(8)
    .k(4)
    .cn_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
}

// Full tile (m = 1, n = 8, k = 4) with a_stride set to 7.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, k_eq_4_strided_a) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(1)
    .n(8)
    .k(4)
    .a_stride(7)
    .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
}

// Sweeps every (m, n) with n in 1..8 at k = 4, using iterations(1) per shape.
// The m loop visits only m = 1 because its bounds are 1..1.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, k_eq_4_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 1; m++) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
    }
  }
}

// Sweeps m over 1..1 (a single value) with n = 8 and k = 4, using
// iterations(1).
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, k_eq_4_subtile_m) {
  for (uint32_t m = 1; m <= 1; m++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(m)
      .n(8)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
  }
}

// Sweeps n over 1..8 with m = 1 and k = 4, using iterations(1) per shape.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, k_eq_4_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(n)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
  }
}

// Full tile (m = 1, n = 8) for every k in 1..3.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, k_lt_4) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
  }
}

// Full tile (m = 1, n = 8) for every k in 1..3, with a_stride set to 7.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, k_lt_4_strided_a) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(8)
      .k(k)
      .a_stride(7)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
  }
}

// Sweeps k in 1..3 and n in 1..8 (m loop visits only m = 1), using
// iterations(1) per shape.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, k_lt_4_subtile) {
  for (size_t k = 1; k < 4; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
      }
    }
  }
}

// Full tile (m = 1, n = 8) for every k in 5..7.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, k_gt_4) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
  }
}

// Full tile (m = 1, n = 8) for every k in 5..7, with a_stride set to 11.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, k_gt_4_strided_a) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(8)
      .k(k)
      .a_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
  }
}

// For k in 5..7, runs every n in 1..8 (and the single m value 1) with one
// tester iteration per configuration.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, k_gt_4_subtile) {
  for (size_t k_size = 5; k_size < 8; ++k_size) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      // The m range is 1..1, so this loop body executes once.
      for (uint32_t m_size = 1; m_size <= 1; ++m_size) {
        GemmMicrokernelTester()
            .mr(1).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
      }
    }
  }
}
515*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 8, 12, ..., 40 (step 4) with m = 1 and n = 8.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, k_div_4) {
  for (size_t k_size = 8; k_size <= 40; k_size += 4) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(1)
        .m(1).n(8).k(k_size)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
  }
}
529*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 8, 12, ..., 40 (step 4) with a_stride set to 43.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, k_div_4_strided_a) {
  for (size_t k_size = 8; k_size <= 40; k_size += 4) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(1)
        .m(1).n(8).k(k_size)
        .a_stride(43)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
  }
}
544*4bdc9457SAndroid Build Coastguard Worker
// For k in 8, 12, ..., 40, runs every n in 1..8 (and the single m value 1)
// with one tester iteration per configuration.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, k_div_4_subtile) {
  for (size_t k_size = 8; k_size <= 40; k_size += 4) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      // The m range is 1..1, so this loop body executes once.
      for (uint32_t m_size = 1; m_size <= 1; ++m_size) {
        GemmMicrokernelTester()
            .mr(1).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
      }
    }
  }
}
563*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15 and, for each n, k over 1, 6, 11, 16 with m = 1.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, n_gt_8) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(1).n(n_size).k(k_size)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
    }
  }
}
579*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15 and k over 1, 6, 11, 16 with cn_stride set to 11.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, n_gt_8_strided_cn) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(1).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
    }
  }
}
596*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15 and k over 1, 6, 11, 16 with a_stride set to 23.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, n_gt_8_strided_a) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(1).n(n_size).k(k_size)
          .a_stride(23)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
    }
  }
}
613*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15, k over 1, 6, 11, 16 and the single m value 1, with one
// tester iteration per configuration.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, n_gt_8_subtile) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      // The m range is 1..1, so this loop body executes once.
      for (uint32_t m_size = 1; m_size <= 1; ++m_size) {
        GemmMicrokernelTester()
            .mr(1).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
      }
    }
  }
}
632*4bdc9457SAndroid Build Coastguard Worker
// Runs n = 16 and n = 24, each with k over 1, 6, 11, 16 and m = 1.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, n_div_8) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(1).n(n_size).k(k_size)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
    }
  }
}
648*4bdc9457SAndroid Build Coastguard Worker
// Runs n = 16 and n = 24 with k over 1, 6, 11, 16 and cn_stride set to 11.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, n_div_8_strided_cn) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(1).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
    }
  }
}
665*4bdc9457SAndroid Build Coastguard Worker
// Runs n = 16 and n = 24 with k over 1, 6, 11, 16 and a_stride set to 23.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, n_div_8_strided_a) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(1).n(n_size).k(k_size)
          .a_stride(23)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
    }
  }
}
682*4bdc9457SAndroid Build Coastguard Worker
// Runs n = 16 and n = 24, k over 1, 6, 11, 16 and the single m value 1, with
// one tester iteration per configuration.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, n_div_8_subtile) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      // The m range is 1..1, so this loop body executes once.
      for (uint32_t m_size = 1; m_size <= 1; ++m_size) {
        GemmMicrokernelTester()
            .mr(1).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
      }
    }
  }
}
701*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 1, 6, 11, 16, n over 1..8 and the single m value 1, with
// cm_stride set to 11 and one tester iteration per configuration.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, strided_cm_subtile) {
  for (size_t k_size = 1; k_size <= 20; k_size += 5) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      // The m range is 1..1, so this loop body executes once.
      for (uint32_t m_size = 1; m_size <= 1; ++m_size) {
        GemmMicrokernelTester()
            .mr(1).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .cm_stride(11)
            .iterations(1)
            .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
      }
    }
  }
}
721*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 1, n = 8, k = 4 with cm_stride set to 11.
TEST(F32_GEMM_RELU_1X8__WASMSIMD_SPLAT, strided_cm) {
  GemmMicrokernelTester()
      .mr(1).nr(8).kr(1).sr(1)
      .m(1).n(8).k(4)
      .cm_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat);
}
734*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
735*4bdc9457SAndroid Build Coastguard Worker
736*4bdc9457SAndroid Build Coastguard Worker
737*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Single configuration: m = 1, n = 8, k = 4, with sr = 4 for the s4 kernel.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, k_eq_4) {
  GemmMicrokernelTester()
      .mr(1).nr(8).kr(1).sr(4)
      .m(1).n(8).k(4)
      .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
}
749*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 1, n = 8, k = 4 with cn_stride set to 11.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, strided_cn) {
  GemmMicrokernelTester()
      .mr(1).nr(8).kr(1).sr(4)
      .m(1).n(8).k(4)
      .cn_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
}
762*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 1, n = 8, k = 4 with a_stride set to 7.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, k_eq_4_strided_a) {
  GemmMicrokernelTester()
      .mr(1).nr(8).kr(1).sr(4)
      .m(1).n(8).k(4)
      .a_stride(7)
      .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
}
775*4bdc9457SAndroid Build Coastguard Worker
// With k fixed at 4, runs every n in 1..8 (and the single m value 1) with one
// tester iteration per configuration.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, k_eq_4_subtile) {
  for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
    // The m range is 1..1, so this loop body executes once.
    for (uint32_t m_size = 1; m_size <= 1; ++m_size) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(4)
          .m(m_size).n(n_size).k(4)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
    }
  }
}
792*4bdc9457SAndroid Build Coastguard Worker
// With n = 8 and k = 4, iterates m over its range 1..1 (a single pass) using
// one tester iteration.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, k_eq_4_subtile_m) {
  for (uint32_t m_size = 1; m_size <= 1; ++m_size) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(4)
        .m(m_size).n(8).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
  }
}
807*4bdc9457SAndroid Build Coastguard Worker
// With m = 1 and k = 4, runs every n in 1..8 using one tester iteration each.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, k_eq_4_subtile_n) {
  for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(4)
        .m(1).n(n_size).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
  }
}
822*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 1, 2, 3 with m = 1 and n = 8.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, k_lt_4) {
  for (size_t k_size = 1; k_size < 4; ++k_size) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(4)
        .m(1).n(8).k(k_size)
        .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
  }
}
836*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 1, 2, 3 with a_stride set to 7.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, k_lt_4_strided_a) {
  for (size_t k_size = 1; k_size < 4; ++k_size) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(4)
        .m(1).n(8).k(k_size)
        .a_stride(7)
        .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
  }
}
851*4bdc9457SAndroid Build Coastguard Worker
// For k in 1..3, runs every n in 1..8 (and the single m value 1) with one
// tester iteration per configuration.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, k_lt_4_subtile) {
  for (size_t k_size = 1; k_size < 4; ++k_size) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      // The m range is 1..1, so this loop body executes once.
      for (uint32_t m_size = 1; m_size <= 1; ++m_size) {
        GemmMicrokernelTester()
            .mr(1).nr(8).kr(1).sr(4)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
      }
    }
  }
}
870*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 5, 6, 7 with m = 1 and n = 8.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, k_gt_4) {
  for (size_t k_size = 5; k_size < 8; ++k_size) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(4)
        .m(1).n(8).k(k_size)
        .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
  }
}
884*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 5, 6, 7 with a_stride set to 11.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, k_gt_4_strided_a) {
  for (size_t k_size = 5; k_size < 8; ++k_size) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(4)
        .m(1).n(8).k(k_size)
        .a_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
  }
}
899*4bdc9457SAndroid Build Coastguard Worker
// For k in 5..7, runs every n in 1..8 (and the single m value 1) with one
// tester iteration per configuration.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, k_gt_4_subtile) {
  for (size_t k_size = 5; k_size < 8; ++k_size) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      // The m range is 1..1, so this loop body executes once.
      for (uint32_t m_size = 1; m_size <= 1; ++m_size) {
        GemmMicrokernelTester()
            .mr(1).nr(8).kr(1).sr(4)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
      }
    }
  }
}
918*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 8, 12, ..., 40 (step 4) with m = 1 and n = 8.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, k_div_4) {
  for (size_t k_size = 8; k_size <= 40; k_size += 4) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(4)
        .m(1).n(8).k(k_size)
        .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
  }
}
932*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 8, 12, ..., 40 (step 4) with a_stride set to 43.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, k_div_4_strided_a) {
  for (size_t k_size = 8; k_size <= 40; k_size += 4) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(4)
        .m(1).n(8).k(k_size)
        .a_stride(43)
        .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
  }
}
947*4bdc9457SAndroid Build Coastguard Worker
// For k in 8, 12, ..., 40, runs every n in 1..8 (and the single m value 1)
// with one tester iteration per configuration.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, k_div_4_subtile) {
  for (size_t k_size = 8; k_size <= 40; k_size += 4) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      // The m range is 1..1, so this loop body executes once.
      for (uint32_t m_size = 1; m_size <= 1; ++m_size) {
        GemmMicrokernelTester()
            .mr(1).nr(8).kr(1).sr(4)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
      }
    }
  }
}
966*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15 and, for each n, k over 1, 6, 11, 16 with m = 1.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, n_gt_8) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(4)
          .m(1).n(n_size).k(k_size)
          .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
    }
  }
}
982*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15 and k over 1, 6, 11, 16 with cn_stride set to 11.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, n_gt_8_strided_cn) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(4)
          .m(1).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
    }
  }
}
999*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (n = 9..15, k in {1, 6, 11, 16}, m = 1), but with
// a_stride set to 23 on the tester (greater than the largest k used, 16).
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, n_gt_8_strided_a) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(1)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
    }
  }
}
1016*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 9..15, k in {1, 6, 11, 16} and every m up to mr with
// iterations(1). Because mr is 1 for this kernel, the m loop runs once.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
      }
    }
  }
}
1035*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd with n in {16, 24}
// (multiples of nr = 8) and k in {1, 6, 11, 16}, keeping m fixed at 1.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(1)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
    }
  }
}
1051*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (n in {16, 24}, k in {1, 6, 11, 16}, m = 1), but with
// cn_stride set to 11 on the tester.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(1)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
    }
  }
}
1068*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (n in {16, 24}, k in {1, 6, 11, 16}, m = 1), but with
// a_stride set to 23 on the tester (greater than the largest k used, 16).
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(1)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
    }
  }
}
1085*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in {16, 24}, k in {1, 6, 11, 16} and every m up to mr with
// iterations(1). Because mr is 1 for this kernel, the m loop runs once.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
      }
    }
  }
}
1104*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k in {1, 6, 11, 16}, n = 1..8 and m = 1 (mr is 1, so the m loop runs
// once) with cm_stride(11) and iterations(1).
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, strided_cm_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
      }
    }
  }
}
1124*4bdc9457SAndroid Build Coastguard Worker
// Single run of xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd at m = 1, n = 8,
// k = 4 with cm_stride set to 11 on the tester.
TEST(F32_GEMM_RELU_1X8S4__WASMSIMD, strided_cm) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(1)
    .n(8)
    .k(4)
    .cm_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd);
}
1137*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
1138*4bdc9457SAndroid Build Coastguard Worker
1139*4bdc9457SAndroid Build Coastguard Worker
1140*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Single run of xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat on a full tile:
// m = mr = 4, n = nr = 8, k = 4.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, k_eq_4) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(4)
    .n(8)
    .k(4)
    .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
}
1152*4bdc9457SAndroid Build Coastguard Worker
// Full-tile run (m = 4, n = 8, k = 4) of the 4x8 splat kernel with cn_stride
// set to 11 on the tester.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(4)
    .n(8)
    .k(4)
    .cn_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
}
1165*4bdc9457SAndroid Build Coastguard Worker
// Full-tile run (m = 4, n = 8, k = 4) of the 4x8 splat kernel with a_stride
// set to 7 on the tester (greater than k = 4).
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, k_eq_4_strided_a) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(4)
    .n(8)
    .k(4)
    .a_stride(7)
    .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
}
1178*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8 splat kernel at k = 4 for every (m, n) pair with m = 1..4 and
// n = 1..8, using iterations(1) for each combination.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, k_eq_4_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 4; m++) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
    }
  }
}
1195*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8 splat kernel at k = 4 and n = 8 while varying only m over 1..4,
// using iterations(1) for each value.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, k_eq_4_subtile_m) {
  for (uint32_t m = 1; m <= 4; m++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(m)
      .n(8)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
  }
}
1210*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8 splat kernel at k = 4 and m = 4 while varying only n over 1..8,
// using iterations(1) for each value.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, k_eq_4_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(n)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
  }
}
1225*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8 splat kernel on a full 4x8 tile for k = 1, 2, 3 (below 4).
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, k_lt_4) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
  }
}
1239*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8 splat kernel on a full 4x8 tile for k = 1, 2, 3 with a_stride
// set to 7 on the tester.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, k_lt_4_strided_a) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(8)
      .k(k)
      .a_stride(7)
      .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
  }
}
1254*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8 splat kernel for k = 1, 2, 3 across every (m, n) pair with
// m = 1..4 and n = 1..8, using iterations(1) for each combination.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, k_lt_4_subtile) {
  for (size_t k = 1; k < 4; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
      }
    }
  }
}
1273*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8 splat kernel on a full 4x8 tile for k = 5, 6, 7 (above 4 and
// below 8).
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, k_gt_4) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
  }
}
1287*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8 splat kernel on a full 4x8 tile for k = 5, 6, 7 with a_stride
// set to 11 on the tester.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, k_gt_4_strided_a) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(8)
      .k(k)
      .a_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
  }
}
1302*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8 splat kernel for k = 5, 6, 7 across every (m, n) pair with
// m = 1..4 and n = 1..8, using iterations(1) for each combination.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, k_gt_4_subtile) {
  for (size_t k = 5; k < 8; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
      }
    }
  }
}
1321*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8 splat kernel on a full 4x8 tile for k = 8, 12, ..., 40
// (multiples of 4).
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, k_div_4) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
  }
}
1335*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8 splat kernel on a full 4x8 tile for k = 8, 12, ..., 40 with
// a_stride set to 43 on the tester (greater than the largest k used, 40).
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, k_div_4_strided_a) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(8)
      .k(k)
      .a_stride(43)
      .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
  }
}
1350*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8 splat kernel for k = 8, 12, ..., 40 across every (m, n) pair
// with m = 1..4 and n = 1..8, using iterations(1) for each combination.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, k_div_4_subtile) {
  for (size_t k = 8; k <= 40; k += 4) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
      }
    }
  }
}
1369*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8 splat kernel with n = 9..15 (above nr = 8) and
// k in {1, 6, 11, 16}, keeping m fixed at 4.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
    }
  }
}
1385*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (n = 9..15, k in {1, 6, 11, 16}, m = 4), but with
// cn_stride set to 11 on the tester.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
    }
  }
}
1402*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (n = 9..15, k in {1, 6, 11, 16}, m = 4), but with
// a_stride set to 23 on the tester (greater than the largest k used, 16).
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, n_gt_8_strided_a) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
    }
  }
}
1419*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 9..15, k in {1, 6, 11, 16} and m = 1..4 on the 4x8 splat kernel,
// using iterations(1) for each combination.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
      }
    }
  }
}
1438*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8 splat kernel with n in {16, 24} (multiples of nr = 8) and
// k in {1, 6, 11, 16}, keeping m fixed at 4.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
    }
  }
}
1454*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (n in {16, 24}, k in {1, 6, 11, 16}, m = 4), but with
// cn_stride set to 11 on the tester.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
    }
  }
}
1471*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (n in {16, 24}, k in {1, 6, 11, 16}, m = 4), but with
// a_stride set to 23 on the tester (greater than the largest k used, 16).
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
    }
  }
}
1488*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat for n in {16, 24},
// k in {1, 6, 11, 16} and every m in 1..4, one iteration per combination.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, n_div_8_subtile) {
  for (uint32_t n_value = 16; n_value <= 24; n_value += 8) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      for (uint32_t m_value = 1; m_value <= 4; m_value++) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(m_value).n(n_value).k(k_value)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
      }
    }
  }
}
1507*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat for k in {1, 6, 11, 16},
// every n in 1..8 and every m in 1..4, with cm_stride set to 11 and one
// iteration per combination.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, strided_cm_subtile) {
  for (size_t k_value = 1; k_value <= 20; k_value += 5) {
    for (uint32_t n_value = 1; n_value <= 8; n_value++) {
      for (uint32_t m_value = 1; m_value <= 4; m_value++) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(m_value).n(n_value).k(k_value)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
      }
    }
  }
}
1527*4bdc9457SAndroid Build Coastguard Worker
// Single run of xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat with
// m = 4, n = 8, k = 4 and cm_stride set to 11.
TEST(F32_GEMM_RELU_4X8__WASMSIMD_SPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(4).nr(8).kr(1).sr(1)
    .m(4).n(8).k(4)
    .cm_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmsimd_splat);
}
1540*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
1541*4bdc9457SAndroid Build Coastguard Worker
1542*4bdc9457SAndroid Build Coastguard Worker
1543*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Single run of xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with
// m = 5, n = 8, k = 4.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, k_eq_4) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(1)
    .m(5).n(8).k(4)
    .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
}
1555*4bdc9457SAndroid Build Coastguard Worker
// Single run of xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with
// m = 5, n = 8, k = 4 and cn_stride set to 11.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(1)
    .m(5).n(8).k(4)
    .cn_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
}
1568*4bdc9457SAndroid Build Coastguard Worker
// Single run of xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with
// m = 5, n = 8, k = 4 and a_stride set to 7.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, k_eq_4_strided_a) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(1)
    .m(5).n(8).k(4)
    .a_stride(7)
    .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
}
1581*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with k = 4 for every
// n in 1..8 and every m in 1..5, one iteration per combination.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, k_eq_4_subtile) {
  for (uint32_t n_value = 1; n_value <= 8; n_value++) {
    for (uint32_t m_value = 1; m_value <= 5; m_value++) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(m_value).n(n_value).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
    }
  }
}
1598*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with n = 8 and k = 4
// for every m in 1..5, one iteration each.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, k_eq_4_subtile_m) {
  for (uint32_t m_value = 1; m_value <= 5; m_value++) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(m_value).n(8).k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
  }
}
1613*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with m = 5 and k = 4
// for every n in 1..8, one iteration each.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, k_eq_4_subtile_n) {
  for (uint32_t n_value = 1; n_value <= 8; n_value++) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(n_value).k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
  }
}
1628*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with m = 5 and n = 8
// for each k in 1..3.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, k_lt_4) {
  for (size_t k_value = 1; k_value < 4; k_value++) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(k_value)
      .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
  }
}
1642*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with m = 5, n = 8 and
// a_stride set to 7 for each k in 1..3.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, k_lt_4_strided_a) {
  for (size_t k_value = 1; k_value < 4; k_value++) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(k_value)
      .a_stride(7)
      .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
  }
}
1657*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat for each k in 1..3,
// every n in 1..8 and every m in 1..5, one iteration per combination.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, k_lt_4_subtile) {
  for (size_t k_value = 1; k_value < 4; k_value++) {
    for (uint32_t n_value = 1; n_value <= 8; n_value++) {
      for (uint32_t m_value = 1; m_value <= 5; m_value++) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(m_value).n(n_value).k(k_value)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
      }
    }
  }
}
1676*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with m = 5 and n = 8
// for each k in 5..7.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, k_gt_4) {
  for (size_t k_value = 5; k_value < 8; k_value++) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(k_value)
      .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
  }
}
1690*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with m = 5, n = 8 and
// a_stride set to 11 for each k in 5..7.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, k_gt_4_strided_a) {
  for (size_t k_value = 5; k_value < 8; k_value++) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(k_value)
      .a_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
  }
}
1705*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat for each k in 5..7,
// every n in 1..8 and every m in 1..5, one iteration per combination.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, k_gt_4_subtile) {
  for (size_t k_value = 5; k_value < 8; k_value++) {
    for (uint32_t n_value = 1; n_value <= 8; n_value++) {
      for (uint32_t m_value = 1; m_value <= 5; m_value++) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(m_value).n(n_value).k(k_value)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
      }
    }
  }
}
1724*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with m = 5 and n = 8
// for k = 8, 12, ..., 40 (step 4).
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, k_div_4) {
  for (size_t k_value = 8; k_value <= 40; k_value += 4) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(k_value)
      .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
  }
}
1738*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with m = 5, n = 8 and
// a_stride set to 43 for k = 8, 12, ..., 40 (step 4).
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, k_div_4_strided_a) {
  for (size_t k_value = 8; k_value <= 40; k_value += 4) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(k_value)
      .a_stride(43)
      .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
  }
}
1753*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat for k = 8, 12, ..., 40,
// every n in 1..8 and every m in 1..5, one iteration per combination.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, k_div_4_subtile) {
  for (size_t k_value = 8; k_value <= 40; k_value += 4) {
    for (uint32_t n_value = 1; n_value <= 8; n_value++) {
      for (uint32_t m_value = 1; m_value <= 5; m_value++) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(m_value).n(n_value).k(k_value)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
      }
    }
  }
}
1772*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with m = 5 for every
// n in 9..15 and k in {1, 6, 11, 16}.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, n_gt_8) {
  for (uint32_t n_value = 9; n_value < 16; n_value++) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(n_value).k(k_value)
        .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
    }
  }
}
1788*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with m = 5 and
// cn_stride set to 11 for every n in 9..15 and k in {1, 6, 11, 16}.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, n_gt_8_strided_cn) {
  for (uint32_t n_value = 9; n_value < 16; n_value++) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(n_value).k(k_value)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
    }
  }
}
1805*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with m = 5 and
// a_stride set to 23 for every n in 9..15 and k in {1, 6, 11, 16}.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, n_gt_8_strided_a) {
  for (uint32_t n_value = 9; n_value < 16; n_value++) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(n_value).k(k_value)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
    }
  }
}
1822*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat for every n in 9..15,
// k in {1, 6, 11, 16} and every m in 1..5, one iteration per combination.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, n_gt_8_subtile) {
  for (uint32_t n_value = 9; n_value < 16; n_value++) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      for (uint32_t m_value = 1; m_value <= 5; m_value++) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(m_value).n(n_value).k(k_value)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
      }
    }
  }
}
1841*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with m = 5 for
// n in {16, 24} and k in {1, 6, 11, 16}.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, n_div_8) {
  for (uint32_t n_value = 16; n_value <= 24; n_value += 8) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(n_value).k(k_value)
        .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
    }
  }
}
1857*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with m = 5 and
// cn_stride set to 11 for n in {16, 24} and k in {1, 6, 11, 16}.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, n_div_8_strided_cn) {
  for (uint32_t n_value = 16; n_value <= 24; n_value += 8) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(n_value).k(k_value)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
    }
  }
}
1874*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with m = 5 and
// a_stride set to 23 for n in {16, 24} and k in {1, 6, 11, 16}.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, n_div_8_strided_a) {
  for (uint32_t n_value = 16; n_value <= 24; n_value += 8) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(n_value).k(k_value)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
    }
  }
}
1891*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat for n in {16, 24},
// k in {1, 6, 11, 16} and every m in 1..5, one iteration per combination.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, n_div_8_subtile) {
  for (uint32_t n_value = 16; n_value <= 24; n_value += 8) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      for (uint32_t m_value = 1; m_value <= 5; m_value++) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(m_value).n(n_value).k(k_value)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
      }
    }
  }
}
1910*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat for k in {1, 6, 11, 16},
// every n in 1..8 and every m in 1..5, with cm_stride set to 11 and one
// iteration per combination.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, strided_cm_subtile) {
  for (size_t k_value = 1; k_value <= 20; k_value += 5) {
    for (uint32_t n_value = 1; n_value <= 8; n_value++) {
      for (uint32_t m_value = 1; m_value <= 5; m_value++) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(m_value).n(n_value).k(k_value)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
      }
    }
  }
}
1930*4bdc9457SAndroid Build Coastguard Worker
// Single run of xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat with
// m = 5, n = 8, k = 4 and cm_stride set to 11.
TEST(F32_GEMM_RELU_5X8__WASMSIMD_SPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(1)
    .m(5).n(8).k(4)
    .cm_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmsimd_splat);
}
1943*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
1944*4bdc9457SAndroid Build Coastguard Worker
1945*4bdc9457SAndroid Build Coastguard Worker
1946*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Single run of xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat with
// m = 6, n = 8, k = 1.
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, k_eq_1) {
  GemmMicrokernelTester()
    .mr(6).nr(8).kr(1).sr(1)
    .m(6).n(8).k(1)
    .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
}
1958*4bdc9457SAndroid Build Coastguard Worker
// Single run of xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat with
// m = 6, n = 8, k = 1 and cn_stride set to 11.
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(6).nr(8).kr(1).sr(1)
    .m(6).n(8).k(1)
    .cn_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
}
1971*4bdc9457SAndroid Build Coastguard Worker
// Single run of xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat with
// m = 6, n = 8, k = 1 and a_stride set to 3.
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, k_eq_1_strided_a) {
  GemmMicrokernelTester()
    .mr(6).nr(8).kr(1).sr(1)
    .m(6).n(8).k(1)
    .a_stride(3)
    .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
}
1984*4bdc9457SAndroid Build Coastguard Worker
// Sweeps every output shape m in [1, 6] x n in [1, 8] with k = 1, so partial
// tiles are covered as well as the full 6x8 tile. Each combination is run
// with iterations(1).
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 6; m++) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
    }
  }
}

// Varies only the row count: m in [1, 6] with n fixed at 8 and k = 1.
// Each case is run with iterations(1).
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_m) {
  for (uint32_t m = 1; m <= 6; m++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(m)
      .n(8)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
  }
}

// Varies only the column count: n in [1, 8] with m fixed at 6 and k = 1.
// Each case is run with iterations(1).
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(n)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
  }
}

// Full 6x8 tile with k swept over 2..9 (the loop stops before 10).
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, k_gt_1) {
  for (size_t k = 2; k < 10; k++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
  }
}

// Full 6x8 tile with k swept over 2..9 and a_stride(11), which exceeds every
// k value in the sweep.
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, k_gt_1_strided_a) {
  for (size_t k = 2; k < 10; k++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(8)
      .k(k)
      .a_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
  }
}

// Exhaustive sweep of k in 2..9, n in [1, 8] and m in [1, 6]; each
// combination is run with iterations(1).
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, k_gt_1_subtile) {
  for (size_t k = 2; k < 10; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
      }
    }
  }
}

// Column counts above one tile width: n in 9..15 (more than nr = 8, less than
// 2 * nr), m = 6, with k taking the values 1, 3 and 5.
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
    }
  }
}

// Same sweep as n_gt_8 (n in 9..15, k in {1, 3, 5}, m = 6), additionally
// setting cn_stride(11), a value larger than nr = 8.
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
    }
  }
}

// Same sweep as n_gt_8 (n in 9..15, k in {1, 3, 5}, m = 6), additionally
// setting a_stride(7), which exceeds the largest k in the sweep (5).
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_a) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .a_stride(7)
        .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
    }
  }
}

// n in 9..15 and k in {1, 3, 5}, combined with every row count m in [1, 6].
// Each combination is run with iterations(1).
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
      }
    }
  }
}

// Column counts that are whole multiples of nr = 8: n takes the values 16 and
// 24, with m = 6 and k in {1, 3, 5}.
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
    }
  }
}

// Same sweep as n_div_8 (n in {16, 24}, k in {1, 3, 5}, m = 6), additionally
// setting cn_stride(11), a value larger than nr = 8.
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
    }
  }
}

// Same sweep as n_div_8 (n in {16, 24}, k in {1, 3, 5}, m = 6), additionally
// setting a_stride(7), which exceeds the largest k in the sweep (5).
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .a_stride(7)
        .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
    }
  }
}

// n in {16, 24} and k in {1, 3, 5}, combined with every row count m in
// [1, 6]. Each combination is run with iterations(1).
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
      }
    }
  }
}

// Sweeps k in {1, 3, 5}, n in [1, 8] and m in [1, 6] with cm_stride(11), a
// value larger than nr = 8. Each combination is run with iterations(1).
// NOTE(review): cm_stride is presumably the row stride of the output matrix
// in elements -- confirm in gemm-microkernel-tester.h.
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, strided_cm_subtile) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
      }
    }
  }
}

// Full 6x8 tile with k = 1, run with cm_stride(11), a value larger than
// nr = 8.
TEST(F32_GEMM_RELU_6X8__WASMSIMD_LOADSPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(6)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(6)
    .n(8)
    .k(1)
    .cm_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmsimd_loadsplat);
}
#endif  // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD


#if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Full-tile case: runs xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd through
// GemmMicrokernelTester with m = mr = 6, n = nr = 8 and k = 4 (the same value
// as the sr(4) setting).
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, k_eq_4) {
  GemmMicrokernelTester()
    .mr(6)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(6)
    .n(8)
    .k(4)
    .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
}

// Full 6x8 tile with k = 4, run with cn_stride(11), a value larger than
// nr = 8.
// NOTE(review): cn_stride is presumably the distance between consecutive
// nr-wide column tiles of the output -- confirm in gemm-microkernel-tester.h.
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, strided_cn) {
  GemmMicrokernelTester()
    .mr(6)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(6)
    .n(8)
    .k(4)
    .cn_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
}

// Full 6x8 tile with k = 4, run with a_stride(7), a value larger than k.
// NOTE(review): a_stride is presumably the row stride of the A input in
// elements -- confirm in gemm-microkernel-tester.h.
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, k_eq_4_strided_a) {
  GemmMicrokernelTester()
    .mr(6)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(6)
    .n(8)
    .k(4)
    .a_stride(7)
    .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
}

// Sweeps every output shape m in [1, 6] x n in [1, 8] with k = 4, so partial
// tiles are covered as well as the full 6x8 tile. Each combination is run
// with iterations(1).
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, k_eq_4_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 6; m++) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(m)
        .n(n)
        .k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
    }
  }
}

// Varies only the row count: m in [1, 6] with n fixed at 8 and k = 4.
// Each case is run with iterations(1).
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, k_eq_4_subtile_m) {
  for (uint32_t m = 1; m <= 6; m++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(m)
      .n(8)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
  }
}

// Varies only the column count: n in [1, 8] with m fixed at 6 and k = 4.
// Each case is run with iterations(1).
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, k_eq_4_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(6)
      .n(n)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
  }
}

// Full 6x8 tile with k swept over 1..3, i.e. every k below 4.
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, k_lt_4) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(6)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
  }
}

// Full 6x8 tile with k swept over 1..3 and a_stride(7), which exceeds every
// k value in the sweep.
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, k_lt_4_strided_a) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(6)
      .n(8)
      .k(k)
      .a_stride(7)
      .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
  }
}

// Exhaustive sweep of k in 1..3, n in [1, 8] and m in [1, 6]; each
// combination is run with iterations(1).
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, k_lt_4_subtile) {
  for (size_t k = 1; k < 4; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
      }
    }
  }
}

// Full 6x8 tile with k swept over 5..7 (above 4, below 8).
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, k_gt_4) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(6)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
  }
}

// Full 6x8 tile with k swept over 5..7 and a_stride(11), which exceeds every
// k value in the sweep.
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, k_gt_4_strided_a) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(6)
      .n(8)
      .k(k)
      .a_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
  }
}

// Exhaustive sweep of k in 5..7, n in [1, 8] and m in [1, 6]; each
// combination is run with iterations(1).
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, k_gt_4_subtile) {
  for (size_t k = 5; k < 8; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
      }
    }
  }
}

// Full 6x8 tile with k taking every multiple of 4 from 8 through 40.
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, k_div_4) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(6)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
  }
}

// Full 6x8 tile with k taking every multiple of 4 from 8 through 40 and
// a_stride(43), which exceeds the largest k in the sweep (40).
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, k_div_4_strided_a) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(6)
      .n(8)
      .k(k)
      .a_stride(43)
      .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
  }
}

// For every k in {8, 12, ..., 40}, runs the 6x8s4 microkernel on every
// sub-tile size m in [1, 6] and n in [1, 8]. Each combination uses a single
// tester iteration.
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, k_div_4_subtile) {
  for (size_t k = 8; k <= 40; k += 4) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
      }
    }
  }
}
2482*4bdc9457SAndroid Build Coastguard Worker
// Runs the 6x8s4 microkernel with n in [9, 15] (more than nr = 8 but less
// than 2 * nr) and k in {1, 6, 11, 16}, using all 6 rows.
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(6)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
    }
  }
}
2498*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (n in [9, 15], k in {1, 6, 11, 16}, m = 6), with
// cn_stride set to 11.
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(6)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
    }
  }
}
2515*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (n in [9, 15], k in {1, 6, 11, 16}, m = 6), with
// a_stride set to 23 (larger than the largest k tested).
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, n_gt_8_strided_a) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(6)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
    }
  }
}
2532*4bdc9457SAndroid Build Coastguard Worker
// For n in [9, 15] and k in {1, 6, 11, 16}, runs the 6x8s4 microkernel with
// every row count m in [1, 6]. Each combination uses a single tester
// iteration.
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
      }
    }
  }
}
2551*4bdc9457SAndroid Build Coastguard Worker
// Runs the 6x8s4 microkernel with n in {16, 24} (multiples of nr = 8) and
// k in {1, 6, 11, 16}, using all 6 rows.
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(6)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
    }
  }
}
2567*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (n in {16, 24}, k in {1, 6, 11, 16}, m = 6), with
// cn_stride set to 11.
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(6)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
    }
  }
}
2584*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (n in {16, 24}, k in {1, 6, 11, 16}, m = 6), with
// a_stride set to 23 (larger than the largest k tested).
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(6)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
    }
  }
}
2601*4bdc9457SAndroid Build Coastguard Worker
// For n in {16, 24} and k in {1, 6, 11, 16}, runs the 6x8s4 microkernel with
// every row count m in [1, 6]. Each combination uses a single tester
// iteration.
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
      }
    }
  }
}
2620*4bdc9457SAndroid Build Coastguard Worker
// For k in {1, 6, 11, 16}, runs the 6x8s4 microkernel on every sub-tile size
// m in [1, 6] and n in [1, 8] with cm_stride set to 11. Each combination uses
// a single tester iteration.
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, strided_cm_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
      }
    }
  }
}
2640*4bdc9457SAndroid Build Coastguard Worker
// Runs the 6x8s4 microkernel once on a full 6x8 tile with k = 4 and
// cm_stride set to 11.
TEST(F32_GEMM_RELU_6X8S4__WASMSIMD, strided_cm) {
  GemmMicrokernelTester()
    .mr(6)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(6)
    .n(8)
    .k(4)
    .cm_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_6x8s4__wasmsimd);
}
2653*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
2654*4bdc9457SAndroid Build Coastguard Worker
2655*4bdc9457SAndroid Build Coastguard Worker
2656*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// Runs the 1x8 WASM relaxed-SIMD FMA splat GEMM+ReLU microkernel once on a
// full 1x8 tile with k = 4.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(1)
    .n(8)
    .k(4)
    .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
}
2668*4bdc9457SAndroid Build Coastguard Worker
// Runs the 1x8 microkernel once on a full 1x8 tile with k = 4 and cn_stride
// set to 11.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(1)
    .n(8)
    .k(4)
    .cn_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
}
2681*4bdc9457SAndroid Build Coastguard Worker
// Runs the 1x8 microkernel once on a full 1x8 tile with k = 4 and a_stride
// set to 7 (larger than k).
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_strided_a) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(1)
    .n(8)
    .k(4)
    .a_stride(7)
    .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
}
2694*4bdc9457SAndroid Build Coastguard Worker
// With k = 4, runs the 1x8 microkernel for every n in [1, 8]. The m loop is
// bounded by mr = 1, so it executes exactly once (m = 1). Each combination
// uses a single tester iteration.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 1; m++) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
2711*4bdc9457SAndroid Build Coastguard Worker
// With k = 4 and n = 8, runs the 1x8 microkernel for every m in [1, 1]; the
// loop is bounded by mr = 1 and so executes exactly once. Uses a single
// tester iteration.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_m) {
  for (uint32_t m = 1; m <= 1; m++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(m)
      .n(8)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
  }
}
2726*4bdc9457SAndroid Build Coastguard Worker
// With k = 4 and m = 1, runs the 1x8 microkernel for every n in [1, 8].
// Each n uses a single tester iteration.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(n)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
  }
}
2741*4bdc9457SAndroid Build Coastguard Worker
// Runs the 1x8 microkernel on a full 1x8 tile for every k in [1, 3].
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
  }
}
2755*4bdc9457SAndroid Build Coastguard Worker
// Runs the 1x8 microkernel on a full 1x8 tile for every k in [1, 3] with
// a_stride set to 7 (larger than the largest k tested).
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4_strided_a) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(8)
      .k(k)
      .a_stride(7)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
  }
}
2770*4bdc9457SAndroid Build Coastguard Worker
// For every k in [1, 3], runs the 1x8 microkernel for every n in [1, 8].
// The m loop is bounded by mr = 1, so it executes exactly once (m = 1).
// Each combination uses a single tester iteration.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4_subtile) {
  for (size_t k = 1; k < 4; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
2789*4bdc9457SAndroid Build Coastguard Worker
// Runs the 1x8 microkernel on a full 1x8 tile for every k in [5, 7].
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
  }
}
2803*4bdc9457SAndroid Build Coastguard Worker
// Runs the 1x8 microkernel on a full 1x8 tile for every k in [5, 7] with
// a_stride set to 11 (larger than the largest k tested).
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4_strided_a) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(8)
      .k(k)
      .a_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
  }
}
2818*4bdc9457SAndroid Build Coastguard Worker
// For every k in [5, 7], runs the 1x8 microkernel for every n in [1, 8].
// The m loop is bounded by mr = 1, so it executes exactly once (m = 1).
// Each combination uses a single tester iteration.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4_subtile) {
  for (size_t k = 5; k < 8; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
2837*4bdc9457SAndroid Build Coastguard Worker
// Runs the 1x8 microkernel on a full 1x8 tile for every k in
// {8, 12, ..., 40} (multiples of 4).
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
  }
}
2851*4bdc9457SAndroid Build Coastguard Worker
// Same k sweep as k_div_4 ({8, 12, ..., 40}) on a full 1x8 tile, but with
// a_stride set to 43 (larger than the largest k tested).
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4_strided_a) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(1)
      .n(8)
      .k(k)
      .a_stride(43)
      .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
  }
}
2866*4bdc9457SAndroid Build Coastguard Worker
// For every k in {8, 12, ..., 40}, runs the 1x8 microkernel for every n in
// [1, 8]. The m loop is bounded by mr = 1, so it executes exactly once
// (m = 1). Each combination uses a single tester iteration.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4_subtile) {
  for (size_t k = 8; k <= 40; k += 4) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
2885*4bdc9457SAndroid Build Coastguard Worker
// Runs the 1x8 microkernel with n in [9, 15] (more than nr = 8 but less than
// 2 * nr) and k in {1, 6, 11, 16}, with m = 1.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
2901*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (n in [9, 15], k in {1, 6, 11, 16}, m = 1), with
// cn_stride set to 11.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
2918*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (n in [9, 15], k in {1, 6, 11, 16}, m = 1), with
// a_stride set to 23 (larger than the largest k tested).
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_strided_a) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
2935*4bdc9457SAndroid Build Coastguard Worker
// For n in [9, 15] and k in {1, 6, 11, 16}, runs the 1x8 microkernel inside
// an m loop bounded by mr = 1, so it executes exactly once (m = 1). Each
// combination uses a single tester iteration.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
2954*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat with m = 1,
// n in {16, 24} and k in {1, 6, 11, 16}.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
2970*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat with m = 1,
// n in {16, 24} and k in {1, 6, 11, 16}, with cn_stride set to 11.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
2987*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat with m = 1,
// n in {16, 24} and k in {1, 6, 11, 16}, with a_stride set to 23.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
3004*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat for
// n in {16, 24} and k in {1, 6, 11, 16}, one iteration per configuration.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      // The m loop covers 1..mr; with mr = 1 it runs exactly once.
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
3023*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat for
// k in {1, 6, 11, 16} and n = 1..8 with cm_stride set to 11, one iteration
// per configuration.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 8; n++) {
      // The m loop covers 1..mr; with mr = 1 it runs exactly once.
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
3043*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat once with
// m = 1, n = 8, k = 4 and cm_stride set to 11.
TEST(F32_GEMM_RELU_1X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(1)
    .n(8)
    .k(4)
    .cm_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_1x8__wasmrelaxedsimd_fma_splat);
}
3056*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
3057*4bdc9457SAndroid Build Coastguard Worker
3058*4bdc9457SAndroid Build Coastguard Worker
3059*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat once with
// m = 3, n = 8, k = 4.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(3)
    .n(8)
    .k(4)
    .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
}
3071*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat once with
// m = 3, n = 8, k = 4 and cn_stride set to 11.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(3)
    .n(8)
    .k(4)
    .cn_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
}
3084*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat once with
// m = 3, n = 8, k = 4 and a_stride set to 7.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_strided_a) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(3)
    .n(8)
    .k(4)
    .a_stride(7)
    .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
}
3097*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat with k = 4
// for every (m, n) with m = 1..3 and n = 1..8, one iteration each.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 3; m++) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
3114*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat with n = 8,
// k = 4 and m = 1..3, one iteration each.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_m) {
  for (uint32_t m = 1; m <= 3; m++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(m)
      .n(8)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
  }
}
3129*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat with m = 3,
// k = 4 and n = 1..8, one iteration each.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(3)
      .n(n)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
  }
}
3144*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat with m = 3,
// n = 8 and k = 1..3.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(3)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
  }
}
3158*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat with m = 3,
// n = 8 and k = 1..3, with a_stride set to 7.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4_strided_a) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(3)
      .n(8)
      .k(k)
      .a_stride(7)
      .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
  }
}
3173*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat for
// k = 1..3, n = 1..8 and m = 1..3, one iteration per configuration.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4_subtile) {
  for (size_t k = 1; k < 4; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
3192*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat with m = 3,
// n = 8 and k = 5..7.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(3)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
  }
}
3206*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat with m = 3,
// n = 8 and k = 5..7, with a_stride set to 11.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4_strided_a) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(3)
      .n(8)
      .k(k)
      .a_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
  }
}
3221*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat for
// k = 5..7, n = 1..8 and m = 1..3, one iteration per configuration.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4_subtile) {
  for (size_t k = 5; k < 8; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
3240*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat with m = 3,
// n = 8 and k = 8, 12, ..., 40.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(3)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
  }
}
3254*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat with m = 3,
// n = 8 and k = 8, 12, ..., 40, with a_stride set to 43.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4_strided_a) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(3)
      .n(8)
      .k(k)
      .a_stride(43)
      .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
  }
}
3269*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat for
// k = 8, 12, ..., 40, n = 1..8 and m = 1..3, one iteration per configuration.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4_subtile) {
  for (size_t k = 8; k <= 40; k += 4) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
3288*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat with m = 3,
// n = 9..15 and k in {1, 6, 11, 16}.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(3)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
3304*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat with m = 3,
// n = 9..15 and k in {1, 6, 11, 16}, with cn_stride set to 11.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(3)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
3321*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat with m = 3,
// n = 9..15 and k in {1, 6, 11, 16}, with a_stride set to 23.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_strided_a) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(3)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
3338*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat for
// n = 9..15, k in {1, 6, 11, 16} and m = 1..3, one iteration per
// configuration.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
3357*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat with m = 3,
// n in {16, 24} and k in {1, 6, 11, 16}.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(3)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
3373*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat with m = 3,
// n in {16, 24} and k in {1, 6, 11, 16}, with cn_stride set to 11.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(3)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
3390*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat with m = 3,
// n in {16, 24} and k in {1, 6, 11, 16}, with a_stride set to 23.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(3)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
3407*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat for
// n in {16, 24}, k in {1, 6, 11, 16} and m = 1..3, one iteration per
// configuration.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
3426*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat for every
// (m, n) with m in 1..3 and n in 1..8, k in {1, 6, 11, 16}, with the tester's
// cm_stride set to 11 (larger than nr=8) and iterations(1) per configuration.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
3446*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat on a single
// full tile (m=3, n=8, k=4) with the tester's cm_stride set to 11.
TEST(F32_GEMM_RELU_3X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(3)
    .n(8)
    .k(4)
    .cm_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat);
}
3459*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
3460*4bdc9457SAndroid Build Coastguard Worker
3461*4bdc9457SAndroid Build Coastguard Worker
3462*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma on a single full
// tile (m=3, n=8) with k=4 and default strides.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_eq_4) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(3)
    .n(8)
    .k(4)
    .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
}
3474*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma on a single full
// tile (m=3, n=8, k=4) with the tester's cn_stride set to 11.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, strided_cn) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(3)
    .n(8)
    .k(4)
    .cn_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
}
3487*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma on a single full
// tile (m=3, n=8, k=4) with the tester's a_stride set to 7 (larger than k).
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_strided_a) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(3)
    .n(8)
    .k(4)
    .a_stride(7)
    .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
}
3500*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma with k=4 for every
// (m, n) with m in 1..3 and n in 1..8, using iterations(1) per configuration.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 3; m++) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(m)
        .n(n)
        .k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
3517*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma with k=4 and full
// n=8 while sweeping m over 1..3, using iterations(1) per configuration.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_m) {
  for (uint32_t m = 1; m <= 3; m++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(m)
      .n(8)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
3532*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma with k=4 and full
// m=3 while sweeping n over 1..8, using iterations(1) per configuration.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(n)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
3547*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma on a full tile
// (m=3, n=8) for k in {1, 2, 3}, i.e. every k below 4.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_lt_4) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
3561*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma on a full tile
// (m=3, n=8) for k in {1, 2, 3} with the tester's a_stride set to 7.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_strided_a) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .a_stride(7)
      .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
3576*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma for k in {1, 2, 3}
// across every (m, n) with m in 1..3 and n in 1..8, using iterations(1) per
// configuration.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_subtile) {
  for (size_t k = 1; k < 4; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
3595*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma on a full tile
// (m=3, n=8) for k in {5, 6, 7}, i.e. k strictly between 4 and 8.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_gt_4) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
3609*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma on a full tile
// (m=3, n=8) for k in {5, 6, 7} with the tester's a_stride set to 11.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_strided_a) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .a_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
3624*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma for k in {5, 6, 7}
// across every (m, n) with m in 1..3 and n in 1..8, using iterations(1) per
// configuration.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_subtile) {
  for (size_t k = 5; k < 8; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
3643*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma on a full tile
// (m=3, n=8) for k = 8, 12, ..., 40 (multiples of 4).
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_div_4) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
3657*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma on a full tile
// (m=3, n=8) for k = 8, 12, ..., 40 with the tester's a_stride set to 43
// (larger than the largest k tested).
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_div_4_strided_a) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .a_stride(43)
      .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
3672*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma for
// k = 8, 12, ..., 40 across every (m, n) with m in 1..3 and n in 1..8, using
// iterations(1) per configuration.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, k_div_4_subtile) {
  for (size_t k = 8; k <= 40; k += 4) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
3691*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma with full m=3 for
// n in 9..15 (strictly between nr=8 and 16) and k in {1, 6, 11, 16}.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
3707*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma with full m=3 for
// n in 9..15 and k in {1, 6, 11, 16}, with the tester's cn_stride set to 11.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
3724*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma with full m=3 for
// n in 9..15 and k in {1, 6, 11, 16}, with the tester's a_stride set to 23
// (larger than every k tested).
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_a) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
3741*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma for n in 9..15 and
// k in {1, 6, 11, 16} while sweeping m over 1..3, using iterations(1) per
// configuration.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
3760*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma with full m=3 for
// n in {16, 24} (multiples of nr=8) and k in {1, 6, 11, 16}.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
3776*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma with full m=3 for
// n in {16, 24} and k in {1, 6, 11, 16}, with the tester's cn_stride set to 11.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
3793*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma with full m=3 for
// n in {16, 24} and k in {1, 6, 11, 16}, with the tester's a_stride set to 23
// (larger than every k tested).
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
3810*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma for n in {16, 24}
// and k in {1, 6, 11, 16} while sweeping m over 1..3, using iterations(1) per
// configuration.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
3829*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma for every (m, n)
// with m in 1..3 and n in 1..8, k in {1, 6, 11, 16}, with the tester's
// cm_stride set to 11 (larger than nr=8) and iterations(1) per configuration.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, strided_cm_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
3849*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma on a single full
// tile (m=3, n=8, k=4) with the tester's cm_stride set to 11.
TEST(F32_GEMM_RELU_3X8S4__WASMRELAXEDSIMD_FMA, strided_cm) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(3)
    .n(8)
    .k(4)
    .cm_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_3x8s4__wasmrelaxedsimd_fma);
}
3862*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
3863*4bdc9457SAndroid Build Coastguard Worker
3864*4bdc9457SAndroid Build Coastguard Worker
3865*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// Runs xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat on a single
// full tile (m=4, n=8) with k=4 and default strides.
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(4)
    .n(8)
    .k(4)
    .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
}
3877*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat on a single
// full tile (m=4, n=8, k=4) with the tester's cn_stride set to 11.
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(4)
    .n(8)
    .k(4)
    .cn_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
}
3890*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat on a single
// full tile (m=4, n=8, k=4) with the tester's a_stride set to 7 (larger than k).
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_strided_a) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(4)
    .n(8)
    .k(4)
    .a_stride(7)
    .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
}
3903*4bdc9457SAndroid Build Coastguard Worker
// Sweeps every (m, n) pair with 1 <= m <= 4 and 1 <= n <= 8 at k=4.
// Each configuration is run with iterations(1).
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 4; m++) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
3920*4bdc9457SAndroid Build Coastguard Worker
// Sweeps m over 1..4 with n fixed at 8 and k fixed at 4.
// Each configuration is run with iterations(1).
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_m) {
  for (uint32_t m = 1; m <= 4; m++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(m)
      .n(8)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
  }
}
3935*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 1..8 with m fixed at 4 and k fixed at 4.
// Each configuration is run with iterations(1).
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(n)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
  }
}
3950*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 1..3 (all values below 4) with m=4 and n=8.
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
  }
}
3964*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 1..3 with m=4 and n=8, with a_stride explicitly set to 7.
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4_strided_a) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(8)
      .k(k)
      .a_stride(7)
      .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
  }
}
3979*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 1..3 and, for each k, every (m, n) pair with 1 <= m <= 4 and
// 1 <= n <= 8. Each configuration is run with iterations(1).
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4_subtile) {
  for (size_t k = 1; k < 4; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
3998*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 5..7 (values strictly between 4 and 8) with m=4 and n=8.
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
  }
}
4012*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 5..7 with m=4 and n=8, with a_stride explicitly set to 11.
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4_strided_a) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(8)
      .k(k)
      .a_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
  }
}
4027*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 5..7 and, for each k, every (m, n) pair with 1 <= m <= 4 and
// 1 <= n <= 8. Each configuration is run with iterations(1).
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4_subtile) {
  for (size_t k = 5; k < 8; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
4046*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over the multiples of 4 from 8 to 40 inclusive, with m=4 and n=8.
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
  }
}
4060*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over the multiples of 4 from 8 to 40 inclusive, with m=4 and n=8
// and a_stride explicitly set to 43.
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4_strided_a) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(8)
      .k(k)
      .a_stride(43)
      .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
  }
}
4075*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over the multiples of 4 from 8 to 40 inclusive and, for each k,
// every (m, n) pair with 1 <= m <= 4 and 1 <= n <= 8. Each configuration is
// run with iterations(1).
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4_subtile) {
  for (size_t k = 8; k <= 40; k += 4) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
4094*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15 (strictly between 8 and 16) and k over {1, 6, 11, 16},
// with m fixed at 4.
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
4110*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15 and k over {1, 6, 11, 16} with m fixed at 4 and
// cn_stride explicitly set to 11.
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
4127*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15 and k over {1, 6, 11, 16} with m fixed at 4 and
// a_stride explicitly set to 23.
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_strided_a) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
4144*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 9..15, k over {1, 6, 11, 16}, and m over 1..4.
// Each configuration is run with iterations(1).
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
4163*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over {16, 24} (multiples of 8) and k over {1, 6, 11, 16}, with m
// fixed at 4.
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
4179*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over {16, 24} and k over {1, 6, 11, 16} with m fixed at 4 and
// cn_stride explicitly set to 11.
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
4196*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over {16, 24} and k over {1, 6, 11, 16} with m fixed at 4 and
// a_stride explicitly set to 23.
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
4213*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over {16, 24}, k over {1, 6, 11, 16}, and m over 1..4.
// Each configuration is run with iterations(1).
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
4232*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over {1, 6, 11, 16} and every (m, n) pair with 1 <= m <= 4 and
// 1 <= n <= 8, with cm_stride explicitly set to 11. Each configuration is run
// with iterations(1).
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
4252*4bdc9457SAndroid Build Coastguard Worker
// Single tester configuration: m=4, n=8, k=4 (mr=4, nr=8, kr=1, sr=1), with
// cm_stride explicitly set to 11.
TEST(F32_GEMM_RELU_4X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(4)
    .n(8)
    .k(4)
    .cm_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_4x8__wasmrelaxedsimd_fma_splat);
}
4265*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
4266*4bdc9457SAndroid Build Coastguard Worker
4267*4bdc9457SAndroid Build Coastguard Worker
4268*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// Single tester configuration: m=4, n=8, k=4 (mr=4, nr=8, kr=1, sr=4), with
// no stride overrides.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_eq_4) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(4)
    .n(8)
    .k(4)
    .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
}
4280*4bdc9457SAndroid Build Coastguard Worker
// Single tester configuration: m=4, n=8, k=4 (mr=4, nr=8, kr=1, sr=4), with
// cn_stride explicitly set to 11.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, strided_cn) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(4)
    .n(8)
    .k(4)
    .cn_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
}
4293*4bdc9457SAndroid Build Coastguard Worker
// Single tester configuration: m=4, n=8, k=4 (mr=4, nr=8, kr=1, sr=4), with
// a_stride explicitly set to 7.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_strided_a) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(4)
    .n(8)
    .k(4)
    .a_stride(7)
    .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
}
4306*4bdc9457SAndroid Build Coastguard Worker
// Sweeps every (m, n) pair with 1 <= m <= 4 and 1 <= n <= 8 at k=4 (sr=4).
// Each configuration is run with iterations(1).
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 4; m++) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(m)
        .n(n)
        .k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4323*4bdc9457SAndroid Build Coastguard Worker
// Sweeps m over 1..4 with n fixed at 8 and k fixed at 4 (sr=4).
// Each configuration is run with iterations(1).
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_m) {
  for (uint32_t m = 1; m <= 4; m++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(m)
      .n(8)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
4338*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n over 1..8 with m fixed at 4 and k fixed at 4 (sr=4).
// Each configuration is run with iterations(1).
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(4)
      .n(n)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
4353*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 1..3 (all values below 4) with m=4 and n=8 (sr=4).
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_lt_4) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(4)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
4367*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k over 1..3 with m=4 and n=8 (sr=4), with a_stride explicitly set
// to 7.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_strided_a) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(4)
      .n(8)
      .k(k)
      .a_stride(7)
      .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
4382*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k in {1, 2, 3} against every n in [1, 8] and m in [1, 4],
// one iteration per combination.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_subtile) {
  for (size_t kc = 1; kc < 4; ++kc) {
    for (uint32_t nc = 1; nc <= 8; ++nc) {
      for (uint32_t mc = 1; mc <= 4; ++mc) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(mc).n(nc).k(kc)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4401*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8s4 ukernel with m=4, n=8 for every k in {5, 6, 7}.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_gt_4) {
  for (size_t kc = 5; kc < 8; ++kc) {
    GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(8).k(kc)
      .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
4415*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as k_gt_4 (k in {5, 6, 7}, m=4, n=8) but with a_stride set to 11.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_strided_a) {
  for (size_t kc = 5; kc < 8; ++kc) {
    GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(8).k(kc)
      .a_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
4430*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k in {5, 6, 7} against every n in [1, 8] and m in [1, 4],
// one iteration per combination.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_subtile) {
  for (size_t kc = 5; kc < 8; ++kc) {
    for (uint32_t nc = 1; nc <= 8; ++nc) {
      for (uint32_t mc = 1; mc <= 4; ++mc) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(mc).n(nc).k(kc)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4449*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8s4 ukernel with m=4, n=8 for k = 8, 12, ..., 40.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_div_4) {
  for (size_t kc = 8; kc <= 40; kc += 4) {
    GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(8).k(kc)
      .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
4463*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as k_div_4 (k = 8, 12, ..., 40; m=4, n=8) but with a_stride set to 43.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_div_4_strided_a) {
  for (size_t kc = 8; kc <= 40; kc += 4) {
    GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(8).k(kc)
      .a_stride(43)
      .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
4478*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 8, 12, ..., 40 against every n in [1, 8] and m in [1, 4],
// one iteration per combination.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, k_div_4_subtile) {
  for (size_t kc = 8; kc <= 40; kc += 4) {
    for (uint32_t nc = 1; nc <= 8; ++nc) {
      for (uint32_t mc = 1; mc <= 4; ++mc) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(mc).n(nc).k(kc)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4497*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8s4 ukernel with m=4 for every n in [9, 15] and k = 1, 6, 11, 16.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, n_gt_8) {
  for (uint32_t nc = 9; nc < 16; ++nc) {
    for (size_t kc = 1; kc <= 20; kc += 5) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(nc).k(kc)
        .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4513*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (n in [9, 15], k = 1, 6, 11, 16, m=4) but with
// cn_stride set to 11.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_cn) {
  for (uint32_t nc = 9; nc < 16; ++nc) {
    for (size_t kc = 1; kc <= 20; kc += 5) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(nc).k(kc)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4530*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (n in [9, 15], k = 1, 6, 11, 16, m=4) but with
// a_stride set to 23.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_a) {
  for (uint32_t nc = 9; nc < 16; ++nc) {
    for (size_t kc = 1; kc <= 20; kc += 5) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(nc).k(kc)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4547*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in [9, 15], k = 1, 6, 11, 16 and m in [1, 4],
// one iteration per combination.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_subtile) {
  for (uint32_t nc = 9; nc < 16; ++nc) {
    for (size_t kc = 1; kc <= 20; kc += 5) {
      for (uint32_t mc = 1; mc <= 4; ++mc) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(mc).n(nc).k(kc)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4566*4bdc9457SAndroid Build Coastguard Worker
// Runs the 4x8s4 ukernel with m=4 for n in {16, 24} and k = 1, 6, 11, 16.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, n_div_8) {
  for (uint32_t nc = 16; nc <= 24; nc += 8) {
    for (size_t kc = 1; kc <= 20; kc += 5) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(nc).k(kc)
        .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4582*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (n in {16, 24}, k = 1, 6, 11, 16, m=4) but with
// cn_stride set to 11.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_cn) {
  for (uint32_t nc = 16; nc <= 24; nc += 8) {
    for (size_t kc = 1; kc <= 20; kc += 5) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(nc).k(kc)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4599*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (n in {16, 24}, k = 1, 6, 11, 16, m=4) but with
// a_stride set to 23.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_a) {
  for (uint32_t nc = 16; nc <= 24; nc += 8) {
    for (size_t kc = 1; kc <= 20; kc += 5) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(nc).k(kc)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4616*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in {16, 24}, k = 1, 6, 11, 16 and m in [1, 4],
// one iteration per combination.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, n_div_8_subtile) {
  for (uint32_t nc = 16; nc <= 24; nc += 8) {
    for (size_t kc = 1; kc <= 20; kc += 5) {
      for (uint32_t mc = 1; mc <= 4; ++mc) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(mc).n(nc).k(kc)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4635*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 1, 6, 11, 16 against every n in [1, 8] and m in [1, 4] with
// cm_stride set to 11, one iteration per combination.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, strided_cm_subtile) {
  for (size_t kc = 1; kc <= 20; kc += 5) {
    for (uint32_t nc = 1; nc <= 8; ++nc) {
      for (uint32_t mc = 1; mc <= 4; ++mc) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(mc).n(nc).k(kc)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4655*4bdc9457SAndroid Build Coastguard Worker
// Single run of the 4x8s4 ukernel: m=4, n=8, k=4 with cm_stride set to 11.
TEST(F32_GEMM_RELU_4X8S4__WASMRELAXEDSIMD_FMA, strided_cm) {
  GemmMicrokernelTester()
    .mr(4).nr(8).kr(1).sr(4)
    .m(4).n(8).k(4)
    .cm_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_4x8s4__wasmrelaxedsimd_fma);
}
4668*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
4669*4bdc9457SAndroid Build Coastguard Worker
4670*4bdc9457SAndroid Build Coastguard Worker
4671*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// Single run of the 5x8 fma_splat ukernel: m=5, n=8, k=4.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(1)
    .m(5).n(8).k(4)
    .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
}
4683*4bdc9457SAndroid Build Coastguard Worker
// Single run of the 5x8 fma_splat ukernel: m=5, n=8, k=4 with cn_stride set to 11.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(1)
    .m(5).n(8).k(4)
    .cn_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
}
4696*4bdc9457SAndroid Build Coastguard Worker
// Single run of the 5x8 fma_splat ukernel: m=5, n=8, k=4 with a_stride set to 7.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_strided_a) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(1)
    .m(5).n(8).k(4)
    .a_stride(7)
    .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
}
4709*4bdc9457SAndroid Build Coastguard Worker
// Fixes k=4 and sweeps every n in [1, 8] and m in [1, 5],
// one iteration per combination.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile) {
  for (uint32_t nc = 1; nc <= 8; ++nc) {
    for (uint32_t mc = 1; mc <= 5; ++mc) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(mc).n(nc).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
4726*4bdc9457SAndroid Build Coastguard Worker
// Fixes n=8, k=4 and sweeps m in [1, 5], one iteration per value.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_m) {
  for (uint32_t mc = 1; mc <= 5; ++mc) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(mc).n(8).k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
  }
}
4741*4bdc9457SAndroid Build Coastguard Worker
// Fixes m=5, k=4 and sweeps n in [1, 8], one iteration per value.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_n) {
  for (uint32_t nc = 1; nc <= 8; ++nc) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(nc).k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
  }
}
4756*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8 fma_splat ukernel with m=5, n=8 for every k in {1, 2, 3}.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4) {
  for (size_t kc = 1; kc < 4; ++kc) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(kc)
      .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
  }
}
4770*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as k_lt_4 (k in {1, 2, 3}, m=5, n=8) but with a_stride set to 7.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4_strided_a) {
  for (size_t kc = 1; kc < 4; ++kc) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(kc)
      .a_stride(7)
      .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
  }
}
4785*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k in {1, 2, 3} against every n in [1, 8] and m in [1, 5],
// one iteration per combination.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4_subtile) {
  for (size_t kc = 1; kc < 4; ++kc) {
    for (uint32_t nc = 1; nc <= 8; ++nc) {
      for (uint32_t mc = 1; mc <= 5; ++mc) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(mc).n(nc).k(kc)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
4804*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8 fma_splat ukernel with m=5, n=8 for every k in {5, 6, 7}.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4) {
  for (size_t kc = 5; kc < 8; ++kc) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(kc)
      .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
  }
}
4818*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as k_gt_4 (k in {5, 6, 7}, m=5, n=8) but with a_stride set to 11.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4_strided_a) {
  for (size_t kc = 5; kc < 8; ++kc) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(kc)
      .a_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
  }
}
4833*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k in {5, 6, 7} against every n in [1, 8] and m in [1, 5],
// one iteration per combination.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4_subtile) {
  for (size_t kc = 5; kc < 8; ++kc) {
    for (uint32_t nc = 1; nc <= 8; ++nc) {
      for (uint32_t mc = 1; mc <= 5; ++mc) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(mc).n(nc).k(kc)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
4852*4bdc9457SAndroid Build Coastguard Worker
// Runs the 5x8 fma_splat ukernel with m=5, n=8 for k = 8, 12, ..., 40.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4) {
  for (size_t kc = 8; kc <= 40; kc += 4) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(kc)
      .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
  }
}
4866*4bdc9457SAndroid Build Coastguard Worker
// 5x8 kernel, full tile: k = 8, 12, ..., 40 with a_stride set to 43
// (larger than the largest k exercised here).
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4_strided_a) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(5)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(5)
      .n(8)
      .k(k)
      .a_stride(43)
      .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
  }
}
4881*4bdc9457SAndroid Build Coastguard Worker
// 5x8 kernel: k = 8, 12, ..., 40 crossed with every (m, n) subtile,
// m = 1..5 and n = 1..8. Each configuration is run with iterations set to 1.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4_subtile) {
  for (size_t k = 8; k <= 40; k += 4) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 5; m++) {
        GemmMicrokernelTester()
          .mr(5)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
4900*4bdc9457SAndroid Build Coastguard Worker
// 5x8 kernel, m = 5: n = 9..15 (above nr but below 2 * nr), k = 1, 6, 11, 16.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(5)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(5)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
4916*4bdc9457SAndroid Build Coastguard Worker
// 5x8 kernel, m = 5: n = 9..15, k = 1, 6, 11, 16, with cn_stride set to 11.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(5)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(5)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
4933*4bdc9457SAndroid Build Coastguard Worker
// 5x8 kernel, m = 5: n = 9..15, k = 1, 6, 11, 16, with a_stride set to 23
// (larger than the largest k exercised here).
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_strided_a) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(5)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(5)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
4950*4bdc9457SAndroid Build Coastguard Worker
// 5x8 kernel: n = 9..15, k = 1, 6, 11, 16, crossed with every m = 1..5.
// Each configuration is run with iterations set to 1.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 5; m++) {
        GemmMicrokernelTester()
          .mr(5)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
4969*4bdc9457SAndroid Build Coastguard Worker
// 5x8 kernel, m = 5: n = 16 and 24 (multiples of nr), k = 1, 6, 11, 16.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(5)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(5)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
4985*4bdc9457SAndroid Build Coastguard Worker
// 5x8 kernel, m = 5: n = 16 and 24, k = 1, 6, 11, 16, with cn_stride set to 11.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(5)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(5)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
5002*4bdc9457SAndroid Build Coastguard Worker
// 5x8 kernel, m = 5: n = 16 and 24, k = 1, 6, 11, 16, with a_stride set to 23
// (larger than the largest k exercised here).
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(5)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(5)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
5019*4bdc9457SAndroid Build Coastguard Worker
// 5x8 kernel: n = 16 and 24, k = 1, 6, 11, 16, crossed with every m = 1..5.
// Each configuration is run with iterations set to 1.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 5; m++) {
        GemmMicrokernelTester()
          .mr(5)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
5038*4bdc9457SAndroid Build Coastguard Worker
// 5x8 kernel: k = 1, 6, 11, 16 crossed with every (m, n) subtile, m = 1..5 and
// n = 1..8, with cm_stride set to 11. Each configuration is run with
// iterations set to 1.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 5; m++) {
        GemmMicrokernelTester()
          .mr(5)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
5058*4bdc9457SAndroid Build Coastguard Worker
// 5x8 kernel, full tile (m = 5, n = 8) at k = 4, with cm_stride set to 11.
TEST(F32_GEMM_RELU_5X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(5)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(5)
    .n(8)
    .k(4)
    .cm_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_5x8__wasmrelaxedsimd_fma_splat);
}
5071*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
5072*4bdc9457SAndroid Build Coastguard Worker
5073*4bdc9457SAndroid Build Coastguard Worker
5074*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// 6x8 kernel, full tile (m = 6, n = 8) at k = 4.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4) {
  GemmMicrokernelTester()
    .mr(6)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(6)
    .n(8)
    .k(4)
    .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
}
5086*4bdc9457SAndroid Build Coastguard Worker
// 6x8 kernel, full tile (m = 6, n = 8) at k = 4, with cn_stride set to 11.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(6)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(6)
    .n(8)
    .k(4)
    .cn_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
}
5099*4bdc9457SAndroid Build Coastguard Worker
// 6x8 kernel, full tile (m = 6, n = 8) at k = 4, with a_stride set to 7.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_strided_a) {
  GemmMicrokernelTester()
    .mr(6)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(6)
    .n(8)
    .k(4)
    .a_stride(7)
    .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
}
5112*4bdc9457SAndroid Build Coastguard Worker
// 6x8 kernel at k = 4: every (m, n) subtile, m = 1..6 and n = 1..8.
// Each configuration is run with iterations set to 1.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 6; m++) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
5129*4bdc9457SAndroid Build Coastguard Worker
// 6x8 kernel at k = 4 with n fixed at 8: m = 1..6.
// Each configuration is run with iterations set to 1.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_m) {
  for (uint32_t m = 1; m <= 6; m++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(m)
      .n(8)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
  }
}
5144*4bdc9457SAndroid Build Coastguard Worker
// 6x8 kernel at k = 4 with m fixed at 6: n = 1..8.
// Each configuration is run with iterations set to 1.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_eq_4_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(n)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
  }
}
5159*4bdc9457SAndroid Build Coastguard Worker
// 6x8 kernel, full tile (m = 6, n = 8): k = 1..3.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
  }
}
5173*4bdc9457SAndroid Build Coastguard Worker
// 6x8 kernel, full tile (m = 6, n = 8): k = 1..3 with a_stride set to 7.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4_strided_a) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(8)
      .k(k)
      .a_stride(7)
      .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
  }
}
5188*4bdc9457SAndroid Build Coastguard Worker
// 6x8 kernel: k = 1..3 crossed with every (m, n) subtile, m = 1..6 and n = 1..8.
// Each configuration is run with iterations set to 1.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_lt_4_subtile) {
  for (size_t k = 1; k < 4; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
5207*4bdc9457SAndroid Build Coastguard Worker
// 6x8 kernel, full tile (m = 6, n = 8): k = 5..7.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
  }
}
5221*4bdc9457SAndroid Build Coastguard Worker
// 6x8 kernel, full tile (m = 6, n = 8): k = 5..7 with a_stride set to 11.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4_strided_a) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(8)
      .k(k)
      .a_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
  }
}
5236*4bdc9457SAndroid Build Coastguard Worker
// 6x8 kernel: k = 5..7 crossed with every (m, n) subtile, m = 1..6 and n = 1..8.
// Each configuration is run with iterations set to 1.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_gt_4_subtile) {
  for (size_t k = 5; k < 8; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
5255*4bdc9457SAndroid Build Coastguard Worker
// 6x8 kernel, full tile (m = 6, n = 8): k = 8, 12, ..., 40 (multiples of 4).
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
  }
}
5269*4bdc9457SAndroid Build Coastguard Worker
// 6x8 kernel, full tile: k = 8, 12, ..., 40 with a_stride set to 43
// (larger than the largest k exercised here).
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4_strided_a) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(6)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(6)
      .n(8)
      .k(k)
      .a_stride(43)
      .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
  }
}
5284*4bdc9457SAndroid Build Coastguard Worker
// 6x8 kernel: k = 8, 12, ..., 40 crossed with every (m, n) subtile,
// m = 1..6 and n = 1..8. Each configuration is run with iterations set to 1.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, k_div_4_subtile) {
  for (size_t k = 8; k <= 40; k += 4) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
5303*4bdc9457SAndroid Build Coastguard Worker
// 6x8 kernel, m = 6: n = 9..15 (above nr but below 2 * nr), k = 1, 6, 11, 16.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
5319*4bdc9457SAndroid Build Coastguard Worker
// 6x8 kernel, m = 6: n = 9..15, k = 1, 6, 11, 16, with cn_stride set to 11.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
5336*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (m = 6, n = 9..15, k in {1, 6, 11, 16}) with
// a_stride set to 23.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_strided_a) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
5353*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 9..15, k in {1, 6, 11, 16} and every m = 1..6, with
// iterations(1) per configuration.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
5372*4bdc9457SAndroid Build Coastguard Worker
// Runs the kernel with m = 6 for n in {16, 24} (multiples of nr = 8) and
// k in {1, 6, 11, 16}.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
5388*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (m = 6, n in {16, 24}, k in {1, 6, 11, 16}) with
// cn_stride set to 11.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
5405*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (m = 6, n in {16, 24}, k in {1, 6, 11, 16}) with
// a_stride set to 23.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(6)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(6)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
    }
  }
}
5422*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in {16, 24}, k in {1, 6, 11, 16} and every m = 1..6, with
// iterations(1) per configuration.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
5441*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k in {1, 6, 11, 16}, n = 1..8 and m = 1..6 with cm_stride set to 11
// and iterations(1) per configuration.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 6; m++) {
        GemmMicrokernelTester()
          .mr(6)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
      }
    }
  }
}
5461*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 6, n = 8, k = 4 with cm_stride set to 11.
TEST(F32_GEMM_RELU_6X8__WASMRELAXEDSIMD_FMA_SPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(6)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(6)
    .n(8)
    .k(4)
    .cm_stride(11)
    .Test(xnn_f32_gemm_relu_ukernel_6x8__wasmrelaxedsimd_fma_splat);
}
5474*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
5475*4bdc9457SAndroid Build Coastguard Worker
5476*4bdc9457SAndroid Build Coastguard Worker
5477*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Single configuration for the 1x4 wasm kernel: m = 1, n = 4, k = 1.
TEST(F32_GEMM_RELU_1X4__WASM, k_eq_1) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(4)
    .kr(1)
    .sr(1)
    .m(1)
    .n(4)
    .k(1)
    .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
}
5489*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 1, n = 4, k = 1 with cn_stride set to 7.
TEST(F32_GEMM_RELU_1X4__WASM, strided_cn) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(4)
    .kr(1)
    .sr(1)
    .m(1)
    .n(4)
    .k(1)
    .cn_stride(7)
    .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
}
5502*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 1, n = 4, k = 1 with a_stride set to 3.
TEST(F32_GEMM_RELU_1X4__WASM, k_eq_1_strided_a) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(4)
    .kr(1)
    .sr(1)
    .m(1)
    .n(4)
    .k(1)
    .a_stride(3)
    .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
}
5515*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 1..4 and m = 1..1 (a single value, since mr = 1) at k = 1,
// with iterations(1) per configuration.
TEST(F32_GEMM_RELU_1X4__WASM, k_eq_1_subtile) {
  for (uint32_t n = 1; n <= 4; n++) {
    for (uint32_t m = 1; m <= 1; m++) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
    }
  }
}
5532*4bdc9457SAndroid Build Coastguard Worker
// Sweeps m = 1..1 (a single value, since mr = 1) at n = 4, k = 1, with
// iterations(1).
TEST(F32_GEMM_RELU_1X4__WASM, k_eq_1_subtile_m) {
  for (uint32_t m = 1; m <= 1; m++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(4)
      .kr(1)
      .sr(1)
      .m(m)
      .n(4)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
  }
}
5547*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 1..4 at m = 1, k = 1, with iterations(1) per configuration.
TEST(F32_GEMM_RELU_1X4__WASM, k_eq_1_subtile_n) {
  for (uint32_t n = 1; n <= 4; n++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(4)
      .kr(1)
      .sr(1)
      .m(1)
      .n(n)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
  }
}
5562*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 2..9 at m = 1, n = 4.
TEST(F32_GEMM_RELU_1X4__WASM, k_gt_1) {
  for (size_t k = 2; k < 10; k++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(4)
      .kr(1)
      .sr(1)
      .m(1)
      .n(4)
      .k(k)
      .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
  }
}
5576*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 2..9 at m = 1, n = 4 with a_stride set to 11.
TEST(F32_GEMM_RELU_1X4__WASM, k_gt_1_strided_a) {
  for (size_t k = 2; k < 10; k++) {
    GemmMicrokernelTester()
      .mr(1)
      .nr(4)
      .kr(1)
      .sr(1)
      .m(1)
      .n(4)
      .k(k)
      .a_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
  }
}
5591*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 2..9, n = 1..4 and m = 1..1 (a single value, since mr = 1),
// with iterations(1) per configuration.
TEST(F32_GEMM_RELU_1X4__WASM, k_gt_1_subtile) {
  for (size_t k = 2; k < 10; k++) {
    for (uint32_t n = 1; n <= 4; n++) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(4)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
      }
    }
  }
}
5610*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 5..7 (values above nr = 4) and k in {1, 3, 5} at m = 1.
TEST(F32_GEMM_RELU_1X4__WASM, n_gt_4) {
  for (uint32_t n = 5; n < 8; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
    }
  }
}
5626*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_4 (m = 1, n = 5..7, k in {1, 3, 5}) with cn_stride
// set to 7.
TEST(F32_GEMM_RELU_1X4__WASM, n_gt_4_strided_cn) {
  for (uint32_t n = 5; n < 8; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .cn_stride(7)
        .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
    }
  }
}
5643*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_4 (m = 1, n = 5..7, k in {1, 3, 5}) with a_stride
// set to 7.
TEST(F32_GEMM_RELU_1X4__WASM, n_gt_4_strided_a) {
  for (uint32_t n = 5; n < 8; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .a_stride(7)
        .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
    }
  }
}
5660*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 5..7, k in {1, 3, 5} and m = 1..1 (a single value, since
// mr = 1), with iterations(1) per configuration.
TEST(F32_GEMM_RELU_1X4__WASM, n_gt_4_subtile) {
  for (uint32_t n = 5; n < 8; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(4)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
      }
    }
  }
}
5679*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in {8, 12} (multiples of nr = 4) and k in {1, 3, 5} at m = 1.
TEST(F32_GEMM_RELU_1X4__WASM, n_div_4) {
  for (uint32_t n = 8; n <= 12; n += 4) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
    }
  }
}
5695*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_4 (m = 1, n in {8, 12}, k in {1, 3, 5}) with
// cn_stride set to 7.
TEST(F32_GEMM_RELU_1X4__WASM, n_div_4_strided_cn) {
  for (uint32_t n = 8; n <= 12; n += 4) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .cn_stride(7)
        .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
    }
  }
}
5712*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_4 (m = 1, n in {8, 12}, k in {1, 3, 5}) with
// a_stride set to 7.
TEST(F32_GEMM_RELU_1X4__WASM, n_div_4_strided_a) {
  for (uint32_t n = 8; n <= 12; n += 4) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(1)
        .n(n)
        .k(k)
        .a_stride(7)
        .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
    }
  }
}
5729*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in {8, 12}, k in {1, 3, 5} and m = 1..1 (a single value, since
// mr = 1), with iterations(1) per configuration.
TEST(F32_GEMM_RELU_1X4__WASM, n_div_4_subtile) {
  for (uint32_t n = 8; n <= 12; n += 4) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(4)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
      }
    }
  }
}
5748*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k in {1, 3, 5}, n = 1..4 and m = 1..1 with cm_stride set to 7 and
// iterations(1) per configuration.
TEST(F32_GEMM_RELU_1X4__WASM, strided_cm_subtile) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t n = 1; n <= 4; n++) {
      for (uint32_t m = 1; m <= 1; m++) {
        GemmMicrokernelTester()
          .mr(1)
          .nr(4)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(7)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
      }
    }
  }
}
5768*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 1, n = 4, k = 1 with cm_stride set to 7.
TEST(F32_GEMM_RELU_1X4__WASM, strided_cm) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(4)
    .kr(1)
    .sr(1)
    .m(1)
    .n(4)
    .k(1)
    .cm_stride(7)
    .Test(xnn_f32_gemm_relu_ukernel_1x4__wasm);
}
5781*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASM || XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
5782*4bdc9457SAndroid Build Coastguard Worker
5783*4bdc9457SAndroid Build Coastguard Worker
// Single configuration for the 1x4 scalar kernel: m = 1, n = 4, k = 1.
TEST(F32_GEMM_RELU_1X4__SCALAR, k_eq_1) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(4)
    .kr(1)
    .sr(1)
    .m(1)
    .n(4)
    .k(1)
    .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
}
5795*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 1, n = 4, k = 1 with cn_stride set to 7.
TEST(F32_GEMM_RELU_1X4__SCALAR, strided_cn) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(4)
    .kr(1)
    .sr(1)
    .m(1)
    .n(4)
    .k(1)
    .cn_stride(7)
    .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
}
5808*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 1, n = 4, k = 1 with a_stride set to 3.
TEST(F32_GEMM_RELU_1X4__SCALAR, k_eq_1_strided_a) {
  GemmMicrokernelTester()
    .mr(1)
    .nr(4)
    .kr(1)
    .sr(1)
    .m(1)
    .n(4)
    .k(1)
    .a_stride(3)
    .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
}
5821*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 1..4 and m = 1..1 (a single value, since mr = 1) at k = 1,
// with iterations(1) per configuration.
TEST(F32_GEMM_RELU_1X4__SCALAR, k_eq_1_subtile) {
  for (uint32_t n = 1; n <= 4; n++) {
    for (uint32_t m = 1; m <= 1; m++) {
      GemmMicrokernelTester()
        .mr(1)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
    }
  }
}
5838*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x4__scalar at n=4, k=1 for m in 1..1,
// each with iterations(1).
TEST(F32_GEMM_RELU_1X4__SCALAR, k_eq_1_subtile_m) {
  for (uint32_t cur_m = 1; cur_m < 2; ++cur_m) {
    GemmMicrokernelTester()
        .mr(1).nr(4).kr(1).sr(1)
        .m(cur_m).n(4).k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
  }
}
5853*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x4__scalar at m=1, k=1 for n in 1..4,
// each with iterations(1).
TEST(F32_GEMM_RELU_1X4__SCALAR, k_eq_1_subtile_n) {
  for (uint32_t cur_n = 1; cur_n < 5; ++cur_n) {
    GemmMicrokernelTester()
        .mr(1).nr(4).kr(1).sr(1)
        .m(1).n(cur_n).k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
  }
}
5868*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x4__scalar at m=1, n=4 for k in 2..9.
TEST(F32_GEMM_RELU_1X4__SCALAR, k_gt_1) {
  for (size_t cur_k = 2; cur_k <= 9; ++cur_k) {
    GemmMicrokernelTester()
        .mr(1).nr(4).kr(1).sr(1)
        .m(1).n(4).k(cur_k)
        .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
  }
}
5882*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x4__scalar at m=1, n=4 for k in 2..9,
// with a_stride set to 11.
TEST(F32_GEMM_RELU_1X4__SCALAR, k_gt_1_strided_a) {
  for (size_t cur_k = 2; cur_k <= 9; ++cur_k) {
    GemmMicrokernelTester()
        .mr(1).nr(4).kr(1).sr(1)
        .m(1).n(4).k(cur_k)
        .a_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
  }
}
5897*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x4__scalar for every (k, n, m) combination
// with k in 2..9, n in 1..4 and m in 1..1, each with iterations(1).
TEST(F32_GEMM_RELU_1X4__SCALAR, k_gt_1_subtile) {
  for (size_t cur_k = 2; cur_k <= 9; ++cur_k) {
    for (uint32_t cur_n = 1; cur_n < 5; ++cur_n) {
      for (uint32_t cur_m = 1; cur_m < 2; ++cur_m) {
        GemmMicrokernelTester()
            .mr(1).nr(4).kr(1).sr(1)
            .m(cur_m).n(cur_n).k(cur_k)
            .iterations(1)
            .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
      }
    }
  }
}
5916*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x4__scalar at m=1 for n in 5..7 and
// k in {1, 3, 5}.
TEST(F32_GEMM_RELU_1X4__SCALAR, n_gt_4) {
  for (uint32_t cur_n = 5; cur_n <= 7; ++cur_n) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(4).kr(1).sr(1)
          .m(1).n(cur_n).k(cur_k)
          .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
    }
  }
}
5932*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x4__scalar at m=1 for n in 5..7 and
// k in {1, 3, 5}, with cn_stride set to 7.
TEST(F32_GEMM_RELU_1X4__SCALAR, n_gt_4_strided_cn) {
  for (uint32_t cur_n = 5; cur_n <= 7; ++cur_n) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(4).kr(1).sr(1)
          .m(1).n(cur_n).k(cur_k)
          .cn_stride(7)
          .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
    }
  }
}
5949*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x4__scalar at m=1 for n in 5..7 and
// k in {1, 3, 5}, with a_stride set to 7.
TEST(F32_GEMM_RELU_1X4__SCALAR, n_gt_4_strided_a) {
  for (uint32_t cur_n = 5; cur_n <= 7; ++cur_n) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(4).kr(1).sr(1)
          .m(1).n(cur_n).k(cur_k)
          .a_stride(7)
          .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
    }
  }
}
5966*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x4__scalar for every (n, k, m) combination
// with n in 5..7, k in {1, 3, 5} and m in 1..1, each with iterations(1).
TEST(F32_GEMM_RELU_1X4__SCALAR, n_gt_4_subtile) {
  for (uint32_t cur_n = 5; cur_n <= 7; ++cur_n) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      for (uint32_t cur_m = 1; cur_m < 2; ++cur_m) {
        GemmMicrokernelTester()
            .mr(1).nr(4).kr(1).sr(1)
            .m(cur_m).n(cur_n).k(cur_k)
            .iterations(1)
            .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
      }
    }
  }
}
5985*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x4__scalar at m=1 for n in {8, 12} and
// k in {1, 3, 5}.
TEST(F32_GEMM_RELU_1X4__SCALAR, n_div_4) {
  for (uint32_t cur_n = 8; cur_n < 13; cur_n += 4) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(4).kr(1).sr(1)
          .m(1).n(cur_n).k(cur_k)
          .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
    }
  }
}
6001*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x4__scalar at m=1 for n in {8, 12} and
// k in {1, 3, 5}, with cn_stride set to 7.
TEST(F32_GEMM_RELU_1X4__SCALAR, n_div_4_strided_cn) {
  for (uint32_t cur_n = 8; cur_n < 13; cur_n += 4) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(4).kr(1).sr(1)
          .m(1).n(cur_n).k(cur_k)
          .cn_stride(7)
          .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
    }
  }
}
6018*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x4__scalar at m=1 for n in {8, 12} and
// k in {1, 3, 5}, with a_stride set to 7.
TEST(F32_GEMM_RELU_1X4__SCALAR, n_div_4_strided_a) {
  for (uint32_t cur_n = 8; cur_n < 13; cur_n += 4) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(4).kr(1).sr(1)
          .m(1).n(cur_n).k(cur_k)
          .a_stride(7)
          .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
    }
  }
}
6035*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x4__scalar for every (n, k, m) combination
// with n in {8, 12}, k in {1, 3, 5} and m in 1..1, each with iterations(1).
TEST(F32_GEMM_RELU_1X4__SCALAR, n_div_4_subtile) {
  for (uint32_t cur_n = 8; cur_n < 13; cur_n += 4) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      for (uint32_t cur_m = 1; cur_m < 2; ++cur_m) {
        GemmMicrokernelTester()
            .mr(1).nr(4).kr(1).sr(1)
            .m(cur_m).n(cur_n).k(cur_k)
            .iterations(1)
            .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
      }
    }
  }
}
6054*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x4__scalar for every (k, n, m) combination
// with k in {1, 3, 5}, n in 1..4 and m in 1..1, with cm_stride set to 7 and
// iterations(1).
TEST(F32_GEMM_RELU_1X4__SCALAR, strided_cm_subtile) {
  for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
    for (uint32_t cur_n = 1; cur_n < 5; ++cur_n) {
      for (uint32_t cur_m = 1; cur_m < 2; ++cur_m) {
        GemmMicrokernelTester()
            .mr(1).nr(4).kr(1).sr(1)
            .m(cur_m).n(cur_n).k(cur_k)
            .cm_stride(7)
            .iterations(1)
            .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
      }
    }
  }
}
6074*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_1x4__scalar once through GemmMicrokernelTester
// with m=1, n=4, k=1 and cm_stride set to 7.
TEST(F32_GEMM_RELU_1X4__SCALAR, strided_cm) {
  GemmMicrokernelTester()
      .mr(1).nr(4).kr(1).sr(1)
      .m(1).n(4).k(1)
      .cm_stride(7)
      .Test(xnn_f32_gemm_relu_ukernel_1x4__scalar);
}
6087*4bdc9457SAndroid Build Coastguard Worker
6088*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x2__scalar once through GemmMicrokernelTester
// with m=4, n=2, k=1.
TEST(F32_GEMM_RELU_4X2__SCALAR, k_eq_1) {
  GemmMicrokernelTester()
      .mr(4).nr(2).kr(1).sr(1)
      .m(4).n(2).k(1)
      .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
}
6100*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x2__scalar once through GemmMicrokernelTester
// with m=4, n=2, k=1 and cn_stride set to 5.
TEST(F32_GEMM_RELU_4X2__SCALAR, strided_cn) {
  GemmMicrokernelTester()
      .mr(4).nr(2).kr(1).sr(1)
      .m(4).n(2).k(1)
      .cn_stride(5)
      .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
}
6113*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x2__scalar once through GemmMicrokernelTester
// with m=4, n=2, k=1 and a_stride set to 3.
TEST(F32_GEMM_RELU_4X2__SCALAR, k_eq_1_strided_a) {
  GemmMicrokernelTester()
      .mr(4).nr(2).kr(1).sr(1)
      .m(4).n(2).k(1)
      .a_stride(3)
      .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
}
6126*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x2__scalar at k=1 for every (n, m) pair with
// n in 1..2 and m in 1..4, each with iterations(1).
TEST(F32_GEMM_RELU_4X2__SCALAR, k_eq_1_subtile) {
  for (uint32_t cur_n = 1; cur_n < 3; ++cur_n) {
    for (uint32_t cur_m = 1; cur_m < 5; ++cur_m) {
      GemmMicrokernelTester()
          .mr(4).nr(2).kr(1).sr(1)
          .m(cur_m).n(cur_n).k(1)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
    }
  }
}
6143*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x2__scalar at n=2, k=1 for m in 1..4,
// each with iterations(1).
TEST(F32_GEMM_RELU_4X2__SCALAR, k_eq_1_subtile_m) {
  for (uint32_t cur_m = 1; cur_m < 5; ++cur_m) {
    GemmMicrokernelTester()
        .mr(4).nr(2).kr(1).sr(1)
        .m(cur_m).n(2).k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
  }
}
6158*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x2__scalar at m=4, k=1 for n in 1..2,
// each with iterations(1).
TEST(F32_GEMM_RELU_4X2__SCALAR, k_eq_1_subtile_n) {
  for (uint32_t cur_n = 1; cur_n < 3; ++cur_n) {
    GemmMicrokernelTester()
        .mr(4).nr(2).kr(1).sr(1)
        .m(4).n(cur_n).k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
  }
}
6173*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x2__scalar at m=4, n=2 for k in 2..9.
TEST(F32_GEMM_RELU_4X2__SCALAR, k_gt_1) {
  for (size_t cur_k = 2; cur_k <= 9; ++cur_k) {
    GemmMicrokernelTester()
        .mr(4).nr(2).kr(1).sr(1)
        .m(4).n(2).k(cur_k)
        .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
  }
}
6187*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x2__scalar at m=4, n=2 for k in 2..9,
// with a_stride set to 11.
TEST(F32_GEMM_RELU_4X2__SCALAR, k_gt_1_strided_a) {
  for (size_t cur_k = 2; cur_k <= 9; ++cur_k) {
    GemmMicrokernelTester()
        .mr(4).nr(2).kr(1).sr(1)
        .m(4).n(2).k(cur_k)
        .a_stride(11)
        .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
  }
}
6202*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x2__scalar for every (k, n, m) combination
// with k in 2..9, n in 1..2 and m in 1..4, each with iterations(1).
TEST(F32_GEMM_RELU_4X2__SCALAR, k_gt_1_subtile) {
  for (size_t cur_k = 2; cur_k <= 9; ++cur_k) {
    for (uint32_t cur_n = 1; cur_n < 3; ++cur_n) {
      for (uint32_t cur_m = 1; cur_m < 5; ++cur_m) {
        GemmMicrokernelTester()
            .mr(4).nr(2).kr(1).sr(1)
            .m(cur_m).n(cur_n).k(cur_k)
            .iterations(1)
            .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
      }
    }
  }
}
6221*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x2__scalar at m=4 for n in 3..3 and
// k in {1, 3, 5}.
TEST(F32_GEMM_RELU_4X2__SCALAR, n_gt_2) {
  for (uint32_t cur_n = 3; cur_n <= 3; ++cur_n) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(2).kr(1).sr(1)
          .m(4).n(cur_n).k(cur_k)
          .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
    }
  }
}
6237*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x2__scalar at m=4 for n in 3..3 and
// k in {1, 3, 5}, with cn_stride set to 5.
TEST(F32_GEMM_RELU_4X2__SCALAR, n_gt_2_strided_cn) {
  for (uint32_t cur_n = 3; cur_n <= 3; ++cur_n) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(2).kr(1).sr(1)
          .m(4).n(cur_n).k(cur_k)
          .cn_stride(5)
          .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
    }
  }
}
6254*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x2__scalar at m=4 for n in 3..3 and
// k in {1, 3, 5}, with a_stride set to 7.
TEST(F32_GEMM_RELU_4X2__SCALAR, n_gt_2_strided_a) {
  for (uint32_t cur_n = 3; cur_n <= 3; ++cur_n) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(2).kr(1).sr(1)
          .m(4).n(cur_n).k(cur_k)
          .a_stride(7)
          .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
    }
  }
}
6271*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x2__scalar for every (n, k, m) combination
// with n in 3..3, k in {1, 3, 5} and m in 1..4, each with iterations(1).
TEST(F32_GEMM_RELU_4X2__SCALAR, n_gt_2_subtile) {
  for (uint32_t cur_n = 3; cur_n <= 3; ++cur_n) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      for (uint32_t cur_m = 1; cur_m < 5; ++cur_m) {
        GemmMicrokernelTester()
            .mr(4).nr(2).kr(1).sr(1)
            .m(cur_m).n(cur_n).k(cur_k)
            .iterations(1)
            .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
      }
    }
  }
}
6290*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x2__scalar at m=4 for n in {4, 6} and
// k in {1, 3, 5}.
TEST(F32_GEMM_RELU_4X2__SCALAR, n_div_2) {
  for (uint32_t cur_n = 4; cur_n < 7; cur_n += 2) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(2).kr(1).sr(1)
          .m(4).n(cur_n).k(cur_k)
          .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
    }
  }
}
6306*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x2__scalar at m=4 for n in {4, 6} and
// k in {1, 3, 5}, with cn_stride set to 5.
TEST(F32_GEMM_RELU_4X2__SCALAR, n_div_2_strided_cn) {
  for (uint32_t cur_n = 4; cur_n < 7; cur_n += 2) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(2).kr(1).sr(1)
          .m(4).n(cur_n).k(cur_k)
          .cn_stride(5)
          .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
    }
  }
}
6323*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_relu_ukernel_4x2__scalar at m=4 for n in {4, 6} and
// k in {1, 3, 5}, with a_stride set to 7.
TEST(F32_GEMM_RELU_4X2__SCALAR, n_div_2_strided_a) {
  for (uint32_t cur_n = 4; cur_n < 7; cur_n += 2) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(2).kr(1).sr(1)
          .m(4).n(cur_n).k(cur_k)
          .a_stride(7)
          .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
    }
  }
}
6340*4bdc9457SAndroid Build Coastguard Worker
// 4x2 scalar kernel: n visits {4, 6}, k visits {1, 3, 5}, and m sweeps 1..4.
// Each combination is run with iterations(1).
TEST(F32_GEMM_RELU_4X2__SCALAR, n_div_2_subtile) {
  for (uint32_t n_dim = 4; n_dim <= 6; n_dim += 2) {
    for (size_t k_dim = 1; k_dim <= 5; k_dim += 2) {
      for (uint32_t m_dim = 1; m_dim <= 4; ++m_dim) {
        GemmMicrokernelTester()
          .mr(4).nr(2).kr(1).sr(1)
          .m(m_dim).n(n_dim).k(k_dim)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
      }
    }
  }
}
6359*4bdc9457SAndroid Build Coastguard Worker
// 4x2 scalar kernel: k visits {1, 3, 5}, n sweeps 1..2 and m sweeps 1..4, each
// run using cm_stride(5) and iterations(1).
TEST(F32_GEMM_RELU_4X2__SCALAR, strided_cm_subtile) {
  for (size_t k_dim = 1; k_dim <= 5; k_dim += 2) {
    for (uint32_t n_dim = 1; n_dim <= 2; ++n_dim) {
      for (uint32_t m_dim = 1; m_dim <= 4; ++m_dim) {
        GemmMicrokernelTester()
          .mr(4).nr(2).kr(1).sr(1)
          .m(m_dim).n(n_dim).k(k_dim)
          .cm_stride(5)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
      }
    }
  }
}
6379*4bdc9457SAndroid Build Coastguard Worker
// 4x2 scalar kernel: single run at m = 4, n = 2, k = 1 with cm_stride(5).
TEST(F32_GEMM_RELU_4X2__SCALAR, strided_cm) {
  GemmMicrokernelTester()
    .mr(4).nr(2).kr(1).sr(1)
    .m(4).n(2).k(1)
    .cm_stride(5)
    .Test(xnn_f32_gemm_relu_ukernel_4x2__scalar);
}
6392*4bdc9457SAndroid Build Coastguard Worker
6393*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel: single run at m = 4, n = 4, k = 1 with no stride setters.
TEST(F32_GEMM_RELU_4X4__SCALAR, k_eq_1) {
  GemmMicrokernelTester()
    .mr(4).nr(4).kr(1).sr(1)
    .m(4).n(4).k(1)
    .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
}
6405*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel: single run at m = 4, n = 4, k = 1 with cn_stride(7).
TEST(F32_GEMM_RELU_4X4__SCALAR, strided_cn) {
  GemmMicrokernelTester()
    .mr(4).nr(4).kr(1).sr(1)
    .m(4).n(4).k(1)
    .cn_stride(7)
    .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
}
6418*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel: single run at m = 4, n = 4, k = 1 with a_stride(3).
TEST(F32_GEMM_RELU_4X4__SCALAR, k_eq_1_strided_a) {
  GemmMicrokernelTester()
    .mr(4).nr(4).kr(1).sr(1)
    .m(4).n(4).k(1)
    .a_stride(3)
    .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
}
6431*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel at k = 1: every (n, m) pair with n in 1..4 and m in 1..4,
// each run using iterations(1).
TEST(F32_GEMM_RELU_4X4__SCALAR, k_eq_1_subtile) {
  for (uint32_t n_dim = 1; n_dim <= 4; ++n_dim) {
    for (uint32_t m_dim = 1; m_dim <= 4; ++m_dim) {
      GemmMicrokernelTester()
        .mr(4).nr(4).kr(1).sr(1)
        .m(m_dim).n(n_dim).k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
    }
  }
}
6448*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel at k = 1 and n = 4: m sweeps 1..4, each run using
// iterations(1).
TEST(F32_GEMM_RELU_4X4__SCALAR, k_eq_1_subtile_m) {
  for (uint32_t m_dim = 1; m_dim <= 4; ++m_dim) {
    GemmMicrokernelTester()
      .mr(4).nr(4).kr(1).sr(1)
      .m(m_dim).n(4).k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
  }
}
6463*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel at k = 1 and m = 4: n sweeps 1..4, each run using
// iterations(1).
TEST(F32_GEMM_RELU_4X4__SCALAR, k_eq_1_subtile_n) {
  for (uint32_t n_dim = 1; n_dim <= 4; ++n_dim) {
    GemmMicrokernelTester()
      .mr(4).nr(4).kr(1).sr(1)
      .m(4).n(n_dim).k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
  }
}
6478*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel at m = 4, n = 4: k sweeps every value from 2 through 9.
TEST(F32_GEMM_RELU_4X4__SCALAR, k_gt_1) {
  for (size_t k_dim = 2; k_dim <= 9; ++k_dim) {
    GemmMicrokernelTester()
      .mr(4).nr(4).kr(1).sr(1)
      .m(4).n(4).k(k_dim)
      .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
  }
}
6492*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel at m = 4, n = 4: k sweeps 2 through 9 with a_stride(11)
// applied on every run.
TEST(F32_GEMM_RELU_4X4__SCALAR, k_gt_1_strided_a) {
  for (size_t k_dim = 2; k_dim <= 9; ++k_dim) {
    GemmMicrokernelTester()
      .mr(4).nr(4).kr(1).sr(1)
      .m(4).n(4).k(k_dim)
      .a_stride(11)
      .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
  }
}
6507*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel: k sweeps 2 through 9, and for each k every (n, m) pair
// with n in 1..4 and m in 1..4 is run using iterations(1).
TEST(F32_GEMM_RELU_4X4__SCALAR, k_gt_1_subtile) {
  for (size_t k_dim = 2; k_dim <= 9; ++k_dim) {
    for (uint32_t n_dim = 1; n_dim <= 4; ++n_dim) {
      for (uint32_t m_dim = 1; m_dim <= 4; ++m_dim) {
        GemmMicrokernelTester()
          .mr(4).nr(4).kr(1).sr(1)
          .m(m_dim).n(n_dim).k(k_dim)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
      }
    }
  }
}
6526*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel at m = 4: n sweeps 5 through 7 (all above nr = 4) and k
// visits {1, 3, 5}.
TEST(F32_GEMM_RELU_4X4__SCALAR, n_gt_4) {
  for (uint32_t n_dim = 5; n_dim <= 7; ++n_dim) {
    for (size_t k_dim = 1; k_dim <= 5; k_dim += 2) {
      GemmMicrokernelTester()
        .mr(4).nr(4).kr(1).sr(1)
        .m(4).n(n_dim).k(k_dim)
        .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
    }
  }
}
6542*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel at m = 4: n sweeps 5 through 7 and k visits {1, 3, 5},
// with cn_stride(7) applied on every run.
TEST(F32_GEMM_RELU_4X4__SCALAR, n_gt_4_strided_cn) {
  for (uint32_t n_dim = 5; n_dim <= 7; ++n_dim) {
    for (size_t k_dim = 1; k_dim <= 5; k_dim += 2) {
      GemmMicrokernelTester()
        .mr(4).nr(4).kr(1).sr(1)
        .m(4).n(n_dim).k(k_dim)
        .cn_stride(7)
        .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
    }
  }
}
6559*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel at m = 4: n sweeps 5 through 7 and k visits {1, 3, 5},
// with a_stride(7) applied on every run.
TEST(F32_GEMM_RELU_4X4__SCALAR, n_gt_4_strided_a) {
  for (uint32_t n_dim = 5; n_dim <= 7; ++n_dim) {
    for (size_t k_dim = 1; k_dim <= 5; k_dim += 2) {
      GemmMicrokernelTester()
        .mr(4).nr(4).kr(1).sr(1)
        .m(4).n(n_dim).k(k_dim)
        .a_stride(7)
        .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
    }
  }
}
6576*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel: n sweeps 5 through 7, k visits {1, 3, 5} and m sweeps
// 1..4, each run using iterations(1).
TEST(F32_GEMM_RELU_4X4__SCALAR, n_gt_4_subtile) {
  for (uint32_t n_dim = 5; n_dim <= 7; ++n_dim) {
    for (size_t k_dim = 1; k_dim <= 5; k_dim += 2) {
      for (uint32_t m_dim = 1; m_dim <= 4; ++m_dim) {
        GemmMicrokernelTester()
          .mr(4).nr(4).kr(1).sr(1)
          .m(m_dim).n(n_dim).k(k_dim)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
      }
    }
  }
}
6595*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel at m = 4: n visits {8, 12} (both multiples of nr = 4) and
// k visits {1, 3, 5}.
TEST(F32_GEMM_RELU_4X4__SCALAR, n_div_4) {
  for (uint32_t n_dim = 8; n_dim <= 12; n_dim += 4) {
    for (size_t k_dim = 1; k_dim <= 5; k_dim += 2) {
      GemmMicrokernelTester()
        .mr(4).nr(4).kr(1).sr(1)
        .m(4).n(n_dim).k(k_dim)
        .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
    }
  }
}
6611*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel at m = 4: n visits {8, 12} and k visits {1, 3, 5}, with
// cn_stride(7) applied on every run.
TEST(F32_GEMM_RELU_4X4__SCALAR, n_div_4_strided_cn) {
  for (uint32_t n_dim = 8; n_dim <= 12; n_dim += 4) {
    for (size_t k_dim = 1; k_dim <= 5; k_dim += 2) {
      GemmMicrokernelTester()
        .mr(4).nr(4).kr(1).sr(1)
        .m(4).n(n_dim).k(k_dim)
        .cn_stride(7)
        .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
    }
  }
}
6628*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel at m = 4: n visits {8, 12} and k visits {1, 3, 5}, with
// a_stride(7) applied on every run.
TEST(F32_GEMM_RELU_4X4__SCALAR, n_div_4_strided_a) {
  for (uint32_t n_dim = 8; n_dim <= 12; n_dim += 4) {
    for (size_t k_dim = 1; k_dim <= 5; k_dim += 2) {
      GemmMicrokernelTester()
        .mr(4).nr(4).kr(1).sr(1)
        .m(4).n(n_dim).k(k_dim)
        .a_stride(7)
        .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
    }
  }
}
6645*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel: n visits {8, 12}, k visits {1, 3, 5} and m sweeps 1..4,
// each run using iterations(1).
TEST(F32_GEMM_RELU_4X4__SCALAR, n_div_4_subtile) {
  for (uint32_t n_dim = 8; n_dim <= 12; n_dim += 4) {
    for (size_t k_dim = 1; k_dim <= 5; k_dim += 2) {
      for (uint32_t m_dim = 1; m_dim <= 4; ++m_dim) {
        GemmMicrokernelTester()
          .mr(4).nr(4).kr(1).sr(1)
          .m(m_dim).n(n_dim).k(k_dim)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
      }
    }
  }
}
6664*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel: k visits {1, 3, 5}, n sweeps 1..4 and m sweeps 1..4, each
// run using cm_stride(7) and iterations(1).
TEST(F32_GEMM_RELU_4X4__SCALAR, strided_cm_subtile) {
  for (size_t k_dim = 1; k_dim <= 5; k_dim += 2) {
    for (uint32_t n_dim = 1; n_dim <= 4; ++n_dim) {
      for (uint32_t m_dim = 1; m_dim <= 4; ++m_dim) {
        GemmMicrokernelTester()
          .mr(4).nr(4).kr(1).sr(1)
          .m(m_dim).n(n_dim).k(k_dim)
          .cm_stride(7)
          .iterations(1)
          .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
      }
    }
  }
}
6684*4bdc9457SAndroid Build Coastguard Worker
// 4x4 scalar kernel: single run at m = 4, n = 4, k = 1 with cm_stride(7).
TEST(F32_GEMM_RELU_4X4__SCALAR, strided_cm) {
  GemmMicrokernelTester()
    .mr(4).nr(4).kr(1).sr(1)
    .m(4).n(4).k(1)
    .cm_stride(7)
    .Test(xnn_f32_gemm_relu_ukernel_4x4__scalar);
}
6697