// Copyright (c) Facebook, Inc. and its affiliates.
// All rights reserved.
//
// Copyright 2019 Google LLC
//
// This source code is licensed under the BSD-style license found in the
// LICENSE file in the root directory of this source tree.
//
// Auto-generated file. Do not edit!
// Specification: test/f32-gemm.yaml
// Generator: tools/generate-gemm-test.py
12*4bdc9457SAndroid Build Coastguard Worker
13*4bdc9457SAndroid Build Coastguard Worker
14*4bdc9457SAndroid Build Coastguard Worker #include <gtest/gtest.h>
15*4bdc9457SAndroid Build Coastguard Worker
16*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/allocator.h>
17*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/common.h>
18*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/isa-checks.h>
19*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/microparams-init.h>
20*4bdc9457SAndroid Build Coastguard Worker
21*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/gemm.h>
22*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/igemm.h>
23*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/ppmm.h>
24*4bdc9457SAndroid Build Coastguard Worker #include "gemm-microkernel-tester.h"
25*4bdc9457SAndroid Build Coastguard Worker
26*4bdc9457SAndroid Build Coastguard Worker
27*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_ARM && XNN_ENABLE_ASSEMBLY
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4, n = 4, k = 2.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, k_eq_2) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(4)
    .kr(1)
    .sr(1)
    .m(4)
    .n(4)
    .k(2)
    .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
}
39*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4, n = 4, k = 2
// and cn_stride set to 7.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, strided_cn) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(4)
    .kr(1)
    .sr(1)
    .m(4)
    .n(4)
    .k(2)
    .cn_stride(7)
    .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
}
52*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4, n = 4, k = 2
// and a_stride set to 5.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, k_eq_2_strided_a) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(4)
    .kr(1)
    .sr(1)
    .m(4)
    .n(4)
    .k(2)
    .a_stride(5)
    .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
}
65*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with k = 2 for every
// (m, n) pair with 1 <= m <= 4 and 1 <= n <= 4, using iterations(1) per case.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, k_eq_2_subtile) {
  for (uint32_t n = 1; n <= 4; n++) {
    for (uint32_t m = 1; m <= 4; m++) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(2)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
    }
  }
}
82*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with n = 4, k = 2 while
// m sweeps 1..4, using iterations(1) per case.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, k_eq_2_subtile_m) {
  for (uint32_t m = 1; m <= 4; m++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(4)
      .kr(1)
      .sr(1)
      .m(m)
      .n(4)
      .k(2)
      .iterations(1)
      .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
  }
}
97*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4, k = 2 while
// n sweeps 1..4, using iterations(1) per case.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, k_eq_2_subtile_n) {
  for (uint32_t n = 1; n <= 4; n++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(4)
      .kr(1)
      .sr(1)
      .m(4)
      .n(n)
      .k(2)
      .iterations(1)
      .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
  }
}
112*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4, n = 4 for
// every k in [1, 2) -- i.e. only k = 1.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, k_lt_2) {
  for (size_t k = 1; k < 2; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(4)
      .kr(1)
      .sr(1)
      .m(4)
      .n(4)
      .k(k)
      .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
  }
}
126*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4, n = 4 and
// a_stride set to 5 for every k in [1, 2) -- i.e. only k = 1.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, k_lt_2_strided_a) {
  for (size_t k = 1; k < 2; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(4)
      .kr(1)
      .sr(1)
      .m(4)
      .n(4)
      .k(k)
      .a_stride(5)
      .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
  }
}
141*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 for every k in [1, 2) and
// every (m, n) pair with 1 <= m <= 4 and 1 <= n <= 4, using iterations(1).
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, k_lt_2_subtile) {
  for (size_t k = 1; k < 2; k++) {
    for (uint32_t n = 1; n <= 4; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(4)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
      }
    }
  }
}
160*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4, n = 4 for
// every k in [3, 4) -- i.e. only k = 3.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, k_gt_2) {
  for (size_t k = 3; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(4)
      .kr(1)
      .sr(1)
      .m(4)
      .n(4)
      .k(k)
      .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
  }
}
174*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4, n = 4 and
// a_stride set to 7 for every k in [3, 4) -- i.e. only k = 3.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, k_gt_2_strided_a) {
  for (size_t k = 3; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(4)
      .kr(1)
      .sr(1)
      .m(4)
      .n(4)
      .k(k)
      .a_stride(7)
      .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
  }
}
189*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 for every k in [3, 4) and
// every (m, n) pair with 1 <= m <= 4 and 1 <= n <= 4, using iterations(1).
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, k_gt_2_subtile) {
  for (size_t k = 3; k < 4; k++) {
    for (uint32_t n = 1; n <= 4; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(4)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
      }
    }
  }
}
208*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4, n = 4 for
// even k values 4, 6, ..., 20.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, k_div_2) {
  for (size_t k = 4; k <= 20; k += 2) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(4)
      .kr(1)
      .sr(1)
      .m(4)
      .n(4)
      .k(k)
      .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
  }
}
222*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4, n = 4 and
// a_stride set to 23 for even k values 4, 6, ..., 20.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, k_div_2_strided_a) {
  for (size_t k = 4; k <= 20; k += 2) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(4)
      .kr(1)
      .sr(1)
      .m(4)
      .n(4)
      .k(k)
      .a_stride(23)
      .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
  }
}
237*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 for even k values
// 4, 6, ..., 20 and every (m, n) pair with 1 <= m <= 4 and 1 <= n <= 4,
// using iterations(1) per case.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, k_div_2_subtile) {
  for (size_t k = 4; k <= 20; k += 2) {
    for (uint32_t n = 1; n <= 4; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(4)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
      }
    }
  }
}
256*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4 for n in 5..7
// and k in {1, 4, 7, 10}.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, n_gt_4) {
  for (uint32_t n = 5; n < 8; n++) {
    for (size_t k = 1; k <= 10; k += 3) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
    }
  }
}
272*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4 and cn_stride
// set to 7 for n in 5..7 and k in {1, 4, 7, 10}.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, n_gt_4_strided_cn) {
  for (uint32_t n = 5; n < 8; n++) {
    for (size_t k = 1; k <= 10; k += 3) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .cn_stride(7)
        .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
    }
  }
}
289*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4 and a_stride
// set to 13 for n in 5..7 and k in {1, 4, 7, 10}.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, n_gt_4_strided_a) {
  for (uint32_t n = 5; n < 8; n++) {
    for (size_t k = 1; k <= 10; k += 3) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .a_stride(13)
        .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
    }
  }
}
306*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 for n in 5..7,
// k in {1, 4, 7, 10} and m in 1..4, using iterations(1) per case.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, n_gt_4_subtile) {
  for (uint32_t n = 5; n < 8; n++) {
    for (size_t k = 1; k <= 10; k += 3) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(4)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
      }
    }
  }
}
325*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4 for
// n in {8, 12} and k in {1, 4, 7, 10}.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, n_div_4) {
  for (uint32_t n = 8; n <= 12; n += 4) {
    for (size_t k = 1; k <= 10; k += 3) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
    }
  }
}
341*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4 and cn_stride
// set to 7 for n in {8, 12} and k in {1, 4, 7, 10}.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, n_div_4_strided_cn) {
  for (uint32_t n = 8; n <= 12; n += 4) {
    for (size_t k = 1; k <= 10; k += 3) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .cn_stride(7)
        .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
    }
  }
}
358*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4 and a_stride
// set to 13 for n in {8, 12} and k in {1, 4, 7, 10}.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, n_div_4_strided_a) {
  for (uint32_t n = 8; n <= 12; n += 4) {
    for (size_t k = 1; k <= 10; k += 3) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(4)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .a_stride(13)
        .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
    }
  }
}
375*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 for n in {8, 12},
// k in {1, 4, 7, 10} and m in 1..4, using iterations(1) per case.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, n_div_4_subtile) {
  for (uint32_t n = 8; n <= 12; n += 4) {
    for (size_t k = 1; k <= 10; k += 3) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(4)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
      }
    }
  }
}
394*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with cm_stride set to 7
// for k in {1, 4, 7, 10} and every (m, n) pair with 1 <= m <= 4 and
// 1 <= n <= 4, using iterations(1) per case.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, strided_cm_subtile) {
  for (size_t k = 1; k <= 10; k += 3) {
    for (uint32_t n = 1; n <= 4; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(4)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(7)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
      }
    }
  }
}
414*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64 with m = 4, n = 4, k = 2
// and cm_stride set to 7.
TEST(F32_GEMM_4X4__AARCH32_VFP_LD64, strided_cm) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(4)
    .kr(1)
    .sr(1)
    .m(4)
    .n(4)
    .k(2)
    .cm_stride(7)
    .Test(xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64);
}
427*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_ARM && XNN_ENABLE_ASSEMBLY
428*4bdc9457SAndroid Build Coastguard Worker
429*4bdc9457SAndroid Build Coastguard Worker
430*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Tests xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat with m = 3, n = 8, k = 1.
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, k_eq_1) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(3)
    .n(8)
    .k(1)
    .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
}
442*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat with m = 3, n = 8, k = 1
// and cn_stride set to 11.
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(3)
    .n(8)
    .k(1)
    .cn_stride(11)
    .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
}
455*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat with m = 3, n = 8, k = 1
// and a_stride set to 3.
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, k_eq_1_strided_a) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(3)
    .n(8)
    .k(1)
    .a_stride(3)
    .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
}
468*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat with k = 1 for every
// (m, n) pair with 1 <= m <= 3 and 1 <= n <= 8, using iterations(1) per case.
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 3; m++) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
    }
  }
}
485*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat with n = 8, k = 1 while
// m sweeps 1..3, using iterations(1) per case.
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_m) {
  for (uint32_t m = 1; m <= 3; m++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(m)
      .n(8)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
  }
}
500*4bdc9457SAndroid Build Coastguard Worker
// Tests xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat with m = 3, k = 1 while
// n sweeps 1..8, using iterations(1) per case.
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(3)
      .n(n)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
  }
}
515*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, k_gt_1) {
  // Runs the m=3, n=8 configuration for every k in [2, 10).
  for (size_t depth = 2; depth < 10; ++depth) {
    GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(8).k(depth)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
  }
}
529*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, k_gt_1_strided_a) {
  // Same k sweep as k_gt_1 ([2, 10) at m=3, n=8), but with a_stride set to 11.
  for (size_t depth = 2; depth < 10; ++depth) {
    GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(8).k(depth)
        .a_stride(11)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
  }
}
544*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, k_gt_1_subtile) {
  // Exhaustive sweep: k in [2, 10) (outermost), n in 1..8, m in 1..3 (innermost),
  // each configuration run with iterations(1).
  for (size_t depth = 2; depth < 10; ++depth) {
    for (uint32_t cols = 1; cols <= 8; ++cols) {
      for (uint32_t rows = 1; rows <= 3; ++rows) {
        GemmMicrokernelTester()
            .mr(3).nr(8).kr(1).sr(1)
            .m(rows).n(cols).k(depth)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
      }
    }
  }
}
563*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, n_gt_8) {
  // n ranges over [9, 16), i.e. values above the nr setting of 8; for each n,
  // k takes the values 1, 3, 5 with m fixed at 3.
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 5; depth += 2) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(3).n(cols).k(depth)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
    }
  }
}
579*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_cn) {
  // Same sweep as n_gt_8 (n in [9, 16), k in {1, 3, 5}, m=3), with cn_stride set to 11.
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 5; depth += 2) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(3).n(cols).k(depth)
          .cn_stride(11)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
    }
  }
}
596*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_a) {
  // Same sweep as n_gt_8 (n in [9, 16), k in {1, 3, 5}, m=3), with a_stride set to 7.
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 5; depth += 2) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(3).n(cols).k(depth)
          .a_stride(7)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
    }
  }
}
613*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, n_gt_8_subtile) {
  // n in [9, 16) (outermost), k in {1, 3, 5}, m in 1..3 (innermost);
  // each configuration is run with iterations(1).
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 5; depth += 2) {
      for (uint32_t rows = 1; rows <= 3; ++rows) {
        GemmMicrokernelTester()
            .mr(3).nr(8).kr(1).sr(1)
            .m(rows).n(cols).k(depth)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
      }
    }
  }
}
632*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, n_div_8) {
  // n takes the multiples of 8 in [16, 24] (16 and 24); for each n,
  // k takes the values 1, 3, 5 with m fixed at 3.
  for (uint32_t cols = 16; cols <= 24; cols += 8) {
    for (size_t depth = 1; depth <= 5; depth += 2) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(3).n(cols).k(depth)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
    }
  }
}
648*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, n_div_8_strided_cn) {
  // Same sweep as n_div_8 (n in {16, 24}, k in {1, 3, 5}, m=3), with cn_stride set to 11.
  for (uint32_t cols = 16; cols <= 24; cols += 8) {
    for (size_t depth = 1; depth <= 5; depth += 2) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(3).n(cols).k(depth)
          .cn_stride(11)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
    }
  }
}
665*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, n_div_8_strided_a) {
  // Same sweep as n_div_8 (n in {16, 24}, k in {1, 3, 5}, m=3), with a_stride set to 7.
  for (uint32_t cols = 16; cols <= 24; cols += 8) {
    for (size_t depth = 1; depth <= 5; depth += 2) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(3).n(cols).k(depth)
          .a_stride(7)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
    }
  }
}
682*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, n_div_8_subtile) {
  // n in {16, 24} (outermost), k in {1, 3, 5}, m in 1..3 (innermost);
  // each configuration is run with iterations(1).
  for (uint32_t cols = 16; cols <= 24; cols += 8) {
    for (size_t depth = 1; depth <= 5; depth += 2) {
      for (uint32_t rows = 1; rows <= 3; ++rows) {
        GemmMicrokernelTester()
            .mr(3).nr(8).kr(1).sr(1)
            .m(rows).n(cols).k(depth)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
      }
    }
  }
}
701*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, strided_cm_subtile) {
  // k in {1, 3, 5} (outermost), n in 1..8, m in 1..3 (innermost), all with
  // cm_stride set to 11 and iterations(1).
  for (size_t depth = 1; depth <= 5; depth += 2) {
    for (uint32_t cols = 1; cols <= 8; ++cols) {
      for (uint32_t rows = 1; rows <= 3; ++rows) {
        GemmMicrokernelTester()
            .mr(3).nr(8).kr(1).sr(1)
            .m(rows).n(cols).k(depth)
            .cm_stride(11)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
      }
    }
  }
}
721*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_LOADSPLAT, strided_cm) {
  // Single configuration: m=3, n=8, k=1 with cm_stride set to 11.
  GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(1)
      .m(3).n(8).k(1)
      .cm_stride(11)
      .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat);
}
734*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
735*4bdc9457SAndroid Build Coastguard Worker
736*4bdc9457SAndroid Build Coastguard Worker
737*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, k_eq_4) {
  // Single configuration: m=3, n=8 (matching the mr/nr settings) with k=4.
  GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(1)
      .m(3).n(8).k(4)
      .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
}
749*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, strided_cn) {
  // Single configuration: m=3, n=8, k=4 with cn_stride set to 11.
  GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(1)
      .m(3).n(8).k(4)
      .cn_stride(11)
      .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
}
762*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, k_eq_4_strided_a) {
  // Single configuration: m=3, n=8, k=4 with a_stride set to 7.
  GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(1)
      .m(3).n(8).k(4)
      .a_stride(7)
      .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
}
775*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, k_eq_4_subtile) {
  // With k fixed at 4: n in 1..8 (outer), m in 1..3 (inner);
  // each configuration is run with iterations(1).
  for (uint32_t cols = 1; cols <= 8; ++cols) {
    for (uint32_t rows = 1; rows <= 3; ++rows) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(rows).n(cols).k(4)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
    }
  }
}
792*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, k_eq_4_subtile_m) {
  // Sweeps m over 1..3 with n fixed at 8 and k fixed at 4;
  // each configuration is run with iterations(1).
  for (uint32_t rows = 1; rows <= 3; ++rows) {
    GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(rows).n(8).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
  }
}
807*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, k_eq_4_subtile_n) {
  // Sweeps n over 1..8 with m fixed at 3 and k fixed at 4;
  // each configuration is run with iterations(1).
  for (uint32_t cols = 1; cols <= 8; ++cols) {
    GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(cols).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
  }
}
822*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, k_lt_4) {
  // Runs the m=3, n=8 configuration for every k in [1, 4).
  for (size_t depth = 1; depth < 4; ++depth) {
    GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(8).k(depth)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
  }
}
836*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, k_lt_4_strided_a) {
  // Same k sweep as k_lt_4 ([1, 4) at m=3, n=8), but with a_stride set to 7.
  for (size_t depth = 1; depth < 4; ++depth) {
    GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(8).k(depth)
        .a_stride(7)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
  }
}
851*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, k_lt_4_subtile) {
  // k in [1, 4) (outermost), n in 1..8, m in 1..3 (innermost);
  // each configuration is run with iterations(1).
  for (size_t depth = 1; depth < 4; ++depth) {
    for (uint32_t cols = 1; cols <= 8; ++cols) {
      for (uint32_t rows = 1; rows <= 3; ++rows) {
        GemmMicrokernelTester()
            .mr(3).nr(8).kr(1).sr(1)
            .m(rows).n(cols).k(depth)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
      }
    }
  }
}
870*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, k_gt_4) {
  // Runs the m=3, n=8 configuration for every k in [5, 8).
  for (size_t depth = 5; depth < 8; ++depth) {
    GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(8).k(depth)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
  }
}
884*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, k_gt_4_strided_a) {
  // Same k sweep as k_gt_4 ([5, 8) at m=3, n=8), but with a_stride set to 11.
  for (size_t depth = 5; depth < 8; ++depth) {
    GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(8).k(depth)
        .a_stride(11)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
  }
}
899*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, k_gt_4_subtile) {
  // k in [5, 8) (outermost), n in 1..8, m in 1..3 (innermost);
  // each configuration is run with iterations(1).
  for (size_t depth = 5; depth < 8; ++depth) {
    for (uint32_t cols = 1; cols <= 8; ++cols) {
      for (uint32_t rows = 1; rows <= 3; ++rows) {
        GemmMicrokernelTester()
            .mr(3).nr(8).kr(1).sr(1)
            .m(rows).n(cols).k(depth)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
      }
    }
  }
}
918*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, k_div_4) {
  // Runs the m=3, n=8 configuration for k = 8, 12, ..., 40 (step of 4).
  for (size_t depth = 8; depth <= 40; depth += 4) {
    GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(8).k(depth)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
  }
}
932*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, k_div_4_strided_a) {
  // Same k sweep as k_div_4 (8, 12, ..., 40 at m=3, n=8), but with a_stride set to 43.
  for (size_t depth = 8; depth <= 40; depth += 4) {
    GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(8).k(depth)
        .a_stride(43)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
  }
}
947*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, k_div_4_subtile) {
  // k = 8, 12, ..., 40 (outermost), n in 1..8, m in 1..3 (innermost);
  // each configuration is run with iterations(1).
  for (size_t depth = 8; depth <= 40; depth += 4) {
    for (uint32_t cols = 1; cols <= 8; ++cols) {
      for (uint32_t rows = 1; rows <= 3; ++rows) {
        GemmMicrokernelTester()
            .mr(3).nr(8).kr(1).sr(1)
            .m(rows).n(cols).k(depth)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
      }
    }
  }
}
966*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, n_gt_8) {
  // n ranges over [9, 16), i.e. values above the nr setting of 8; for each n,
  // k takes the values 1, 6, 11, 16 (step of 5, bounded by 20) with m fixed at 3.
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(3).n(cols).k(depth)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
    }
  }
}
982*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, n_gt_8_strided_cn) {
  // Same sweep as n_gt_8 (n in [9, 16), k in {1, 6, 11, 16}, m=3), with cn_stride set to 11.
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(3).n(cols).k(depth)
          .cn_stride(11)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
    }
  }
}
999*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, n_gt_8_strided_a) {
  // Same sweep as n_gt_8 (n in [9, 16), k in {1, 6, 11, 16}, m=3), with a_stride set to 23.
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(3).n(cols).k(depth)
          .a_stride(23)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
    }
  }
}
1016*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8__wasmsimd_splat for n = 9..15 (above nr=8),
// k in {1, 6, 11, 16} and every m in 1..3, with iterations(1) per configuration.
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
      }
    }
  }
}
1035*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8__wasmsimd_splat with m=3 for n in {16, 24}
// (multiples of nr=8) and k in {1, 6, 11, 16}.
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(3)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
    }
  }
}
1051*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8__wasmsimd_splat with m=3 for n in {16, 24}
// (multiples of nr=8) and k in {1, 6, 11, 16}, with cn_stride set to 11.
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(3)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
    }
  }
}
1068*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8__wasmsimd_splat with m=3 for n in {16, 24}
// (multiples of nr=8) and k in {1, 6, 11, 16}, with a_stride set to 23.
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(3)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
    }
  }
}
1085*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8__wasmsimd_splat for n in {16, 24} (multiples of nr=8),
// k in {1, 6, 11, 16} and every m in 1..3, with iterations(1) per configuration.
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
      }
    }
  }
}
1104*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8__wasmsimd_splat for k in {1, 6, 11, 16}, every n in 1..8
// and every m in 1..3, with cm_stride set to 11 and iterations(1) per configuration.
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, strided_cm_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
      }
    }
  }
}
1124*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8__wasmsimd_splat once on a full 3x8 tile with k=4
// and cm_stride set to 11.
TEST(F32_GEMM_3X8__WASMSIMD_SPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(3)
    .n(8)
    .k(4)
    .cm_stride(11)
    .Test(xnn_f32_gemm_ukernel_3x8__wasmsimd_splat);
}
1137*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
1138*4bdc9457SAndroid Build Coastguard Worker
1139*4bdc9457SAndroid Build Coastguard Worker
1140*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd once on a full 3x8 tile with k=4
// (tester configured with kr=1, sr=4).
TEST(F32_GEMM_3X8S4__WASMSIMD, k_eq_4) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(3)
    .n(8)
    .k(4)
    .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
}
1152*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd once on a full 3x8 tile with k=4
// and cn_stride set to 11.
TEST(F32_GEMM_3X8S4__WASMSIMD, strided_cn) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(3)
    .n(8)
    .k(4)
    .cn_stride(11)
    .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
}
1165*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd once on a full 3x8 tile with k=4
// and a_stride set to 7.
TEST(F32_GEMM_3X8S4__WASMSIMD, k_eq_4_strided_a) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(3)
    .n(8)
    .k(4)
    .a_stride(7)
    .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
}
1178*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd with k=4 for every n in 1..8 and
// every m in 1..3, with iterations(1) per configuration.
TEST(F32_GEMM_3X8S4__WASMSIMD, k_eq_4_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 3; m++) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(m)
        .n(n)
        .k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
    }
  }
}
1195*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd with n=8 and k=4 for every m in 1..3,
// with iterations(1) per configuration.
TEST(F32_GEMM_3X8S4__WASMSIMD, k_eq_4_subtile_m) {
  for (uint32_t m = 1; m <= 3; m++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(m)
      .n(8)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
  }
}
1210*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd with m=3 and k=4 for every n in 1..8,
// with iterations(1) per configuration.
TEST(F32_GEMM_3X8S4__WASMSIMD, k_eq_4_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(n)
      .k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
  }
}
1225*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd on a full 3x8 tile for k = 1..3.
TEST(F32_GEMM_3X8S4__WASMSIMD, k_lt_4) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
  }
}
1239*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd on a full 3x8 tile for k = 1..3,
// with a_stride set to 7.
TEST(F32_GEMM_3X8S4__WASMSIMD, k_lt_4_strided_a) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .a_stride(7)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
  }
}
1254*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd for k = 1..3, every n in 1..8 and
// every m in 1..3, with iterations(1) per configuration.
TEST(F32_GEMM_3X8S4__WASMSIMD, k_lt_4_subtile) {
  for (size_t k = 1; k < 4; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
      }
    }
  }
}
1273*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd on a full 3x8 tile for k = 5..7.
TEST(F32_GEMM_3X8S4__WASMSIMD, k_gt_4) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
  }
}
1287*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd on a full 3x8 tile for k = 5..7,
// with a_stride set to 11.
TEST(F32_GEMM_3X8S4__WASMSIMD, k_gt_4_strided_a) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .a_stride(11)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
  }
}
1302*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd for k = 5..7, every n in 1..8 and
// every m in 1..3, with iterations(1) per configuration.
TEST(F32_GEMM_3X8S4__WASMSIMD, k_gt_4_subtile) {
  for (size_t k = 5; k < 8; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
      }
    }
  }
}
1321*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd on a full 3x8 tile for k = 8, 12, ..., 40
// (multiples of 4).
TEST(F32_GEMM_3X8S4__WASMSIMD, k_div_4) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
  }
}
1335*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd on a full 3x8 tile for k = 8, 12, ..., 40
// (multiples of 4), with a_stride set to 43.
TEST(F32_GEMM_3X8S4__WASMSIMD, k_div_4_strided_a) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .a_stride(43)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
  }
}
1350*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd for k = 8, 12, ..., 40 (multiples of 4),
// every n in 1..8 and every m in 1..3, with iterations(1) per configuration.
TEST(F32_GEMM_3X8S4__WASMSIMD, k_div_4_subtile) {
  for (size_t k = 8; k <= 40; k += 4) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
      }
    }
  }
}
1369*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd with m=3 for n = 9..15 (above nr=8)
// and k in {1, 6, 11, 16}.
TEST(F32_GEMM_3X8S4__WASMSIMD, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
    }
  }
}
1385*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd with m=3 for n = 9..15 (above nr=8)
// and k in {1, 6, 11, 16}, with cn_stride set to 11.
TEST(F32_GEMM_3X8S4__WASMSIMD, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
    }
  }
}
1402*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd with m=3 for n = 9..15 (above nr=8)
// and k in {1, 6, 11, 16}, with a_stride set to 23.
TEST(F32_GEMM_3X8S4__WASMSIMD, n_gt_8_strided_a) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
    }
  }
}
1419*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd for n = 9..15 (above nr=8),
// k in {1, 6, 11, 16} and every m in 1..3, with iterations(1) per configuration.
TEST(F32_GEMM_3X8S4__WASMSIMD, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
      }
    }
  }
}
1438*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd with m=3 for n in {16, 24}
// (multiples of nr=8) and k in {1, 6, 11, 16}.
TEST(F32_GEMM_3X8S4__WASMSIMD, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
    }
  }
}
1454*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd with m=3 for n in {16, 24}
// (multiples of nr=8) and k in {1, 6, 11, 16}, with cn_stride set to 11.
TEST(F32_GEMM_3X8S4__WASMSIMD, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
    }
  }
}
1471*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd with m=3 for n in {16, 24}
// (multiples of nr=8) and k in {1, 6, 11, 16}, with a_stride set to 23.
TEST(F32_GEMM_3X8S4__WASMSIMD, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
    }
  }
}
1488*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd for n in {16, 24} (multiples of nr=8),
// k in {1, 6, 11, 16} and every m in 1..3, with iterations(1) per configuration.
TEST(F32_GEMM_3X8S4__WASMSIMD, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
      }
    }
  }
}
1507*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmsimd with cm_stride = 11 and
// iterations = 1 for k in {1, 6, 11, 16}, n in [1, 8] and m in [1, 3].
TEST(F32_GEMM_3X8S4__WASMSIMD, strided_cm_subtile) {
  for (size_t k_value = 1; k_value <= 20; k_value += 5) {
    for (uint32_t n_value = 1; n_value <= 8; n_value++) {
      for (uint32_t m_value = 1; m_value <= 3; m_value++) {
        GemmMicrokernelTester tester;
        tester.mr(3).nr(8).kr(1).sr(4)
            .m(m_value).n(n_value).k(k_value)
            .cm_stride(11)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
      }
    }
  }
}
1527*4bdc9457SAndroid Build Coastguard Worker
// Single run of xnn_f32_gemm_ukernel_3x8s4__wasmsimd with m = 3, n = 8,
// k = 4 and cm_stride = 11.
TEST(F32_GEMM_3X8S4__WASMSIMD, strided_cm) {
  GemmMicrokernelTester tester;
  tester.mr(3).nr(8).kr(1).sr(4)
      .m(3).n(8).k(4)
      .cm_stride(11)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmsimd);
}
1540*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
1541*4bdc9457SAndroid Build Coastguard Worker
1542*4bdc9457SAndroid Build Coastguard Worker
1543*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Single run of xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4, n = 2, k = 4.
TEST(F32_GEMM_4X2C4__WASMSIMD, k_eq_4) {
  GemmMicrokernelTester tester;
  tester.mr(4).nr(2).kr(4).sr(1)
      .m(4).n(2).k(4)
      .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
}
1555*4bdc9457SAndroid Build Coastguard Worker
// Single run of xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4, n = 2,
// k = 4 and cn_stride = 5.
TEST(F32_GEMM_4X2C4__WASMSIMD, strided_cn) {
  GemmMicrokernelTester tester;
  tester.mr(4).nr(2).kr(4).sr(1)
      .m(4).n(2).k(4)
      .cn_stride(5)
      .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
}
1568*4bdc9457SAndroid Build Coastguard Worker
// Single run of xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4, n = 2,
// k = 4 and a_stride = 7.
TEST(F32_GEMM_4X2C4__WASMSIMD, k_eq_4_strided_a) {
  GemmMicrokernelTester tester;
  tester.mr(4).nr(2).kr(4).sr(1)
      .m(4).n(2).k(4)
      .a_stride(7)
      .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
}
1581*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with k = 4 and iterations = 1
// for every n in [1, 2] and m in [1, 4].
TEST(F32_GEMM_4X2C4__WASMSIMD, k_eq_4_subtile) {
  for (uint32_t n_value = 1; n_value <= 2; n_value++) {
    for (uint32_t m_value = 1; m_value <= 4; m_value++) {
      GemmMicrokernelTester tester;
      tester.mr(4).nr(2).kr(4).sr(1)
          .m(m_value).n(n_value).k(4)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
    }
  }
}
1598*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with n = 2, k = 4 and
// iterations = 1 for every m in [1, 4].
TEST(F32_GEMM_4X2C4__WASMSIMD, k_eq_4_subtile_m) {
  for (uint32_t m_value = 1; m_value <= 4; m_value++) {
    GemmMicrokernelTester tester;
    tester.mr(4).nr(2).kr(4).sr(1)
        .m(m_value).n(2).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
  }
}
1613*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4, k = 4 and
// iterations = 1 for every n in [1, 2].
TEST(F32_GEMM_4X2C4__WASMSIMD, k_eq_4_subtile_n) {
  for (uint32_t n_value = 1; n_value <= 2; n_value++) {
    GemmMicrokernelTester tester;
    tester.mr(4).nr(2).kr(4).sr(1)
        .m(4).n(n_value).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
  }
}
1628*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4 and n = 2 for every
// k in [1, 3].
TEST(F32_GEMM_4X2C4__WASMSIMD, k_lt_4) {
  for (size_t k_value = 1; k_value < 4; k_value++) {
    GemmMicrokernelTester tester;
    tester.mr(4).nr(2).kr(4).sr(1)
        .m(4).n(2).k(k_value)
        .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
  }
}
1642*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4, n = 2 and
// a_stride = 7 for every k in [1, 3].
TEST(F32_GEMM_4X2C4__WASMSIMD, k_lt_4_strided_a) {
  for (size_t k_value = 1; k_value < 4; k_value++) {
    GemmMicrokernelTester tester;
    tester.mr(4).nr(2).kr(4).sr(1)
        .m(4).n(2).k(k_value)
        .a_stride(7)
        .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
  }
}
1657*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with iterations = 1 for every
// k in [1, 3], n in [1, 2] and m in [1, 4].
TEST(F32_GEMM_4X2C4__WASMSIMD, k_lt_4_subtile) {
  for (size_t k_value = 1; k_value < 4; k_value++) {
    for (uint32_t n_value = 1; n_value <= 2; n_value++) {
      for (uint32_t m_value = 1; m_value <= 4; m_value++) {
        GemmMicrokernelTester tester;
        tester.mr(4).nr(2).kr(4).sr(1)
            .m(m_value).n(n_value).k(k_value)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
      }
    }
  }
}
1676*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4 and n = 2 for every
// k in [5, 7].
TEST(F32_GEMM_4X2C4__WASMSIMD, k_gt_4) {
  for (size_t k_value = 5; k_value < 8; k_value++) {
    GemmMicrokernelTester tester;
    tester.mr(4).nr(2).kr(4).sr(1)
        .m(4).n(2).k(k_value)
        .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
  }
}
1690*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4, n = 2 and
// a_stride = 11 for every k in [5, 7].
TEST(F32_GEMM_4X2C4__WASMSIMD, k_gt_4_strided_a) {
  for (size_t k_value = 5; k_value < 8; k_value++) {
    GemmMicrokernelTester tester;
    tester.mr(4).nr(2).kr(4).sr(1)
        .m(4).n(2).k(k_value)
        .a_stride(11)
        .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
  }
}
1705*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with iterations = 1 for every
// k in [5, 7], n in [1, 2] and m in [1, 4].
TEST(F32_GEMM_4X2C4__WASMSIMD, k_gt_4_subtile) {
  for (size_t k_value = 5; k_value < 8; k_value++) {
    for (uint32_t n_value = 1; n_value <= 2; n_value++) {
      for (uint32_t m_value = 1; m_value <= 4; m_value++) {
        GemmMicrokernelTester tester;
        tester.mr(4).nr(2).kr(4).sr(1)
            .m(m_value).n(n_value).k(k_value)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
      }
    }
  }
}
1724*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4 and n = 2 for
// k = 8, 12, ..., 40 (step 4).
TEST(F32_GEMM_4X2C4__WASMSIMD, k_div_4) {
  for (size_t k_value = 8; k_value <= 40; k_value += 4) {
    GemmMicrokernelTester tester;
    tester.mr(4).nr(2).kr(4).sr(1)
        .m(4).n(2).k(k_value)
        .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
  }
}
1738*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4, n = 2 and
// a_stride = 43 for k = 8, 12, ..., 40 (step 4).
TEST(F32_GEMM_4X2C4__WASMSIMD, k_div_4_strided_a) {
  for (size_t k_value = 8; k_value <= 40; k_value += 4) {
    GemmMicrokernelTester tester;
    tester.mr(4).nr(2).kr(4).sr(1)
        .m(4).n(2).k(k_value)
        .a_stride(43)
        .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
  }
}
1753*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with iterations = 1 for
// k = 8, 12, ..., 40 (step 4), n in [1, 2] and m in [1, 4].
TEST(F32_GEMM_4X2C4__WASMSIMD, k_div_4_subtile) {
  for (size_t k_value = 8; k_value <= 40; k_value += 4) {
    for (uint32_t n_value = 1; n_value <= 2; n_value++) {
      for (uint32_t m_value = 1; m_value <= 4; m_value++) {
        GemmMicrokernelTester tester;
        tester.mr(4).nr(2).kr(4).sr(1)
            .m(m_value).n(n_value).k(k_value)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
      }
    }
  }
}
1772*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4 for n = 3 (the only
// value the n loop visits) and k in {1, 6, 11, 16}.
TEST(F32_GEMM_4X2C4__WASMSIMD, n_gt_2) {
  for (uint32_t n_value = 3; n_value < 4; n_value++) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      GemmMicrokernelTester tester;
      tester.mr(4).nr(2).kr(4).sr(1)
          .m(4).n(n_value).k(k_value)
          .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
    }
  }
}
1788*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4 and cn_stride = 5
// for n = 3 (the only value the n loop visits) and k in {1, 6, 11, 16}.
TEST(F32_GEMM_4X2C4__WASMSIMD, n_gt_2_strided_cn) {
  for (uint32_t n_value = 3; n_value < 4; n_value++) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      GemmMicrokernelTester tester;
      tester.mr(4).nr(2).kr(4).sr(1)
          .m(4).n(n_value).k(k_value)
          .cn_stride(5)
          .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
    }
  }
}
1805*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4 and a_stride = 23
// for n = 3 (the only value the n loop visits) and k in {1, 6, 11, 16}.
TEST(F32_GEMM_4X2C4__WASMSIMD, n_gt_2_strided_a) {
  for (uint32_t n_value = 3; n_value < 4; n_value++) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      GemmMicrokernelTester tester;
      tester.mr(4).nr(2).kr(4).sr(1)
          .m(4).n(n_value).k(k_value)
          .a_stride(23)
          .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
    }
  }
}
1822*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with iterations = 1 for n = 3
// (the only value the n loop visits), k in {1, 6, 11, 16} and m in [1, 4].
TEST(F32_GEMM_4X2C4__WASMSIMD, n_gt_2_subtile) {
  for (uint32_t n_value = 3; n_value < 4; n_value++) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      for (uint32_t m_value = 1; m_value <= 4; m_value++) {
        GemmMicrokernelTester tester;
        tester.mr(4).nr(2).kr(4).sr(1)
            .m(m_value).n(n_value).k(k_value)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
      }
    }
  }
}
1841*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4 for n in {4, 6} and
// k in {1, 6, 11, 16}.
TEST(F32_GEMM_4X2C4__WASMSIMD, n_div_2) {
  for (uint32_t n_value = 4; n_value <= 6; n_value += 2) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      GemmMicrokernelTester tester;
      tester.mr(4).nr(2).kr(4).sr(1)
          .m(4).n(n_value).k(k_value)
          .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
    }
  }
}
1857*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4 and cn_stride = 5
// for n in {4, 6} and k in {1, 6, 11, 16}.
TEST(F32_GEMM_4X2C4__WASMSIMD, n_div_2_strided_cn) {
  for (uint32_t n_value = 4; n_value <= 6; n_value += 2) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      GemmMicrokernelTester tester;
      tester.mr(4).nr(2).kr(4).sr(1)
          .m(4).n(n_value).k(k_value)
          .cn_stride(5)
          .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
    }
  }
}
1874*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4 and a_stride = 23
// for n in {4, 6} and k in {1, 6, 11, 16}.
TEST(F32_GEMM_4X2C4__WASMSIMD, n_div_2_strided_a) {
  for (uint32_t n_value = 4; n_value <= 6; n_value += 2) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      GemmMicrokernelTester tester;
      tester.mr(4).nr(2).kr(4).sr(1)
          .m(4).n(n_value).k(k_value)
          .a_stride(23)
          .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
    }
  }
}
1891*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with iterations = 1 for
// n in {4, 6}, k in {1, 6, 11, 16} and m in [1, 4].
TEST(F32_GEMM_4X2C4__WASMSIMD, n_div_2_subtile) {
  for (uint32_t n_value = 4; n_value <= 6; n_value += 2) {
    for (size_t k_value = 1; k_value <= 20; k_value += 5) {
      for (uint32_t m_value = 1; m_value <= 4; m_value++) {
        GemmMicrokernelTester tester;
        tester.mr(4).nr(2).kr(4).sr(1)
            .m(m_value).n(n_value).k(k_value)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
      }
    }
  }
}
1910*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x2c4__wasmsimd with cm_stride = 5 and
// iterations = 1 for k in {1, 6, 11, 16}, n in [1, 2] and m in [1, 4].
TEST(F32_GEMM_4X2C4__WASMSIMD, strided_cm_subtile) {
  for (size_t k_value = 1; k_value <= 20; k_value += 5) {
    for (uint32_t n_value = 1; n_value <= 2; n_value++) {
      for (uint32_t m_value = 1; m_value <= 4; m_value++) {
        GemmMicrokernelTester tester;
        tester.mr(4).nr(2).kr(4).sr(1)
            .m(m_value).n(n_value).k(k_value)
            .cm_stride(5)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
      }
    }
  }
}
1930*4bdc9457SAndroid Build Coastguard Worker
// Single run of xnn_f32_gemm_ukernel_4x2c4__wasmsimd with m = 4, n = 2,
// k = 4 and cm_stride = 5.
TEST(F32_GEMM_4X2C4__WASMSIMD, strided_cm) {
  GemmMicrokernelTester tester;
  tester.mr(4).nr(2).kr(4).sr(1)
      .m(4).n(2).k(4)
      .cm_stride(5)
      .Test(xnn_f32_gemm_ukernel_4x2c4__wasmsimd);
}
1943*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
1944*4bdc9457SAndroid Build Coastguard Worker
1945*4bdc9457SAndroid Build Coastguard Worker
1946*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Single run of xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat with m = 4,
// n = 8 and k = 1.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, k_eq_1) {
  GemmMicrokernelTester tester;
  tester.mr(4).nr(8).kr(1).sr(1)
      .m(4).n(8).k(1)
      .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
}
1958*4bdc9457SAndroid Build Coastguard Worker
// Single run of xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat with m = 4,
// n = 8, k = 1 and cn_stride = 11.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, strided_cn) {
  GemmMicrokernelTester tester;
  tester.mr(4).nr(8).kr(1).sr(1)
      .m(4).n(8).k(1)
      .cn_stride(11)
      .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
}
1971*4bdc9457SAndroid Build Coastguard Worker
// Single run of xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat with m = 4,
// n = 8, k = 1 and a_stride = 3.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, k_eq_1_strided_a) {
  GemmMicrokernelTester tester;
  tester.mr(4).nr(8).kr(1).sr(1)
      .m(4).n(8).k(1)
      .a_stride(3)
      .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
}
1984*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat with k = 1 and
// iterations = 1 for every n in [1, 8] and m in [1, 4].
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile) {
  for (uint32_t n_value = 1; n_value <= 8; n_value++) {
    for (uint32_t m_value = 1; m_value <= 4; m_value++) {
      GemmMicrokernelTester tester;
      tester.mr(4).nr(8).kr(1).sr(1)
          .m(m_value).n(n_value).k(1)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
    }
  }
}
2001*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat with n = 8, k = 1 and
// iterations = 1 for every m in [1, 4].
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_m) {
  for (uint32_t m_value = 1; m_value <= 4; m_value++) {
    GemmMicrokernelTester tester;
    tester.mr(4).nr(8).kr(1).sr(1)
        .m(m_value).n(8).k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
  }
}
2016*4bdc9457SAndroid Build Coastguard Worker
// k fixed at 1 and m fixed at 4; n is swept over [1, 8], one iteration each.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_n) {
  for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(1)
        .m(4).n(n_size).k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
  }
}
2031*4bdc9457SAndroid Build Coastguard Worker
// m = 4, n = 8; k is swept over 2..9.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, k_gt_1) {
  for (size_t k_size = 2; k_size < 10; ++k_size) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(1)
        .m(4).n(8).k(k_size)
        .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
  }
}
2045*4bdc9457SAndroid Build Coastguard Worker
// m = 4, n = 8; k is swept over 2..9 with a_stride set to 11.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, k_gt_1_strided_a) {
  for (size_t k_size = 2; k_size < 10; ++k_size) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(1)
        .m(4).n(8).k(k_size)
        .a_stride(11)
        .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
  }
}
2060*4bdc9457SAndroid Build Coastguard Worker
// k in 2..9, n in [1, 8], m in [1, 4]; each combination is run for one
// iteration.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, k_gt_1_subtile) {
  for (size_t k_size = 2; k_size < 10; ++k_size) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
      }
    }
  }
}
2079*4bdc9457SAndroid Build Coastguard Worker
// m = 4; n is swept over 9..15 and k over {1, 3, 5}.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, n_gt_8) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(4).n(n_size).k(k_size)
          .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
    }
  }
}
2095*4bdc9457SAndroid Build Coastguard Worker
// m = 4; n is swept over 9..15 and k over {1, 3, 5}, with cn_stride set to 11.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_cn) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(4).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
    }
  }
}
2112*4bdc9457SAndroid Build Coastguard Worker
// m = 4; n is swept over 9..15 and k over {1, 3, 5}, with a_stride set to 7.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_a) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(4).n(n_size).k(k_size)
          .a_stride(7)
          .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
    }
  }
}
2129*4bdc9457SAndroid Build Coastguard Worker
// n in 9..15, k in {1, 3, 5}, m in [1, 4]; each combination is run for one
// iteration.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, n_gt_8_subtile) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
      }
    }
  }
}
2148*4bdc9457SAndroid Build Coastguard Worker
// m = 4; n takes the values 16 and 24, k takes {1, 3, 5}.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, n_div_8) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(4).n(n_size).k(k_size)
          .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
    }
  }
}
2164*4bdc9457SAndroid Build Coastguard Worker
// m = 4; n takes 16 and 24, k takes {1, 3, 5}, with cn_stride set to 11.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, n_div_8_strided_cn) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(4).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
    }
  }
}
2181*4bdc9457SAndroid Build Coastguard Worker
// m = 4; n takes 16 and 24, k takes {1, 3, 5}, with a_stride set to 7.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, n_div_8_strided_a) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(4).n(n_size).k(k_size)
          .a_stride(7)
          .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
    }
  }
}
2198*4bdc9457SAndroid Build Coastguard Worker
// n in {16, 24}, k in {1, 3, 5}, m in [1, 4]; each combination is run for one
// iteration.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, n_div_8_subtile) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
      }
    }
  }
}
2217*4bdc9457SAndroid Build Coastguard Worker
// k in {1, 3, 5}, n in [1, 8], m in [1, 4], with cm_stride set to 11; each
// combination is run for one iteration.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, strided_cm_subtile) {
  for (size_t k_size = 1; k_size <= 5; k_size += 2) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .cm_stride(11)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
      }
    }
  }
}
2237*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 4, n = 8, k = 1, with cm_stride set to 11.
TEST(F32_GEMM_4X8__WASMSIMD_LOADSPLAT, strided_cm) {
  GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(1)
      .m(4).n(8).k(1)
      .cm_stride(11)
      .Test(xnn_f32_gemm_ukernel_4x8__wasmsimd_loadsplat);
}
2250*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
2251*4bdc9457SAndroid Build Coastguard Worker
2252*4bdc9457SAndroid Build Coastguard Worker
2253*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Single configuration for the 4x8s4 kernel: m = 4, n = 8, k = 4.
TEST(F32_GEMM_4X8S4__WASMSIMD, k_eq_4) {
  GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(8).k(4)
      .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
}
2265*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 4, n = 8, k = 4, with cn_stride set to 11.
TEST(F32_GEMM_4X8S4__WASMSIMD, strided_cn) {
  GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(8).k(4)
      .cn_stride(11)
      .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
}
2278*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 4, n = 8, k = 4, with a_stride set to 7.
TEST(F32_GEMM_4X8S4__WASMSIMD, k_eq_4_strided_a) {
  GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(8).k(4)
      .a_stride(7)
      .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
}
2291*4bdc9457SAndroid Build Coastguard Worker
// k fixed at 4; every (m, n) pair with m in [1, 4] and n in [1, 8] is run for
// one iteration.
TEST(F32_GEMM_4X8S4__WASMSIMD, k_eq_4_subtile) {
  for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
    for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(m_size).n(n_size).k(4)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
    }
  }
}
2308*4bdc9457SAndroid Build Coastguard Worker
// k fixed at 4 and n fixed at 8; m is swept over [1, 4], one iteration each.
TEST(F32_GEMM_4X8S4__WASMSIMD, k_eq_4_subtile_m) {
  for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(m_size).n(8).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
  }
}
2323*4bdc9457SAndroid Build Coastguard Worker
// k fixed at 4 and m fixed at 4; n is swept over [1, 8], one iteration each.
TEST(F32_GEMM_4X8S4__WASMSIMD, k_eq_4_subtile_n) {
  for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(n_size).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
  }
}
2338*4bdc9457SAndroid Build Coastguard Worker
// m = 4, n = 8; k is swept over 1..3.
TEST(F32_GEMM_4X8S4__WASMSIMD, k_lt_4) {
  for (size_t k_size = 1; k_size < 4; ++k_size) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(8).k(k_size)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
  }
}
2352*4bdc9457SAndroid Build Coastguard Worker
// m = 4, n = 8; k is swept over 1..3 with a_stride set to 7.
TEST(F32_GEMM_4X8S4__WASMSIMD, k_lt_4_strided_a) {
  for (size_t k_size = 1; k_size < 4; ++k_size) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(8).k(k_size)
        .a_stride(7)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
  }
}
2367*4bdc9457SAndroid Build Coastguard Worker
// k in 1..3, n in [1, 8], m in [1, 4]; each combination is run for one
// iteration.
TEST(F32_GEMM_4X8S4__WASMSIMD, k_lt_4_subtile) {
  for (size_t k_size = 1; k_size < 4; ++k_size) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(4)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
      }
    }
  }
}
2386*4bdc9457SAndroid Build Coastguard Worker
// m = 4, n = 8; k is swept over 5..7.
TEST(F32_GEMM_4X8S4__WASMSIMD, k_gt_4) {
  for (size_t k_size = 5; k_size < 8; ++k_size) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(8).k(k_size)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
  }
}
2400*4bdc9457SAndroid Build Coastguard Worker
// m = 4, n = 8; k is swept over 5..7 with a_stride set to 11.
TEST(F32_GEMM_4X8S4__WASMSIMD, k_gt_4_strided_a) {
  for (size_t k_size = 5; k_size < 8; ++k_size) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(8).k(k_size)
        .a_stride(11)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
  }
}
2415*4bdc9457SAndroid Build Coastguard Worker
// k in 5..7, n in [1, 8], m in [1, 4]; each combination is run for one
// iteration.
TEST(F32_GEMM_4X8S4__WASMSIMD, k_gt_4_subtile) {
  for (size_t k_size = 5; k_size < 8; ++k_size) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(4)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
      }
    }
  }
}
2434*4bdc9457SAndroid Build Coastguard Worker
// m = 4, n = 8; k steps from 8 to 40 in increments of 4.
TEST(F32_GEMM_4X8S4__WASMSIMD, k_div_4) {
  for (size_t k_size = 8; k_size <= 40; k_size += 4) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(8).k(k_size)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
  }
}
2448*4bdc9457SAndroid Build Coastguard Worker
// m = 4, n = 8; k steps from 8 to 40 in increments of 4, with a_stride set
// to 43.
TEST(F32_GEMM_4X8S4__WASMSIMD, k_div_4_strided_a) {
  for (size_t k_size = 8; k_size <= 40; k_size += 4) {
    GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(8).k(k_size)
        .a_stride(43)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
  }
}
2463*4bdc9457SAndroid Build Coastguard Worker
// k in {8, 12, ..., 40}, n in [1, 8], m in [1, 4]; each combination is run for
// one iteration.
TEST(F32_GEMM_4X8S4__WASMSIMD, k_div_4_subtile) {
  for (size_t k_size = 8; k_size <= 40; k_size += 4) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 4; ++m_size) {
        GemmMicrokernelTester()
            .mr(4).nr(8).kr(1).sr(4)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
      }
    }
  }
}
2482*4bdc9457SAndroid Build Coastguard Worker
// m = 4; n is swept over 9..15 and k over {1, 6, 11, 16}.
TEST(F32_GEMM_4X8S4__WASMSIMD, n_gt_8) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(4).n(n_size).k(k_size)
          .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
    }
  }
}
2498*4bdc9457SAndroid Build Coastguard Worker
// m = 4; n is swept over 9..15 and k over {1, 6, 11, 16}, with cn_stride set
// to 11.
TEST(F32_GEMM_4X8S4__WASMSIMD, n_gt_8_strided_cn) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(4).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
    }
  }
}
2515*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in 9..15 and k in {1, 6, 11, 16} with m = 4 and the tester's
// a_stride set to 23 (larger than the largest k used here).
TEST(F32_GEMM_4X8S4__WASMSIMD, n_gt_8_strided_a) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(n).k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
    }
  }
}
2532*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in 9..15, k in {1, 6, 11, 16} and every m in 1..4, with the
// tester's iterations set to 1 for each combination.
TEST(F32_GEMM_4X8S4__WASMSIMD, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(m).n(n).k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
      }
    }
  }
}
2551*4bdc9457SAndroid Build Coastguard Worker
// Runs the kernel with m = 4 for n in {16, 24} (multiples of nr = 8) and
// k in {1, 6, 11, 16}.
TEST(F32_GEMM_4X8S4__WASMSIMD, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(n).k(k)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
    }
  }
}
2567*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (n in {16, 24}, k in {1, 6, 11, 16}, m = 4), with the
// tester's cn_stride set to 11.
TEST(F32_GEMM_4X8S4__WASMSIMD, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(n).k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
    }
  }
}
2584*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in {16, 24} and k in {1, 6, 11, 16} with m = 4 and the tester's
// a_stride set to 23.
TEST(F32_GEMM_4X8S4__WASMSIMD, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(n).k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
    }
  }
}
2601*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in {16, 24}, k in {1, 6, 11, 16} and every m in 1..4, with the
// tester's iterations set to 1 for each combination.
TEST(F32_GEMM_4X8S4__WASMSIMD, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(m).n(n).k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
      }
    }
  }
}
2620*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k in {1, 6, 11, 16}, n in 1..8 and m in 1..4 with the tester's
// cm_stride set to 11 and iterations set to 1.
TEST(F32_GEMM_4X8S4__WASMSIMD, strided_cm_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(m).n(n).k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
      }
    }
  }
}
2640*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 4, n = 8, k = 4 with the tester's cm_stride set
// to 11.
TEST(F32_GEMM_4X8S4__WASMSIMD, strided_cm) {
  GemmMicrokernelTester()
    .mr(4).nr(8).kr(1).sr(4)
    .m(4).n(8).k(4)
    .cm_stride(11)
    .Test(xnn_f32_gemm_ukernel_4x8s4__wasmsimd);
}
2653*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
2654*4bdc9457SAndroid Build Coastguard Worker
2655*4bdc9457SAndroid Build Coastguard Worker
2656*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Single configuration: m = 5, n = 8, k = 1 for
// xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, k_eq_1) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(1)
    .m(5).n(8).k(1)
    .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
}
2668*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 5, n = 8, k = 1 with the tester's cn_stride set
// to 11.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(1)
    .m(5).n(8).k(1)
    .cn_stride(11)
    .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
}
2681*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 5, n = 8, k = 1 with the tester's a_stride set
// to 3.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, k_eq_1_strided_a) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(1)
    .m(5).n(8).k(1)
    .a_stride(3)
    .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
}
2694*4bdc9457SAndroid Build Coastguard Worker
// With k fixed at 1, sweeps every n in 1..8 and m in 1..5; the tester's
// iterations is set to 1 for each combination.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 5; m++) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(m).n(n).k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
    }
  }
}
2711*4bdc9457SAndroid Build Coastguard Worker
// With n = 8 and k = 1, sweeps m over 1..5; the tester's iterations is set
// to 1.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_m) {
  for (uint32_t m = 1; m <= 5; m++) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(m).n(8).k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
  }
}
2726*4bdc9457SAndroid Build Coastguard Worker
// With m = 5 and k = 1, sweeps n over 1..8; the tester's iterations is set
// to 1.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, k_eq_1_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(n).k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
  }
}
2741*4bdc9457SAndroid Build Coastguard Worker
// With m = 5 and n = 8, sweeps k over 2..9.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, k_gt_1) {
  for (size_t k = 2; k < 10; k++) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(k)
      .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
  }
}
2755*4bdc9457SAndroid Build Coastguard Worker
// With m = 5 and n = 8, sweeps k over 2..9 with the tester's a_stride set
// to 11 (larger than the largest k used here).
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, k_gt_1_strided_a) {
  for (size_t k = 2; k < 10; k++) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(k)
      .a_stride(11)
      .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
  }
}
2770*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k in 2..9, n in 1..8 and m in 1..5, with the tester's iterations
// set to 1 for each combination.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, k_gt_1_subtile) {
  for (size_t k = 2; k < 10; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 5; m++) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(m).n(n).k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
      }
    }
  }
}
2789*4bdc9457SAndroid Build Coastguard Worker
// Runs the kernel with m = 5 for every n in 9..15 and k in {1, 3, 5}.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(n).k(k)
        .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
    }
  }
}
2805*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (n in 9..15, k in {1, 3, 5}, m = 5), with the tester's
// cn_stride set to 11.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(n).k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
    }
  }
}
2822*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in 9..15 and k in {1, 3, 5} with m = 5 and the tester's a_stride
// set to 7 (larger than the largest k used here).
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, n_gt_8_strided_a) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(n).k(k)
        .a_stride(7)
        .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
    }
  }
}
2839*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in 9..15, k in {1, 3, 5} and every m in 1..5, with the tester's
// iterations set to 1 for each combination.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 5; m++) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(m).n(n).k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
      }
    }
  }
}
2858*4bdc9457SAndroid Build Coastguard Worker
// Runs the kernel with m = 5 for n in {16, 24} (multiples of nr = 8) and
// k in {1, 3, 5}.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(n).k(k)
        .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
    }
  }
}
2874*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (n in {16, 24}, k in {1, 3, 5}, m = 5), with the
// tester's cn_stride set to 11.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(n).k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
    }
  }
}
2891*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in {16, 24} and k in {1, 3, 5} with m = 5 and the tester's
// a_stride set to 7.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(n).k(k)
        .a_stride(7)
        .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
    }
  }
}
2908*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in {16, 24}, k in {1, 3, 5} and every m in 1..5, with the tester's
// iterations set to 1 for each combination.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 5; m++) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(m).n(n).k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
      }
    }
  }
}
2927*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k in {1, 3, 5}, n in 1..8 and m in 1..5 with the tester's cm_stride
// set to 11 and iterations set to 1.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, strided_cm_subtile) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 5; m++) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(m).n(n).k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
      }
    }
  }
}
2947*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 5, n = 8, k = 1 with the tester's cm_stride set
// to 11.
TEST(F32_GEMM_5X8__WASMSIMD_LOADSPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(1)
    .m(5).n(8).k(1)
    .cm_stride(11)
    .Test(xnn_f32_gemm_ukernel_5x8__wasmsimd_loadsplat);
}
2960*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
2961*4bdc9457SAndroid Build Coastguard Worker
2962*4bdc9457SAndroid Build Coastguard Worker
2963*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// Single configuration: m = 5, n = 8, k = 4 for
// xnn_f32_gemm_ukernel_5x8s4__wasmsimd.
TEST(F32_GEMM_5X8S4__WASMSIMD, k_eq_4) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(4)
    .m(5).n(8).k(4)
    .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
}
2975*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 5, n = 8, k = 4 with the tester's cn_stride set
// to 11.
TEST(F32_GEMM_5X8S4__WASMSIMD, strided_cn) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(4)
    .m(5).n(8).k(4)
    .cn_stride(11)
    .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
}
2988*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 5, n = 8, k = 4 with the tester's a_stride set
// to 7.
TEST(F32_GEMM_5X8S4__WASMSIMD, k_eq_4_strided_a) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(4)
    .m(5).n(8).k(4)
    .a_stride(7)
    .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
}
3001*4bdc9457SAndroid Build Coastguard Worker
// k_eq_4_subtile: k fixed at 4; sweeps every (n, m) pair with n in [1, 8] and
// m in [1, 5], with iterations set to 1 for each configuration.
TEST(F32_GEMM_5X8S4__WASMSIMD, k_eq_4_subtile) {
  for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
    for (uint32_t m_size = 1; m_size <= 5; ++m_size) {
      GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(4)
          .m(m_size).n(n_size).k(4)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
    }
  }
}
3018*4bdc9457SAndroid Build Coastguard Worker
// k_eq_4_subtile_m: n=8 and k=4 fixed; sweeps m over [1, 5] with iterations
// set to 1.
TEST(F32_GEMM_5X8S4__WASMSIMD, k_eq_4_subtile_m) {
  for (uint32_t m_size = 1; m_size <= 5; ++m_size) {
    GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(4)
        .m(m_size).n(8).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
  }
}
3033*4bdc9457SAndroid Build Coastguard Worker
// k_eq_4_subtile_n: m=5 and k=4 fixed; sweeps n over [1, 8] with iterations
// set to 1.
TEST(F32_GEMM_5X8S4__WASMSIMD, k_eq_4_subtile_n) {
  for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
    GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(4)
        .m(5).n(n_size).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
  }
}
3048*4bdc9457SAndroid Build Coastguard Worker
// k_lt_4: m=5, n=8; runs the kernel for every k in [1, 3].
TEST(F32_GEMM_5X8S4__WASMSIMD, k_lt_4) {
  for (size_t k_size = 1; k_size < 4; ++k_size) {
    GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(4)
        .m(5).n(8).k(k_size)
        .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
  }
}
3062*4bdc9457SAndroid Build Coastguard Worker
// k_lt_4_strided_a: m=5, n=8; every k in [1, 3] with a_stride set to 7.
TEST(F32_GEMM_5X8S4__WASMSIMD, k_lt_4_strided_a) {
  for (size_t k_size = 1; k_size < 4; ++k_size) {
    GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(4)
        .m(5).n(8).k(k_size)
        .a_stride(7)
        .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
  }
}
3077*4bdc9457SAndroid Build Coastguard Worker
// k_lt_4_subtile: sweeps k over [1, 3], n over [1, 8] and m over [1, 5], with
// iterations set to 1 for each configuration.
TEST(F32_GEMM_5X8S4__WASMSIMD, k_lt_4_subtile) {
  for (size_t k_size = 1; k_size < 4; ++k_size) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 5; ++m_size) {
        GemmMicrokernelTester()
            .mr(5).nr(8).kr(1).sr(4)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
      }
    }
  }
}
3096*4bdc9457SAndroid Build Coastguard Worker
// k_gt_4: m=5, n=8; runs the kernel for every k in [5, 7].
TEST(F32_GEMM_5X8S4__WASMSIMD, k_gt_4) {
  for (size_t k_size = 5; k_size < 8; ++k_size) {
    GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(4)
        .m(5).n(8).k(k_size)
        .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
  }
}
3110*4bdc9457SAndroid Build Coastguard Worker
// k_gt_4_strided_a: m=5, n=8; every k in [5, 7] with a_stride set to 11.
TEST(F32_GEMM_5X8S4__WASMSIMD, k_gt_4_strided_a) {
  for (size_t k_size = 5; k_size < 8; ++k_size) {
    GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(4)
        .m(5).n(8).k(k_size)
        .a_stride(11)
        .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
  }
}
3125*4bdc9457SAndroid Build Coastguard Worker
// k_gt_4_subtile: sweeps k over [5, 7], n over [1, 8] and m over [1, 5], with
// iterations set to 1 for each configuration.
TEST(F32_GEMM_5X8S4__WASMSIMD, k_gt_4_subtile) {
  for (size_t k_size = 5; k_size < 8; ++k_size) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 5; ++m_size) {
        GemmMicrokernelTester()
            .mr(5).nr(8).kr(1).sr(4)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
      }
    }
  }
}
3144*4bdc9457SAndroid Build Coastguard Worker
// k_div_4: m=5, n=8; runs the kernel for k = 8, 12, ..., 40 (multiples of 4).
TEST(F32_GEMM_5X8S4__WASMSIMD, k_div_4) {
  for (size_t k_size = 8; k_size <= 40; k_size += 4) {
    GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(4)
        .m(5).n(8).k(k_size)
        .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
  }
}
3158*4bdc9457SAndroid Build Coastguard Worker
// k_div_4_strided_a: m=5, n=8; k = 8, 12, ..., 40 with a_stride set to 43
// (greater than the largest k tested).
TEST(F32_GEMM_5X8S4__WASMSIMD, k_div_4_strided_a) {
  for (size_t k_size = 8; k_size <= 40; k_size += 4) {
    GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(4)
        .m(5).n(8).k(k_size)
        .a_stride(43)
        .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
  }
}
3173*4bdc9457SAndroid Build Coastguard Worker
// k_div_4_subtile: sweeps k = 8, 12, ..., 40, n over [1, 8] and m over [1, 5],
// with iterations set to 1 for each configuration.
TEST(F32_GEMM_5X8S4__WASMSIMD, k_div_4_subtile) {
  for (size_t k_size = 8; k_size <= 40; k_size += 4) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 5; ++m_size) {
        GemmMicrokernelTester()
            .mr(5).nr(8).kr(1).sr(4)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
      }
    }
  }
}
3192*4bdc9457SAndroid Build Coastguard Worker
// n_gt_8: m=5; sweeps n over [9, 15] and k over 1, 6, 11, 16.
TEST(F32_GEMM_5X8S4__WASMSIMD, n_gt_8) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(4)
          .m(5).n(n_size).k(k_size)
          .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
    }
  }
}
3208*4bdc9457SAndroid Build Coastguard Worker
// n_gt_8_strided_cn: m=5; n over [9, 15], k over 1, 6, 11, 16, with cn_stride
// set to 11.
TEST(F32_GEMM_5X8S4__WASMSIMD, n_gt_8_strided_cn) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(4)
          .m(5).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
    }
  }
}
3225*4bdc9457SAndroid Build Coastguard Worker
// n_gt_8_strided_a: m=5; n over [9, 15], k over 1, 6, 11, 16, with a_stride
// set to 23.
TEST(F32_GEMM_5X8S4__WASMSIMD, n_gt_8_strided_a) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(4)
          .m(5).n(n_size).k(k_size)
          .a_stride(23)
          .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
    }
  }
}
3242*4bdc9457SAndroid Build Coastguard Worker
// n_gt_8_subtile: n over [9, 15], k over 1, 6, 11, 16 and m over [1, 5], with
// iterations set to 1 for each configuration.
TEST(F32_GEMM_5X8S4__WASMSIMD, n_gt_8_subtile) {
  for (uint32_t n_size = 9; n_size < 16; ++n_size) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      for (uint32_t m_size = 1; m_size <= 5; ++m_size) {
        GemmMicrokernelTester()
            .mr(5).nr(8).kr(1).sr(4)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
      }
    }
  }
}
3261*4bdc9457SAndroid Build Coastguard Worker
// n_div_8: m=5; n takes the values 16 and 24, k takes 1, 6, 11, 16.
TEST(F32_GEMM_5X8S4__WASMSIMD, n_div_8) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(4)
          .m(5).n(n_size).k(k_size)
          .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
    }
  }
}
3277*4bdc9457SAndroid Build Coastguard Worker
// n_div_8_strided_cn: m=5; n in {16, 24}, k in {1, 6, 11, 16}, with cn_stride
// set to 11.
TEST(F32_GEMM_5X8S4__WASMSIMD, n_div_8_strided_cn) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(4)
          .m(5).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
    }
  }
}
3294*4bdc9457SAndroid Build Coastguard Worker
// n_div_8_strided_a: m=5; n in {16, 24}, k in {1, 6, 11, 16}, with a_stride
// set to 23.
TEST(F32_GEMM_5X8S4__WASMSIMD, n_div_8_strided_a) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(4)
          .m(5).n(n_size).k(k_size)
          .a_stride(23)
          .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
    }
  }
}
3311*4bdc9457SAndroid Build Coastguard Worker
// n_div_8_subtile: n in {16, 24}, k in {1, 6, 11, 16} and m over [1, 5], with
// iterations set to 1 for each configuration.
TEST(F32_GEMM_5X8S4__WASMSIMD, n_div_8_subtile) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 20; k_size += 5) {
      for (uint32_t m_size = 1; m_size <= 5; ++m_size) {
        GemmMicrokernelTester()
            .mr(5).nr(8).kr(1).sr(4)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
      }
    }
  }
}
3330*4bdc9457SAndroid Build Coastguard Worker
// strided_cm_subtile: k in {1, 6, 11, 16}, n over [1, 8] and m over [1, 5],
// with cm_stride set to 11 and iterations set to 1 for each configuration.
TEST(F32_GEMM_5X8S4__WASMSIMD, strided_cm_subtile) {
  for (size_t k_size = 1; k_size <= 20; k_size += 5) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 5; ++m_size) {
        GemmMicrokernelTester()
            .mr(5).nr(8).kr(1).sr(4)
            .m(m_size).n(n_size).k(k_size)
            .cm_stride(11)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
      }
    }
  }
}
3350*4bdc9457SAndroid Build Coastguard Worker
// strided_cm: m=5, n=8, k=4 with cm_stride set to 11 (greater than nr=8).
TEST(F32_GEMM_5X8S4__WASMSIMD, strided_cm) {
  GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(4)
      .m(5).n(8).k(4)
      .cm_stride(11)
      .Test(xnn_f32_gemm_ukernel_5x8s4__wasmsimd);
}
3363*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
3364*4bdc9457SAndroid Build Coastguard Worker
3365*4bdc9457SAndroid Build Coastguard Worker
3366*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
// k_eq_4: runs xnn_f32_gemm_ukernel_6x8__wasmsimd_splat once with m=6, n=8,
// k=4 (m and n equal to the configured mr and nr).
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, k_eq_4) {
  GemmMicrokernelTester()
      .mr(6).nr(8).kr(1).sr(1)
      .m(6).n(8).k(4)
      .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
}
3378*4bdc9457SAndroid Build Coastguard Worker
// strided_cn: m=6, n=8, k=4 with cn_stride set to 11 (greater than nr=8).
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, strided_cn) {
  GemmMicrokernelTester()
      .mr(6).nr(8).kr(1).sr(1)
      .m(6).n(8).k(4)
      .cn_stride(11)
      .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
}
3391*4bdc9457SAndroid Build Coastguard Worker
// k_eq_4_strided_a: m=6, n=8, k=4 with a_stride set to 7 (greater than k).
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, k_eq_4_strided_a) {
  GemmMicrokernelTester()
      .mr(6).nr(8).kr(1).sr(1)
      .m(6).n(8).k(4)
      .a_stride(7)
      .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
}
3404*4bdc9457SAndroid Build Coastguard Worker
// k_eq_4_subtile: k fixed at 4; sweeps every (n, m) pair with n in [1, 8] and
// m in [1, 6], with iterations set to 1 for each configuration.
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, k_eq_4_subtile) {
  for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
    for (uint32_t m_size = 1; m_size <= 6; ++m_size) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(m_size).n(n_size).k(4)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
    }
  }
}
3421*4bdc9457SAndroid Build Coastguard Worker
// k_eq_4_subtile_m: n=8 and k=4 fixed; sweeps m over [1, 6] with iterations
// set to 1.
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, k_eq_4_subtile_m) {
  for (uint32_t m_size = 1; m_size <= 6; ++m_size) {
    GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(m_size).n(8).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
  }
}
3436*4bdc9457SAndroid Build Coastguard Worker
// k_eq_4_subtile_n: m=6 and k=4 fixed; sweeps n over [1, 8] with iterations
// set to 1.
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, k_eq_4_subtile_n) {
  for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
    GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(6).n(n_size).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
  }
}
3451*4bdc9457SAndroid Build Coastguard Worker
// k_lt_4: m=6, n=8; runs the kernel for every k in [1, 3].
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, k_lt_4) {
  for (size_t k_size = 1; k_size < 4; ++k_size) {
    GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(6).n(8).k(k_size)
        .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
  }
}
3465*4bdc9457SAndroid Build Coastguard Worker
// k_lt_4_strided_a: m=6, n=8; every k in [1, 3] with a_stride set to 7.
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, k_lt_4_strided_a) {
  for (size_t k_size = 1; k_size < 4; ++k_size) {
    GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(6).n(8).k(k_size)
        .a_stride(7)
        .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
  }
}
3480*4bdc9457SAndroid Build Coastguard Worker
// k_lt_4_subtile: sweeps k over [1, 3], n over [1, 8] and m over [1, 6], with
// iterations set to 1 for each configuration.
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, k_lt_4_subtile) {
  for (size_t k_size = 1; k_size < 4; ++k_size) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 6; ++m_size) {
        GemmMicrokernelTester()
            .mr(6).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
      }
    }
  }
}
3499*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, k_gt_4) {
  // Full 6x8 problem for every k in [5, 7].
  for (size_t depth = 5; depth < 8; ++depth) {
    GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(6).n(8).k(depth)
        .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
  }
}
3513*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, k_gt_4_strided_a) {
  // Full 6x8 problem for every k in [5, 7], with a_stride set to 11.
  for (size_t depth = 5; depth < 8; ++depth) {
    GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(6).n(8).k(depth)
        .a_stride(11)
        .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
  }
}
3528*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, k_gt_4_subtile) {
  // For each k in [5, 7], sweeps n over [1, 8] and m over [1, 6];
  // iterations is set to 1 for every configuration.
  for (size_t depth = 5; depth < 8; ++depth) {
    for (uint32_t cols = 1; cols <= 8; ++cols) {
      for (uint32_t rows = 1; rows <= 6; ++rows) {
        GemmMicrokernelTester()
            .mr(6).nr(8).kr(1).sr(1)
            .m(rows).n(cols).k(depth)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
      }
    }
  }
}
3547*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, k_div_4) {
  // Full 6x8 problem for k = 8, 12, ..., 40 (multiples of 4).
  for (size_t depth = 8; depth <= 40; depth += 4) {
    GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(6).n(8).k(depth)
        .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
  }
}
3561*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, k_div_4_strided_a) {
  // Full 6x8 problem for k = 8, 12, ..., 40, with a_stride set to 43.
  for (size_t depth = 8; depth <= 40; depth += 4) {
    GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(6).n(8).k(depth)
        .a_stride(43)
        .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
  }
}
3576*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, k_div_4_subtile) {
  // For k = 8, 12, ..., 40, sweeps n over [1, 8] and m over [1, 6];
  // iterations is set to 1 for every configuration.
  for (size_t depth = 8; depth <= 40; depth += 4) {
    for (uint32_t cols = 1; cols <= 8; ++cols) {
      for (uint32_t rows = 1; rows <= 6; ++rows) {
        GemmMicrokernelTester()
            .mr(6).nr(8).kr(1).sr(1)
            .m(rows).n(cols).k(depth)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
      }
    }
  }
}
3595*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, n_gt_8) {
  // m fixed at 6; n runs over [9, 15] and k over {1, 6, 11, 16}.
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(cols).k(depth)
          .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
    }
  }
}
3611*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, n_gt_8_strided_cn) {
  // m fixed at 6; n runs over [9, 15] and k over {1, 6, 11, 16},
  // with cn_stride set to 11.
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(cols).k(depth)
          .cn_stride(11)
          .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
    }
  }
}
3628*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, n_gt_8_strided_a) {
  // m fixed at 6; n runs over [9, 15] and k over {1, 6, 11, 16},
  // with a_stride set to 23.
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(cols).k(depth)
          .a_stride(23)
          .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
    }
  }
}
3645*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, n_gt_8_subtile) {
  // n runs over [9, 15], k over {1, 6, 11, 16} and m over [1, 6];
  // iterations is set to 1 for every configuration.
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      for (uint32_t rows = 1; rows <= 6; ++rows) {
        GemmMicrokernelTester()
            .mr(6).nr(8).kr(1).sr(1)
            .m(rows).n(cols).k(depth)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
      }
    }
  }
}
3664*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, n_div_8) {
  // m fixed at 6; n takes the values 16 and 24, k runs over {1, 6, 11, 16}.
  for (uint32_t cols = 16; cols <= 24; cols += 8) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(cols).k(depth)
          .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
    }
  }
}
3680*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, n_div_8_strided_cn) {
  // m fixed at 6; n takes the values 16 and 24, k runs over {1, 6, 11, 16},
  // with cn_stride set to 11.
  for (uint32_t cols = 16; cols <= 24; cols += 8) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(cols).k(depth)
          .cn_stride(11)
          .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
    }
  }
}
3697*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, n_div_8_strided_a) {
  // m fixed at 6; n takes the values 16 and 24, k runs over {1, 6, 11, 16},
  // with a_stride set to 23.
  for (uint32_t cols = 16; cols <= 24; cols += 8) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(cols).k(depth)
          .a_stride(23)
          .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
    }
  }
}
3714*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, n_div_8_subtile) {
  // n takes the values 16 and 24, k runs over {1, 6, 11, 16} and m over
  // [1, 6]; iterations is set to 1 for every configuration.
  for (uint32_t cols = 16; cols <= 24; cols += 8) {
    for (size_t depth = 1; depth <= 20; depth += 5) {
      for (uint32_t rows = 1; rows <= 6; ++rows) {
        GemmMicrokernelTester()
            .mr(6).nr(8).kr(1).sr(1)
            .m(rows).n(cols).k(depth)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
      }
    }
  }
}
3733*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, strided_cm_subtile) {
  // k runs over {1, 6, 11, 16}, n over [1, 8] and m over [1, 6];
  // cm_stride is 11 and iterations is 1 for every configuration.
  for (size_t depth = 1; depth <= 20; depth += 5) {
    for (uint32_t cols = 1; cols <= 8; ++cols) {
      for (uint32_t rows = 1; rows <= 6; ++rows) {
        GemmMicrokernelTester()
            .mr(6).nr(8).kr(1).sr(1)
            .m(rows).n(cols).k(depth)
            .cm_stride(11)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
      }
    }
  }
}
3753*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_6X8__WASMSIMD_SPLAT, strided_cm) {
  // Single configuration: m = 6, n = 8, k = 4, with cm_stride set to 11.
  GemmMicrokernelTester()
      .mr(6).nr(8).kr(1).sr(1)
      .m(6).n(8).k(4)
      .cm_stride(11)
      .Test(xnn_f32_gemm_ukernel_6x8__wasmsimd_splat);
}
3766*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD
3767*4bdc9457SAndroid Build Coastguard Worker
3768*4bdc9457SAndroid Build Coastguard Worker
3769*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1) {
  // Single configuration: m = 1, n = 8, k = 1.
  GemmMicrokernelTester()
      .mr(1).nr(8).kr(1).sr(1)
      .m(1).n(8).k(1)
      .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
}
3781*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cn) {
  // Single configuration: m = 1, n = 8, k = 1, with cn_stride set to 11.
  GemmMicrokernelTester()
      .mr(1).nr(8).kr(1).sr(1)
      .m(1).n(8).k(1)
      .cn_stride(11)
      .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
}
3794*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_strided_a) {
  // Single configuration: m = 1, n = 8, k = 1, with a_stride set to 3.
  GemmMicrokernelTester()
      .mr(1).nr(8).kr(1).sr(1)
      .m(1).n(8).k(1)
      .a_stride(3)
      .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
}
3807*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile) {
  // k fixed at 1; n runs over [1, 8] and m over [1, 1];
  // iterations is set to 1 for every configuration.
  for (uint32_t cols = 1; cols <= 8; ++cols) {
    for (uint32_t rows = 1; rows <= 1; ++rows) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(rows).n(cols).k(1)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
3824*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_m) {
  // n fixed at 8 and k at 1; m runs over [1, 1]; iterations is set to 1.
  for (uint32_t rows = 1; rows <= 1; ++rows) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(1)
        .m(rows).n(8).k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
3839*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_n) {
  // m fixed at 1 and k at 1; n runs over [1, 8]; iterations is set to 1.
  for (uint32_t cols = 1; cols <= 8; ++cols) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(1)
        .m(1).n(cols).k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
3854*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1) {
  // Full 1x8 problem for every k in [2, 9].
  for (size_t depth = 2; depth < 10; ++depth) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(1)
        .m(1).n(8).k(depth)
        .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
3868*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_strided_a) {
  // Full 1x8 problem for every k in [2, 9], with a_stride set to 11.
  for (size_t depth = 2; depth < 10; ++depth) {
    GemmMicrokernelTester()
        .mr(1).nr(8).kr(1).sr(1)
        .m(1).n(8).k(depth)
        .a_stride(11)
        .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
3883*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_subtile) {
  // For each k in [2, 9], sweeps n over [1, 8] and m over [1, 1];
  // iterations is set to 1 for every configuration.
  for (size_t depth = 2; depth < 10; ++depth) {
    for (uint32_t cols = 1; cols <= 8; ++cols) {
      for (uint32_t rows = 1; rows <= 1; ++rows) {
        GemmMicrokernelTester()
            .mr(1).nr(8).kr(1).sr(1)
            .m(rows).n(cols).k(depth)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
3902*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8) {
  // m fixed at 1; n runs over [9, 15] and k over {1, 3, 5}.
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 5; depth += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(1).n(cols).k(depth)
          .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
3918*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_cn) {
  // m fixed at 1; n runs over [9, 15] and k over {1, 3, 5},
  // with cn_stride set to 11.
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 5; depth += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(1).n(cols).k(depth)
          .cn_stride(11)
          .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
3935*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_a) {
  // m fixed at 1; n runs over [9, 15] and k over {1, 3, 5},
  // with a_stride set to 7.
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 5; depth += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(1).n(cols).k(depth)
          .a_stride(7)
          .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
3952*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_subtile) {
  // n runs over [9, 15], k over {1, 3, 5} and m over [1, 1];
  // iterations is set to 1 for every configuration.
  for (uint32_t cols = 9; cols < 16; ++cols) {
    for (size_t depth = 1; depth <= 5; depth += 2) {
      for (uint32_t rows = 1; rows <= 1; ++rows) {
        GemmMicrokernelTester()
            .mr(1).nr(8).kr(1).sr(1)
            .m(rows).n(cols).k(depth)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
3971*4bdc9457SAndroid Build Coastguard Worker
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8) {
  // m fixed at 1; n takes the values 16 and 24, k runs over {1, 3, 5}.
  for (uint32_t cols = 16; cols <= 24; cols += 8) {
    for (size_t depth = 1; depth <= 5; depth += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(1).n(cols).k(depth)
          .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
3987*4bdc9457SAndroid Build Coastguard Worker
// Runs the 1x8 kernel with m = 1 and cn_stride(11) for n in {16, 24} and
// k in {1, 3, 5}.
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_cn) {
  for (uint32_t cur_n = 16; cur_n < 32; cur_n += 8) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(1).n(cur_n).k(cur_k)
          .cn_stride(11)
          .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4004*4bdc9457SAndroid Build Coastguard Worker
// Runs the 1x8 kernel with m = 1 and a_stride(7) for n in {16, 24} and
// k in {1, 3, 5}.
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_a) {
  for (uint32_t cur_n = 16; cur_n < 32; cur_n += 8) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(1).n(cur_n).k(cur_k)
          .a_stride(7)
          .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4021*4bdc9457SAndroid Build Coastguard Worker
// Runs the 1x8 kernel for n in {16, 24} and k in {1, 3, 5}. The m sweep has a
// single value (1); every configuration is run with iterations(1).
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_subtile) {
  const uint32_t cur_m = 1;  // the m range 1..1 contains exactly one value
  for (uint32_t cur_n = 16; cur_n < 32; cur_n += 8) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(cur_m).n(cur_n).k(cur_k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4040*4bdc9457SAndroid Build Coastguard Worker
// Runs the 1x8 kernel with cm_stride(11) for k in {1, 3, 5} (outer loop) and
// n in [1, 8] (inner loop). The m sweep has a single value (1); every
// configuration is run with iterations(1).
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm_subtile) {
  const uint32_t cur_m = 1;  // the m range 1..1 contains exactly one value
  for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
    for (uint32_t cur_n = 1; cur_n < 9; ++cur_n) {
      GemmMicrokernelTester()
          .mr(1).nr(8).kr(1).sr(1)
          .m(cur_m).n(cur_n).k(cur_k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4060*4bdc9457SAndroid Build Coastguard Worker
// Single run of the 1x8 kernel: m = 1, n = 8, k = 1, with cm_stride(11).
TEST(F32_GEMM_1X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm) {
  GemmMicrokernelTester()
      .mr(1).nr(8).kr(1).sr(1)
      .m(1).n(8).k(1)
      .cm_stride(11)
      .Test(xnn_f32_gemm_ukernel_1x8__wasmrelaxedsimd_fma_loadsplat);
}
4073*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
4074*4bdc9457SAndroid Build Coastguard Worker
4075*4bdc9457SAndroid Build Coastguard Worker
4076*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// Single run of the 3x8 kernel: m = 3, n = 8, k = 1.
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1) {
  GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(1)
      .m(3).n(8).k(1)
      .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
}
4088*4bdc9457SAndroid Build Coastguard Worker
// Single run of the 3x8 kernel: m = 3, n = 8, k = 1, with cn_stride(11).
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cn) {
  GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(1)
      .m(3).n(8).k(1)
      .cn_stride(11)
      .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
}
4101*4bdc9457SAndroid Build Coastguard Worker
// Single run of the 3x8 kernel: m = 3, n = 8, k = 1, with a_stride(3).
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_strided_a) {
  GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(1)
      .m(3).n(8).k(1)
      .a_stride(3)
      .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
}
4114*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 kernel with k = 1 for every (n, m) pair with n in [1, 8]
// (outer loop) and m in [1, 3] (inner loop), each with iterations(1).
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile) {
  for (uint32_t cur_n = 1; cur_n < 9; ++cur_n) {
    for (uint32_t cur_m = 1; cur_m < 4; ++cur_m) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(cur_m).n(cur_n).k(1)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4131*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 kernel with n = 8 and k = 1 for m in [1, 3], each with
// iterations(1).
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_m) {
  for (uint32_t cur_m = 1; cur_m < 4; ++cur_m) {
    GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(cur_m).n(8).k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
4146*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 kernel with m = 3 and k = 1 for n in [1, 8], each with
// iterations(1).
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_n) {
  for (uint32_t cur_n = 1; cur_n < 9; ++cur_n) {
    GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(cur_n).k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
4161*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 kernel with m = 3 and n = 8 for k in [2, 9].
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1) {
  for (size_t cur_k = 2; cur_k <= 9; ++cur_k) {
    GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(8).k(cur_k)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
4175*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 kernel with m = 3, n = 8 and a_stride(11) for k in [2, 9].
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_strided_a) {
  for (size_t cur_k = 2; cur_k <= 9; ++cur_k) {
    GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(1)
        .m(3).n(8).k(cur_k)
        .a_stride(11)
        .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
4190*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 kernel for k in [2, 9] (outermost), n in [1, 8] and m in
// [1, 3] (innermost), each configuration with iterations(1).
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_subtile) {
  for (size_t cur_k = 2; cur_k <= 9; ++cur_k) {
    for (uint32_t cur_n = 1; cur_n < 9; ++cur_n) {
      for (uint32_t cur_m = 1; cur_m < 4; ++cur_m) {
        GemmMicrokernelTester()
            .mr(3).nr(8).kr(1).sr(1)
            .m(cur_m).n(cur_n).k(cur_k)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
4209*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 kernel with m = 3 for n in [9, 15] and k in {1, 3, 5}.
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8) {
  for (uint32_t cur_n = 9; cur_n <= 15; ++cur_n) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(3).n(cur_n).k(cur_k)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4225*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 kernel with m = 3 and cn_stride(11) for n in [9, 15] and
// k in {1, 3, 5}.
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_cn) {
  for (uint32_t cur_n = 9; cur_n <= 15; ++cur_n) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(3).n(cur_n).k(cur_k)
          .cn_stride(11)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4242*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 kernel with m = 3 and a_stride(7) for n in [9, 15] and
// k in {1, 3, 5}.
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_a) {
  for (uint32_t cur_n = 9; cur_n <= 15; ++cur_n) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(3).n(cur_n).k(cur_k)
          .a_stride(7)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4259*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 kernel for n in [9, 15] (outermost), k in {1, 3, 5} and m in
// [1, 3] (innermost), each configuration with iterations(1).
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_subtile) {
  for (uint32_t cur_n = 9; cur_n <= 15; ++cur_n) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      for (uint32_t cur_m = 1; cur_m < 4; ++cur_m) {
        GemmMicrokernelTester()
            .mr(3).nr(8).kr(1).sr(1)
            .m(cur_m).n(cur_n).k(cur_k)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
4278*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 kernel with m = 3 for n in {16, 24} and k in {1, 3, 5}.
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8) {
  for (uint32_t cur_n = 16; cur_n < 32; cur_n += 8) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(3).n(cur_n).k(cur_k)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4294*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 kernel with m = 3 and cn_stride(11) for n in {16, 24} and
// k in {1, 3, 5}.
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_cn) {
  for (uint32_t cur_n = 16; cur_n < 32; cur_n += 8) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(3).n(cur_n).k(cur_k)
          .cn_stride(11)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4311*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 kernel with m = 3 and a_stride(7) for n in {16, 24} and
// k in {1, 3, 5}.
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_a) {
  for (uint32_t cur_n = 16; cur_n < 32; cur_n += 8) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(1)
          .m(3).n(cur_n).k(cur_k)
          .a_stride(7)
          .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4328*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 kernel for n in {16, 24} (outermost), k in {1, 3, 5} and m in
// [1, 3] (innermost), each configuration with iterations(1).
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_subtile) {
  for (uint32_t cur_n = 16; cur_n < 32; cur_n += 8) {
    for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
      for (uint32_t cur_m = 1; cur_m < 4; ++cur_m) {
        GemmMicrokernelTester()
            .mr(3).nr(8).kr(1).sr(1)
            .m(cur_m).n(cur_n).k(cur_k)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
4347*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8 kernel with cm_stride(11) for k in {1, 3, 5} (outermost),
// n in [1, 8] and m in [1, 3] (innermost), each with iterations(1).
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm_subtile) {
  for (size_t cur_k = 1; cur_k < 6; cur_k += 2) {
    for (uint32_t cur_n = 1; cur_n < 9; ++cur_n) {
      for (uint32_t cur_m = 1; cur_m < 4; ++cur_m) {
        GemmMicrokernelTester()
            .mr(3).nr(8).kr(1).sr(1)
            .m(cur_m).n(cur_n).k(cur_k)
            .cm_stride(11)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
4367*4bdc9457SAndroid Build Coastguard Worker
// Single run of the 3x8 kernel: m = 3, n = 8, k = 1, with cm_stride(11).
TEST(F32_GEMM_3X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm) {
  GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(1)
      .m(3).n(8).k(1)
      .cm_stride(11)
      .Test(xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_loadsplat);
}
4380*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
4381*4bdc9457SAndroid Build Coastguard Worker
4382*4bdc9457SAndroid Build Coastguard Worker
4383*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// Single run of the 3x8s4 kernel (sr = 4): m = 3, n = 8, k = 4.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, k_eq_4) {
  GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(4)
      .m(3).n(8).k(4)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
}
4395*4bdc9457SAndroid Build Coastguard Worker
// Single run of the 3x8s4 kernel (sr = 4): m = 3, n = 8, k = 4, with
// cn_stride(11).
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, strided_cn) {
  GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(4)
      .m(3).n(8).k(4)
      .cn_stride(11)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
}
4408*4bdc9457SAndroid Build Coastguard Worker
// Single run of the 3x8s4 kernel (sr = 4): m = 3, n = 8, k = 4, with
// a_stride(7).
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_strided_a) {
  GemmMicrokernelTester()
      .mr(3).nr(8).kr(1).sr(4)
      .m(3).n(8).k(4)
      .a_stride(7)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
}
4421*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8s4 kernel with k = 4 for every (n, m) pair with n in [1, 8]
// (outer loop) and m in [1, 3] (inner loop), each with iterations(1).
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile) {
  for (uint32_t cur_n = 1; cur_n < 9; ++cur_n) {
    for (uint32_t cur_m = 1; cur_m < 4; ++cur_m) {
      GemmMicrokernelTester()
          .mr(3).nr(8).kr(1).sr(4)
          .m(cur_m).n(cur_n).k(4)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4438*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8s4 kernel with n = 8 and k = 4 for m in [1, 3], each with
// iterations(1).
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_m) {
  for (uint32_t cur_m = 1; cur_m < 4; ++cur_m) {
    GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(4)
        .m(cur_m).n(8).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
4453*4bdc9457SAndroid Build Coastguard Worker
// Runs the 3x8s4 kernel with m = 3 and k = 4 for n in [1, 8], each with
// iterations(1).
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_n) {
  for (uint32_t cur_n = 1; cur_n < 9; ++cur_n) {
    GemmMicrokernelTester()
        .mr(3).nr(8).kr(1).sr(4)
        .m(3).n(cur_n).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
4468*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma on the full 3x8 tile
// (m = 3, n = 8) for every k below 4, i.e. k = 1, 2, 3.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, k_lt_4) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
4482*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as k_lt_4 (m = 3, n = 8, k = 1..3) but with a_stride set to 7,
// which is larger than every k exercised here.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_strided_a) {
  for (size_t k = 1; k < 4; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .a_stride(7)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
4497*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma over the full cross
// product k = 1..3, n = 1..8, m = 1..3; one tester iteration per configuration.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_subtile) {
  for (size_t k = 1; k < 4; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4516*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma on the full 3x8 tile
// (m = 3, n = 8) for k = 5, 6, 7.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, k_gt_4) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
4530*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as k_gt_4 (m = 3, n = 8, k = 5..7) but with a_stride set to 11,
// which is larger than every k exercised here.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_strided_a) {
  for (size_t k = 5; k < 8; k++) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .a_stride(11)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
4545*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma over the full cross
// product k = 5..7, n = 1..8, m = 1..3; one tester iteration per configuration.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_subtile) {
  for (size_t k = 5; k < 8; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4564*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma on the full 3x8 tile
// (m = 3, n = 8) for k = 8, 12, ..., 40 (multiples of 4).
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, k_div_4) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
4578*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as k_div_4 (m = 3, n = 8, k = 8..40 step 4) but with a_stride set
// to 43, which is larger than every k exercised here.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, k_div_4_strided_a) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(3)
      .nr(8)
      .kr(1)
      .sr(4)
      .m(3)
      .n(8)
      .k(k)
      .a_stride(43)
      .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
  }
}
4593*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma over the full cross
// product k = 8..40 step 4, n = 1..8, m = 1..3; one tester iteration per
// configuration.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, k_div_4_subtile) {
  for (size_t k = 8; k <= 40; k += 4) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4612*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma with m = 3 for
// n = 9..15 (above nr = 8) combined with k = 1, 6, 11, 16.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4628*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (m = 3, n = 9..15, k = 1, 6, 11, 16) but with cn_stride
// set to 11, which is larger than nr = 8.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4645*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (m = 3, n = 9..15, k = 1, 6, 11, 16) but with a_stride
// set to 23, which is larger than every k exercised here.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_a) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4662*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma over the cross product
// n = 9..15, k = 1, 6, 11, 16, m = 1..3; one tester iteration per
// configuration.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_subtile) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4681*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma with m = 3 for
// n = 16 and n = 24 (multiples of nr = 8) combined with k = 1, 6, 11, 16.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4697*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (m = 3, n = 16 and 24, k = 1, 6, 11, 16) but with
// cn_stride set to 11, which is larger than nr = 8.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4714*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_div_8 (m = 3, n = 16 and 24, k = 1, 6, 11, 16) but with
// a_stride set to 23, which is larger than every k exercised here.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(3)
        .nr(8)
        .kr(1)
        .sr(4)
        .m(3)
        .n(n)
        .k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
    }
  }
}
4731*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma over the cross product
// n = 16 and 24, k = 1, 6, 11, 16, m = 1..3; one tester iteration per
// configuration.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4750*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma with cm_stride set to
// 11 (larger than every n exercised) over the cross product k = 1, 6, 11, 16,
// n = 1..8, m = 1..3; one tester iteration per configuration.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, strided_cm_subtile) {
  for (size_t k = 1; k <= 20; k += 5) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 3; m++) {
        GemmMicrokernelTester()
          .mr(3)
          .nr(8)
          .kr(1)
          .sr(4)
          .m(m)
          .n(n)
          .k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
4770*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma once on the full tile
// (m = 3, n = 8, k = 4) with cm_stride set to 11, which is larger than n.
TEST(F32_GEMM_3X8S4__WASMRELAXEDSIMD_FMA, strided_cm) {
  GemmMicrokernelTester()
    .mr(3)
    .nr(8)
    .kr(1)
    .sr(4)
    .m(3)
    .n(8)
    .k(4)
    .cm_stride(11)
    .Test(xnn_f32_gemm_ukernel_3x8s4__wasmrelaxedsimd_fma);
}
4783*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
4784*4bdc9457SAndroid Build Coastguard Worker
4785*4bdc9457SAndroid Build Coastguard Worker
4786*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// Runs xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat once on the
// full tile (m = 4, n = 8) with k = 1.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(4)
    .n(8)
    .k(1)
    .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
}
4798*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat once on the
// full tile (m = 4, n = 8, k = 1) with cn_stride set to 11, which is larger
// than nr = 8.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(4)
    .n(8)
    .k(1)
    .cn_stride(11)
    .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
}
4811*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat once on the
// full tile (m = 4, n = 8, k = 1) with a_stride set to 3, which is larger
// than k.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_strided_a) {
  GemmMicrokernelTester()
    .mr(4)
    .nr(8)
    .kr(1)
    .sr(1)
    .m(4)
    .n(8)
    .k(1)
    .a_stride(3)
    .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
}
4824*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat with k = 1 over
// the cross product n = 1..8, m = 1..4; one tester iteration per
// configuration.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile) {
  for (uint32_t n = 1; n <= 8; n++) {
    for (uint32_t m = 1; m <= 4; m++) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(m)
        .n(n)
        .k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4841*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat with n = 8 and
// k = 1 held fixed while m sweeps 1..4; one tester iteration per configuration.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_m) {
  for (uint32_t m = 1; m <= 4; m++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(m)
      .n(8)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
4856*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat with m = 4 and
// k = 1 held fixed while n sweeps 1..8; one tester iteration per configuration.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_n) {
  for (uint32_t n = 1; n <= 8; n++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(n)
      .k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
4871*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat on the full
// 4x8 tile (m = 4, n = 8) for k = 2..9.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1) {
  for (size_t k = 2; k < 10; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(8)
      .k(k)
      .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
4885*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as k_gt_1 (m = 4, n = 8, k = 2..9) but with a_stride set to 11,
// which is larger than every k exercised here.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_strided_a) {
  for (size_t k = 2; k < 10; k++) {
    GemmMicrokernelTester()
      .mr(4)
      .nr(8)
      .kr(1)
      .sr(1)
      .m(4)
      .n(8)
      .k(k)
      .a_stride(11)
      .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
4900*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat over the full
// cross product k = 2..9, n = 1..8, m = 1..4; one tester iteration per
// configuration.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_subtile) {
  for (size_t k = 2; k < 10; k++) {
    for (uint32_t n = 1; n <= 8; n++) {
      for (uint32_t m = 1; m <= 4; m++) {
        GemmMicrokernelTester()
          .mr(4)
          .nr(8)
          .kr(1)
          .sr(1)
          .m(m)
          .n(n)
          .k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
4919*4bdc9457SAndroid Build Coastguard Worker
// Runs xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat with m = 4 for
// n = 9..15 (above nr = 8) combined with k = 1, 3, 5.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4935*4bdc9457SAndroid Build Coastguard Worker
// Same sweep as n_gt_8 (m = 4, n = 9..15, k = 1, 3, 5) but with cn_stride set
// to 11, which is larger than nr = 8.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n < 16; n++) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(4)
        .nr(8)
        .kr(1)
        .sr(1)
        .m(4)
        .n(n)
        .k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4952*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 9..15 and k = 1, 3, 5 with m = 4 and a_stride set to 7.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_a) {
  for (uint32_t n = 9; n <= 15; ++n) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(1)
        .m(4).n(n).k(k)
        .a_stride(7)
        .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
4969*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 9..15, k = 1, 3, 5 and every m in 1..4, with iterations(1) for each combination.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_subtile) {
  for (uint32_t n = 9; n <= 15; ++n) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 4; ++m) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(m).n(n).k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
4988*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 16 and 24 (multiples of 8) and k = 1, 3, 5 with m fixed at 4.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(1)
        .m(4).n(n).k(k)
        .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5004*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 16 and 24 and k = 1, 3, 5 with m = 4 and cn_stride set to 11.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(1)
        .m(4).n(n).k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5021*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 16 and 24 and k = 1, 3, 5 with m = 4 and a_stride set to 7.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(1)
        .m(4).n(n).k(k)
        .a_stride(7)
        .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5038*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 16 and 24, k = 1, 3, 5 and every m in 1..4, with iterations(1) for each combination.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_subtile) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 5; k += 2) {
      for (uint32_t m = 1; m <= 4; ++m) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(m).n(n).k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5057*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 1, 3, 5, n in 1..8 and m in 1..4 with cm_stride set to 11 and iterations(1).
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm_subtile) {
  for (size_t k = 1; k <= 5; k += 2) {
    for (uint32_t n = 1; n <= 8; ++n) {
      for (uint32_t m = 1; m <= 4; ++m) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(1)
          .m(m).n(n).k(k)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5077*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 4, n = 8, k = 1 with cm_stride set to 11.
TEST(F32_GEMM_4X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(4).nr(8).kr(1).sr(1)
    .m(4).n(8).k(1)
    .cm_stride(11)
    .Test(xnn_f32_gemm_ukernel_4x8__wasmrelaxedsimd_fma_loadsplat);
}
5090*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
5091*4bdc9457SAndroid Build Coastguard Worker
5092*4bdc9457SAndroid Build Coastguard Worker
5093*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// Single configuration: m = 4, n = 8, k = 4 (tester configured with sr = 4).
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, k_eq_4) {
  GemmMicrokernelTester()
    .mr(4).nr(8).kr(1).sr(4)
    .m(4).n(8).k(4)
    .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
}
5105*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 4, n = 8, k = 4 with cn_stride set to 11.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, strided_cn) {
  GemmMicrokernelTester()
    .mr(4).nr(8).kr(1).sr(4)
    .m(4).n(8).k(4)
    .cn_stride(11)
    .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
}
5118*4bdc9457SAndroid Build Coastguard Worker
// Single configuration: m = 4, n = 8, k = 4 with a_stride set to 7.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_strided_a) {
  GemmMicrokernelTester()
    .mr(4).nr(8).kr(1).sr(4)
    .m(4).n(8).k(4)
    .a_stride(7)
    .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
}
5131*4bdc9457SAndroid Build Coastguard Worker
// Sweeps every n in 1..8 and m in 1..4 at k = 4, with iterations(1) for each combination.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile) {
  for (uint32_t n = 1; n <= 8; ++n) {
    for (uint32_t m = 1; m <= 4; ++m) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(m).n(n).k(4)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
5148*4bdc9457SAndroid Build Coastguard Worker
// Sweeps m in 1..4 at n = 8 and k = 4, with iterations(1) for each m.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_m) {
  for (uint32_t m = 1; m <= 4; ++m) {
    GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(m).n(8).k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
5163*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n in 1..8 at m = 4 and k = 4, with iterations(1) for each n.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, k_eq_4_subtile_n) {
  for (uint32_t n = 1; n <= 8; ++n) {
    GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(n).k(4)
      .iterations(1)
      .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
5178*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 1..3 (below 4) at m = 4 and n = 8.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, k_lt_4) {
  for (size_t k = 1; k <= 3; ++k) {
    GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(8).k(k)
      .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
5192*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 1..3 at m = 4 and n = 8 with a_stride set to 7.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_strided_a) {
  for (size_t k = 1; k <= 3; ++k) {
    GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(8).k(k)
      .a_stride(7)
      .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
5207*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 1..3, n in 1..8 and m in 1..4, with iterations(1) for each combination.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, k_lt_4_subtile) {
  for (size_t k = 1; k <= 3; ++k) {
    for (uint32_t n = 1; n <= 8; ++n) {
      for (uint32_t m = 1; m <= 4; ++m) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(m).n(n).k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
5226*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 5..7 (above 4) at m = 4 and n = 8.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, k_gt_4) {
  for (size_t k = 5; k <= 7; ++k) {
    GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(8).k(k)
      .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
5240*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 5..7 at m = 4 and n = 8 with a_stride set to 11.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_strided_a) {
  for (size_t k = 5; k <= 7; ++k) {
    GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(8).k(k)
      .a_stride(11)
      .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
5255*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 5..7, n in 1..8 and m in 1..4, with iterations(1) for each combination.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, k_gt_4_subtile) {
  for (size_t k = 5; k <= 7; ++k) {
    for (uint32_t n = 1; n <= 8; ++n) {
      for (uint32_t m = 1; m <= 4; ++m) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(m).n(n).k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
5274*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 8, 12, ..., 40 (multiples of 4) at m = 4 and n = 8.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, k_div_4) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(8).k(k)
      .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
5288*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 8, 12, ..., 40 at m = 4 and n = 8 with a_stride set to 43.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, k_div_4_strided_a) {
  for (size_t k = 8; k <= 40; k += 4) {
    GemmMicrokernelTester()
      .mr(4).nr(8).kr(1).sr(4)
      .m(4).n(8).k(k)
      .a_stride(43)
      .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
  }
}
5303*4bdc9457SAndroid Build Coastguard Worker
// Sweeps k = 8, 12, ..., 40, n in 1..8 and m in 1..4, with iterations(1) for each combination.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, k_div_4_subtile) {
  for (size_t k = 8; k <= 40; k += 4) {
    for (uint32_t n = 1; n <= 8; ++n) {
      for (uint32_t m = 1; m <= 4; ++m) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(m).n(n).k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
5322*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 9..15 (above the nr = 8 passed to the tester) and k = 1, 6, 11, 16 with m fixed at 4.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, n_gt_8) {
  for (uint32_t n = 9; n <= 15; ++n) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(n).k(k)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
5338*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 9..15 and k = 1, 6, 11, 16 with m = 4 and cn_stride set to 11.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_cn) {
  for (uint32_t n = 9; n <= 15; ++n) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(n).k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
5355*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 9..15 and k = 1, 6, 11, 16 with m = 4 and a_stride set to 23.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_strided_a) {
  for (uint32_t n = 9; n <= 15; ++n) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(n).k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
5372*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 9..15, k = 1, 6, 11, 16 and every m in 1..4, with iterations(1) for each combination.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, n_gt_8_subtile) {
  for (uint32_t n = 9; n <= 15; ++n) {
    for (size_t k = 1; k <= 20; k += 5) {
      for (uint32_t m = 1; m <= 4; ++m) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(m).n(n).k(k)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
5391*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 16 and 24 (multiples of 8) and k = 1, 6, 11, 16 with m fixed at 4.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, n_div_8) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(n).k(k)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
5407*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 16 and 24 and k = 1, 6, 11, 16 with m = 4 and cn_stride set to 11.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_cn) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(n).k(k)
        .cn_stride(11)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
5424*4bdc9457SAndroid Build Coastguard Worker
// Sweeps n = 16 and 24 and k = 1, 6, 11, 16 with m = 4 and a_stride set to 23.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, n_div_8_strided_a) {
  for (uint32_t n = 16; n <= 24; n += 8) {
    for (size_t k = 1; k <= 20; k += 5) {
      GemmMicrokernelTester()
        .mr(4).nr(8).kr(1).sr(4)
        .m(4).n(n).k(k)
        .a_stride(23)
        .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
    }
  }
}
5441*4bdc9457SAndroid Build Coastguard Worker
// n_div_8_subtile: exercises xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma
// with n in {16, 24}, k in {1, 6, 11, 16} and every m from 1 to 4, using a
// single tester iteration per combination.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, n_div_8_subtile) {
  for (uint32_t nc = 16; nc <= 24; nc += 8) {
    for (size_t kc = 1; kc <= 20; kc += 5) {
      for (uint32_t mc = 1; mc <= 4; ++mc) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(mc).n(nc).k(kc)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
5460*4bdc9457SAndroid Build Coastguard Worker
// strided_cm_subtile: exercises xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma
// with k in {1, 6, 11, 16}, every n from 1 to 8 and every m from 1 to 4;
// cm_stride is set to 11 and each combination runs a single tester iteration.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, strided_cm_subtile) {
  for (size_t kc = 1; kc <= 20; kc += 5) {
    for (uint32_t nc = 1; nc <= 8; ++nc) {
      for (uint32_t mc = 1; mc <= 4; ++mc) {
        GemmMicrokernelTester()
          .mr(4).nr(8).kr(1).sr(4)
          .m(mc).n(nc).k(kc)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
      }
    }
  }
}
5480*4bdc9457SAndroid Build Coastguard Worker
// strided_cm: single run of xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma
// with m = 4, n = 8, k = 4 and cm_stride set to 11.
TEST(F32_GEMM_4X8S4__WASMRELAXEDSIMD_FMA, strided_cm) {
  GemmMicrokernelTester()
    .mr(4).nr(8).kr(1).sr(4)
    .m(4).n(8).k(4)
    .cm_stride(11)
    .Test(xnn_f32_gemm_ukernel_4x8s4__wasmrelaxedsimd_fma);
}
5493*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
5494*4bdc9457SAndroid Build Coastguard Worker
5495*4bdc9457SAndroid Build Coastguard Worker
5496*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// k_eq_1: single run of xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// with m = 5, n = 8 and k = 1.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(1)
    .m(5).n(8).k(1)
    .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
}
5508*4bdc9457SAndroid Build Coastguard Worker
// strided_cn: single run of xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// with m = 5, n = 8, k = 1 and cn_stride set to 11.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(1)
    .m(5).n(8).k(1)
    .cn_stride(11)
    .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
}
5521*4bdc9457SAndroid Build Coastguard Worker
// k_eq_1_strided_a: single run of
// xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat with m = 5, n = 8,
// k = 1 and a_stride set to 3.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_strided_a) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(1)
    .m(5).n(8).k(1)
    .a_stride(3)
    .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
}
5534*4bdc9457SAndroid Build Coastguard Worker
// k_eq_1_subtile: exercises xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// at k = 1 for every n from 1 to 8 and every m from 1 to 5, one tester
// iteration per combination.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile) {
  for (uint32_t nc = 1; nc <= 8; ++nc) {
    for (uint32_t mc = 1; mc <= 5; ++mc) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(mc).n(nc).k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5551*4bdc9457SAndroid Build Coastguard Worker
// k_eq_1_subtile_m: exercises xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// at n = 8, k = 1 for every m from 1 to 5, one tester iteration each.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_m) {
  for (uint32_t mc = 1; mc <= 5; ++mc) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(mc).n(8).k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5566*4bdc9457SAndroid Build Coastguard Worker
// k_eq_1_subtile_n: exercises xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// at m = 5, k = 1 for every n from 1 to 8, one tester iteration each.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_n) {
  for (uint32_t nc = 1; nc <= 8; ++nc) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(nc).k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5581*4bdc9457SAndroid Build Coastguard Worker
// k_gt_1: exercises xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// at m = 5, n = 8 for every k from 2 to 9.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1) {
  for (size_t kc = 2; kc <= 9; ++kc) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(kc)
      .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5595*4bdc9457SAndroid Build Coastguard Worker
// k_gt_1_strided_a: exercises xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// at m = 5, n = 8 for every k from 2 to 9, with a_stride set to 11.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_strided_a) {
  for (size_t kc = 2; kc <= 9; ++kc) {
    GemmMicrokernelTester()
      .mr(5).nr(8).kr(1).sr(1)
      .m(5).n(8).k(kc)
      .a_stride(11)
      .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5610*4bdc9457SAndroid Build Coastguard Worker
// k_gt_1_subtile: exercises xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// for every k from 2 to 9, every n from 1 to 8 and every m from 1 to 5,
// one tester iteration per combination.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_subtile) {
  for (size_t kc = 2; kc <= 9; ++kc) {
    for (uint32_t nc = 1; nc <= 8; ++nc) {
      for (uint32_t mc = 1; mc <= 5; ++mc) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(mc).n(nc).k(kc)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5629*4bdc9457SAndroid Build Coastguard Worker
// n_gt_8: exercises xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// at m = 5 for every n from 9 to 15 and k in {1, 3, 5}.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8) {
  for (uint32_t nc = 9; nc <= 15; ++nc) {
    for (size_t kc = 1; kc <= 5; kc += 2) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(nc).k(kc)
        .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5645*4bdc9457SAndroid Build Coastguard Worker
// n_gt_8_strided_cn: exercises xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// at m = 5 for every n from 9 to 15 and k in {1, 3, 5}, with cn_stride set
// to 11.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_cn) {
  for (uint32_t nc = 9; nc <= 15; ++nc) {
    for (size_t kc = 1; kc <= 5; kc += 2) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(nc).k(kc)
        .cn_stride(11)
        .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5662*4bdc9457SAndroid Build Coastguard Worker
// n_gt_8_strided_a: exercises xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// at m = 5 for every n from 9 to 15 and k in {1, 3, 5}, with a_stride set
// to 7.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_a) {
  for (uint32_t nc = 9; nc <= 15; ++nc) {
    for (size_t kc = 1; kc <= 5; kc += 2) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(nc).k(kc)
        .a_stride(7)
        .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5679*4bdc9457SAndroid Build Coastguard Worker
// n_gt_8_subtile: exercises xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// for every n from 9 to 15, k in {1, 3, 5} and every m from 1 to 5, one
// tester iteration per combination.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_subtile) {
  for (uint32_t nc = 9; nc <= 15; ++nc) {
    for (size_t kc = 1; kc <= 5; kc += 2) {
      for (uint32_t mc = 1; mc <= 5; ++mc) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(mc).n(nc).k(kc)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5698*4bdc9457SAndroid Build Coastguard Worker
// n_div_8: exercises xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// at m = 5 with n in {16, 24} and k in {1, 3, 5}.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8) {
  for (uint32_t nc = 16; nc <= 24; nc += 8) {
    for (size_t kc = 1; kc <= 5; kc += 2) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(nc).k(kc)
        .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5714*4bdc9457SAndroid Build Coastguard Worker
// n_div_8_strided_cn: exercises xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// at m = 5 with n in {16, 24} and k in {1, 3, 5}, with cn_stride set to 11.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_cn) {
  for (uint32_t nc = 16; nc <= 24; nc += 8) {
    for (size_t kc = 1; kc <= 5; kc += 2) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(nc).k(kc)
        .cn_stride(11)
        .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5731*4bdc9457SAndroid Build Coastguard Worker
// n_div_8_strided_a: exercises xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// at m = 5 with n in {16, 24} and k in {1, 3, 5}, with a_stride set to 7.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_a) {
  for (uint32_t nc = 16; nc <= 24; nc += 8) {
    for (size_t kc = 1; kc <= 5; kc += 2) {
      GemmMicrokernelTester()
        .mr(5).nr(8).kr(1).sr(1)
        .m(5).n(nc).k(kc)
        .a_stride(7)
        .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5748*4bdc9457SAndroid Build Coastguard Worker
// n_div_8_subtile: exercises xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// with n in {16, 24}, k in {1, 3, 5} and every m from 1 to 5, one tester
// iteration per combination.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_subtile) {
  for (uint32_t nc = 16; nc <= 24; nc += 8) {
    for (size_t kc = 1; kc <= 5; kc += 2) {
      for (uint32_t mc = 1; mc <= 5; ++mc) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(mc).n(nc).k(kc)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5767*4bdc9457SAndroid Build Coastguard Worker
// strided_cm_subtile: exercises xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// with k in {1, 3, 5}, every n from 1 to 8 and every m from 1 to 5;
// cm_stride is set to 11 and each combination runs a single tester iteration.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm_subtile) {
  for (size_t kc = 1; kc <= 5; kc += 2) {
    for (uint32_t nc = 1; nc <= 8; ++nc) {
      for (uint32_t mc = 1; mc <= 5; ++mc) {
        GemmMicrokernelTester()
          .mr(5).nr(8).kr(1).sr(1)
          .m(mc).n(nc).k(kc)
          .cm_stride(11)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5787*4bdc9457SAndroid Build Coastguard Worker
// strided_cm: single run of xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat
// with m = 5, n = 8, k = 1 and cm_stride set to 11.
TEST(F32_GEMM_5X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm) {
  GemmMicrokernelTester()
    .mr(5).nr(8).kr(1).sr(1)
    .m(5).n(8).k(1)
    .cm_stride(11)
    .Test(xnn_f32_gemm_ukernel_5x8__wasmrelaxedsimd_fma_loadsplat);
}
5800*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
5801*4bdc9457SAndroid Build Coastguard Worker
5802*4bdc9457SAndroid Build Coastguard Worker
5803*4bdc9457SAndroid Build Coastguard Worker #if XNN_ARCH_WASMRELAXEDSIMD
// k_eq_1: single run of xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat
// with m = 6, n = 8 and k = 1.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1) {
  GemmMicrokernelTester()
    .mr(6).nr(8).kr(1).sr(1)
    .m(6).n(8).k(1)
    .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
}
5815*4bdc9457SAndroid Build Coastguard Worker
// strided_cn: single run of xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat
// with m = 6, n = 8, k = 1 and cn_stride set to 11.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cn) {
  GemmMicrokernelTester()
    .mr(6).nr(8).kr(1).sr(1)
    .m(6).n(8).k(1)
    .cn_stride(11)
    .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
}
5828*4bdc9457SAndroid Build Coastguard Worker
// k_eq_1_strided_a: single run of
// xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat with m = 6, n = 8,
// k = 1 and a_stride set to 3.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_strided_a) {
  GemmMicrokernelTester()
    .mr(6).nr(8).kr(1).sr(1)
    .m(6).n(8).k(1)
    .a_stride(3)
    .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
}
5841*4bdc9457SAndroid Build Coastguard Worker
// k_eq_1_subtile: exercises xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat
// at k = 1 for every n from 1 to 8 and every m from 1 to 6, one tester
// iteration per combination.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile) {
  for (uint32_t nc = 1; nc <= 8; ++nc) {
    for (uint32_t mc = 1; mc <= 6; ++mc) {
      GemmMicrokernelTester()
        .mr(6).nr(8).kr(1).sr(1)
        .m(mc).n(nc).k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5858*4bdc9457SAndroid Build Coastguard Worker
// k_eq_1_subtile_m: exercises xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat
// at n = 8, k = 1 for every m from 1 to 6, one tester iteration each.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_m) {
  for (uint32_t mc = 1; mc <= 6; ++mc) {
    GemmMicrokernelTester()
      .mr(6).nr(8).kr(1).sr(1)
      .m(mc).n(8).k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5873*4bdc9457SAndroid Build Coastguard Worker
// k_eq_1_subtile_n: exercises xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat
// at m = 6, k = 1 for every n from 1 to 8, one tester iteration each.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_eq_1_subtile_n) {
  for (uint32_t nc = 1; nc <= 8; ++nc) {
    GemmMicrokernelTester()
      .mr(6).nr(8).kr(1).sr(1)
      .m(6).n(nc).k(1)
      .iterations(1)
      .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5888*4bdc9457SAndroid Build Coastguard Worker
// k_gt_1: exercises xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat
// at m = 6, n = 8 for every k from 2 to 9.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1) {
  for (size_t kc = 2; kc <= 9; ++kc) {
    GemmMicrokernelTester()
      .mr(6).nr(8).kr(1).sr(1)
      .m(6).n(8).k(kc)
      .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5902*4bdc9457SAndroid Build Coastguard Worker
// k_gt_1_strided_a: exercises xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat
// at m = 6, n = 8 for every k from 2 to 9, with a_stride set to 11.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_strided_a) {
  for (size_t kc = 2; kc <= 9; ++kc) {
    GemmMicrokernelTester()
      .mr(6).nr(8).kr(1).sr(1)
      .m(6).n(8).k(kc)
      .a_stride(11)
      .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
  }
}
5917*4bdc9457SAndroid Build Coastguard Worker
// Covers every (k, n, m) combination with k = 2..9, n = 1..8 and m = 1..6,
// using a single iteration per combination.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, k_gt_1_subtile) {
  for (size_t k_size = 2; k_size <= 9; ++k_size) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 6; ++m_size) {
        GemmMicrokernelTester()
            .mr(6).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
5936*4bdc9457SAndroid Build Coastguard Worker
// Exercises n = 9..15 (above nr=8) with m=6 and k in {1, 3, 5}.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8) {
  for (uint32_t n_size = 9; n_size <= 15; ++n_size) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(n_size).k(k_size)
          .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5952*4bdc9457SAndroid Build Coastguard Worker
// Exercises n = 9..15 with m=6 and k in {1, 3, 5}, with cn_stride set to 11.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_cn) {
  for (uint32_t n_size = 9; n_size <= 15; ++n_size) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5969*4bdc9457SAndroid Build Coastguard Worker
// Exercises n = 9..15 with m=6 and k in {1, 3, 5}, with a_stride set to 7.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_strided_a) {
  for (uint32_t n_size = 9; n_size <= 15; ++n_size) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(n_size).k(k_size)
          .a_stride(7)
          .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
5986*4bdc9457SAndroid Build Coastguard Worker
// Covers n = 9..15, k in {1, 3, 5} and m = 1..6, one iteration per
// combination.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_gt_8_subtile) {
  for (uint32_t n_size = 9; n_size <= 15; ++n_size) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      for (uint32_t m_size = 1; m_size <= 6; ++m_size) {
        GemmMicrokernelTester()
            .mr(6).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
6005*4bdc9457SAndroid Build Coastguard Worker
// Exercises n in {16, 24} (multiples of nr=8) with m=6 and k in {1, 3, 5}.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(n_size).k(k_size)
          .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
6021*4bdc9457SAndroid Build Coastguard Worker
// Exercises n in {16, 24} with m=6 and k in {1, 3, 5}, with cn_stride set
// to 11.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_cn) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(n_size).k(k_size)
          .cn_stride(11)
          .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
6038*4bdc9457SAndroid Build Coastguard Worker
// Exercises n in {16, 24} with m=6 and k in {1, 3, 5}, with a_stride set
// to 7.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_strided_a) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(6).nr(8).kr(1).sr(1)
          .m(6).n(n_size).k(k_size)
          .a_stride(7)
          .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
    }
  }
}
6055*4bdc9457SAndroid Build Coastguard Worker
// Covers n in {16, 24}, k in {1, 3, 5} and m = 1..6, one iteration per
// combination.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, n_div_8_subtile) {
  for (uint32_t n_size = 16; n_size <= 24; n_size += 8) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      for (uint32_t m_size = 1; m_size <= 6; ++m_size) {
        GemmMicrokernelTester()
            .mr(6).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
6074*4bdc9457SAndroid Build Coastguard Worker
// Covers k in {1, 3, 5}, n = 1..8 and m = 1..6 with cm_stride set to 11,
// one iteration per combination.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm_subtile) {
  for (size_t k_size = 1; k_size <= 5; k_size += 2) {
    for (uint32_t n_size = 1; n_size <= 8; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 6; ++m_size) {
        GemmMicrokernelTester()
            .mr(6).nr(8).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .cm_stride(11)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
      }
    }
  }
}
6094*4bdc9457SAndroid Build Coastguard Worker
// Single run with m=6, n=8, k=1 and cm_stride set to 11.
TEST(F32_GEMM_6X8__WASMRELAXEDSIMD_FMA_LOADSPLAT, strided_cm) {
  GemmMicrokernelTester()
      .mr(6).nr(8).kr(1).sr(1)
      .m(6).n(8).k(1)
      .cm_stride(11)
      .Test(xnn_f32_gemm_ukernel_6x8__wasmrelaxedsimd_fma_loadsplat);
}
6107*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_ARCH_WASMRELAXEDSIMD
6108*4bdc9457SAndroid Build Coastguard Worker
6109*4bdc9457SAndroid Build Coastguard Worker
// Single run of the 2x4 scalar kernel with m=2, n=4, k=1.
TEST(F32_GEMM_2X4__SCALAR, k_eq_1) {
  GemmMicrokernelTester()
      .mr(2).nr(4).kr(1).sr(1)
      .m(2).n(4).k(1)
      .Test(xnn_f32_gemm_ukernel_2x4__scalar);
}
6121*4bdc9457SAndroid Build Coastguard Worker
// Single run with m=2, n=4, k=1 and cn_stride set to 7.
TEST(F32_GEMM_2X4__SCALAR, strided_cn) {
  GemmMicrokernelTester()
      .mr(2).nr(4).kr(1).sr(1)
      .m(2).n(4).k(1)
      .cn_stride(7)
      .Test(xnn_f32_gemm_ukernel_2x4__scalar);
}
6134*4bdc9457SAndroid Build Coastguard Worker
// Single run with m=2, n=4, k=1 and a_stride set to 3.
TEST(F32_GEMM_2X4__SCALAR, k_eq_1_strided_a) {
  GemmMicrokernelTester()
      .mr(2).nr(4).kr(1).sr(1)
      .m(2).n(4).k(1)
      .a_stride(3)
      .Test(xnn_f32_gemm_ukernel_2x4__scalar);
}
6147*4bdc9457SAndroid Build Coastguard Worker
// Covers n = 1..4 and m = 1..2 at k=1, one iteration per combination.
TEST(F32_GEMM_2X4__SCALAR, k_eq_1_subtile) {
  for (uint32_t n_size = 1; n_size <= 4; ++n_size) {
    for (uint32_t m_size = 1; m_size <= 2; ++m_size) {
      GemmMicrokernelTester()
          .mr(2).nr(4).kr(1).sr(1)
          .m(m_size).n(n_size).k(1)
          .iterations(1)
          .Test(xnn_f32_gemm_ukernel_2x4__scalar);
    }
  }
}
6164*4bdc9457SAndroid Build Coastguard Worker
// Covers m = 1..2 with n=4 and k=1, one iteration per value of m.
TEST(F32_GEMM_2X4__SCALAR, k_eq_1_subtile_m) {
  for (uint32_t m_size = 1; m_size <= 2; ++m_size) {
    GemmMicrokernelTester()
        .mr(2).nr(4).kr(1).sr(1)
        .m(m_size).n(4).k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_2x4__scalar);
  }
}
6179*4bdc9457SAndroid Build Coastguard Worker
// Covers n = 1..4 with m=2 and k=1, one iteration per value of n.
TEST(F32_GEMM_2X4__SCALAR, k_eq_1_subtile_n) {
  for (uint32_t n_size = 1; n_size <= 4; ++n_size) {
    GemmMicrokernelTester()
        .mr(2).nr(4).kr(1).sr(1)
        .m(2).n(n_size).k(1)
        .iterations(1)
        .Test(xnn_f32_gemm_ukernel_2x4__scalar);
  }
}
6194*4bdc9457SAndroid Build Coastguard Worker
// Runs the 2x4 scalar kernel with m=2, n=4 for every k from 2 through 9.
TEST(F32_GEMM_2X4__SCALAR, k_gt_1) {
  for (size_t k_size = 2; k_size <= 9; ++k_size) {
    GemmMicrokernelTester()
        .mr(2).nr(4).kr(1).sr(1)
        .m(2).n(4).k(k_size)
        .Test(xnn_f32_gemm_ukernel_2x4__scalar);
  }
}
6208*4bdc9457SAndroid Build Coastguard Worker
// Same k sweep as k_gt_1 (k = 2..9, m=2, n=4), with a_stride set to 11.
TEST(F32_GEMM_2X4__SCALAR, k_gt_1_strided_a) {
  for (size_t k_size = 2; k_size <= 9; ++k_size) {
    GemmMicrokernelTester()
        .mr(2).nr(4).kr(1).sr(1)
        .m(2).n(4).k(k_size)
        .a_stride(11)
        .Test(xnn_f32_gemm_ukernel_2x4__scalar);
  }
}
6223*4bdc9457SAndroid Build Coastguard Worker
// Covers every (k, n, m) combination with k = 2..9, n = 1..4 and m = 1..2,
// using a single iteration per combination.
TEST(F32_GEMM_2X4__SCALAR, k_gt_1_subtile) {
  for (size_t k_size = 2; k_size <= 9; ++k_size) {
    for (uint32_t n_size = 1; n_size <= 4; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 2; ++m_size) {
        GemmMicrokernelTester()
            .mr(2).nr(4).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_2x4__scalar);
      }
    }
  }
}
6242*4bdc9457SAndroid Build Coastguard Worker
// Exercises n = 5..7 (above nr=4) with m=2 and k in {1, 3, 5}.
TEST(F32_GEMM_2X4__SCALAR, n_gt_4) {
  for (uint32_t n_size = 5; n_size <= 7; ++n_size) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(2).nr(4).kr(1).sr(1)
          .m(2).n(n_size).k(k_size)
          .Test(xnn_f32_gemm_ukernel_2x4__scalar);
    }
  }
}
6258*4bdc9457SAndroid Build Coastguard Worker
// Exercises n = 5..7 with m=2 and k in {1, 3, 5}, with cn_stride set to 7.
TEST(F32_GEMM_2X4__SCALAR, n_gt_4_strided_cn) {
  for (uint32_t n_size = 5; n_size <= 7; ++n_size) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(2).nr(4).kr(1).sr(1)
          .m(2).n(n_size).k(k_size)
          .cn_stride(7)
          .Test(xnn_f32_gemm_ukernel_2x4__scalar);
    }
  }
}
6275*4bdc9457SAndroid Build Coastguard Worker
// Exercises n = 5..7 with m=2 and k in {1, 3, 5}, with a_stride set to 7.
TEST(F32_GEMM_2X4__SCALAR, n_gt_4_strided_a) {
  for (uint32_t n_size = 5; n_size <= 7; ++n_size) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(2).nr(4).kr(1).sr(1)
          .m(2).n(n_size).k(k_size)
          .a_stride(7)
          .Test(xnn_f32_gemm_ukernel_2x4__scalar);
    }
  }
}
6292*4bdc9457SAndroid Build Coastguard Worker
// Covers n = 5..7, k in {1, 3, 5} and m = 1..2, one iteration per
// combination.
TEST(F32_GEMM_2X4__SCALAR, n_gt_4_subtile) {
  for (uint32_t n_size = 5; n_size <= 7; ++n_size) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      for (uint32_t m_size = 1; m_size <= 2; ++m_size) {
        GemmMicrokernelTester()
            .mr(2).nr(4).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_2x4__scalar);
      }
    }
  }
}
6311*4bdc9457SAndroid Build Coastguard Worker
// Exercises n in {8, 12} (multiples of nr=4) with m=2 and k in {1, 3, 5}.
TEST(F32_GEMM_2X4__SCALAR, n_div_4) {
  for (uint32_t n_size = 8; n_size <= 12; n_size += 4) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(2).nr(4).kr(1).sr(1)
          .m(2).n(n_size).k(k_size)
          .Test(xnn_f32_gemm_ukernel_2x4__scalar);
    }
  }
}
6327*4bdc9457SAndroid Build Coastguard Worker
// Exercises n in {8, 12} with m=2 and k in {1, 3, 5}, with cn_stride set
// to 7.
TEST(F32_GEMM_2X4__SCALAR, n_div_4_strided_cn) {
  for (uint32_t n_size = 8; n_size <= 12; n_size += 4) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(2).nr(4).kr(1).sr(1)
          .m(2).n(n_size).k(k_size)
          .cn_stride(7)
          .Test(xnn_f32_gemm_ukernel_2x4__scalar);
    }
  }
}
6344*4bdc9457SAndroid Build Coastguard Worker
// Exercises n in {8, 12} with m=2 and k in {1, 3, 5}, with a_stride set
// to 7.
TEST(F32_GEMM_2X4__SCALAR, n_div_4_strided_a) {
  for (uint32_t n_size = 8; n_size <= 12; n_size += 4) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      GemmMicrokernelTester()
          .mr(2).nr(4).kr(1).sr(1)
          .m(2).n(n_size).k(k_size)
          .a_stride(7)
          .Test(xnn_f32_gemm_ukernel_2x4__scalar);
    }
  }
}
6361*4bdc9457SAndroid Build Coastguard Worker
// Covers n in {8, 12}, k in {1, 3, 5} and m = 1..2, one iteration per
// combination.
TEST(F32_GEMM_2X4__SCALAR, n_div_4_subtile) {
  for (uint32_t n_size = 8; n_size <= 12; n_size += 4) {
    for (size_t k_size = 1; k_size <= 5; k_size += 2) {
      for (uint32_t m_size = 1; m_size <= 2; ++m_size) {
        GemmMicrokernelTester()
            .mr(2).nr(4).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_2x4__scalar);
      }
    }
  }
}
6380*4bdc9457SAndroid Build Coastguard Worker
// Covers k in {1, 3, 5}, n = 1..4 and m = 1..2 with cm_stride set to 7,
// one iteration per combination.
TEST(F32_GEMM_2X4__SCALAR, strided_cm_subtile) {
  for (size_t k_size = 1; k_size <= 5; k_size += 2) {
    for (uint32_t n_size = 1; n_size <= 4; ++n_size) {
      for (uint32_t m_size = 1; m_size <= 2; ++m_size) {
        GemmMicrokernelTester()
            .mr(2).nr(4).kr(1).sr(1)
            .m(m_size).n(n_size).k(k_size)
            .cm_stride(7)
            .iterations(1)
            .Test(xnn_f32_gemm_ukernel_2x4__scalar);
      }
    }
  }
}
6400*4bdc9457SAndroid Build Coastguard Worker
// Single run with m=2, n=4, k=1 and cm_stride set to 7.
TEST(F32_GEMM_2X4__SCALAR, strided_cm) {
  GemmMicrokernelTester()
      .mr(2).nr(4).kr(1).sr(1)
      .m(2).n(4).k(1)
      .cm_stride(7)
      .Test(xnn_f32_gemm_ukernel_2x4__scalar);
}
6413