1*4bdc9457SAndroid Build Coastguard Worker // Copyright (c) Facebook, Inc. and its affiliates.
2*4bdc9457SAndroid Build Coastguard Worker // All rights reserved.
3*4bdc9457SAndroid Build Coastguard Worker //
4*4bdc9457SAndroid Build Coastguard Worker // Copyright 2019 Google LLC
5*4bdc9457SAndroid Build Coastguard Worker //
6*4bdc9457SAndroid Build Coastguard Worker // This source code is licensed under the BSD-style license found in the
7*4bdc9457SAndroid Build Coastguard Worker // LICENSE file in the root directory of this source tree.
8*4bdc9457SAndroid Build Coastguard Worker
9*4bdc9457SAndroid Build Coastguard Worker #pragma once
10*4bdc9457SAndroid Build Coastguard Worker
11*4bdc9457SAndroid Build Coastguard Worker #include <stdbool.h>
12*4bdc9457SAndroid Build Coastguard Worker #include <stddef.h>
13*4bdc9457SAndroid Build Coastguard Worker #include <stdint.h>
14*4bdc9457SAndroid Build Coastguard Worker
15*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack.h>
16*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/common.h>
17*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/microfnptr.h>
18*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/microparams.h>
19*4bdc9457SAndroid Build Coastguard Worker
20*4bdc9457SAndroid Build Coastguard Worker
21*4bdc9457SAndroid Build Coastguard Worker struct xnn_hmp_gemm_ukernel {
22*4bdc9457SAndroid Build Coastguard Worker xnn_gemm_ukernel_function function[XNN_MAX_UARCH_TYPES];
23*4bdc9457SAndroid Build Coastguard Worker #if XNN_PLATFORM_JIT
24*4bdc9457SAndroid Build Coastguard Worker size_t generated_code_offset[XNN_MAX_UARCH_TYPES];
25*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_PLATFORM_JIT
26*4bdc9457SAndroid Build Coastguard Worker };
27*4bdc9457SAndroid Build Coastguard Worker
xnn_init_hmp_gemm_ukernel(xnn_gemm_ukernel_function function)28*4bdc9457SAndroid Build Coastguard Worker static inline struct xnn_hmp_gemm_ukernel xnn_init_hmp_gemm_ukernel(xnn_gemm_ukernel_function function) {
29*4bdc9457SAndroid Build Coastguard Worker struct xnn_hmp_gemm_ukernel ukernel = {{ function }};
30*4bdc9457SAndroid Build Coastguard Worker for (size_t i = 1; i < XNN_MAX_UARCH_TYPES; i++) {
31*4bdc9457SAndroid Build Coastguard Worker ukernel.function[i] = function;
32*4bdc9457SAndroid Build Coastguard Worker #if XNN_PLATFORM_JIT
33*4bdc9457SAndroid Build Coastguard Worker ukernel.generated_code_offset[i] = SIZE_MAX;
34*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_PLATFORM_JIT
35*4bdc9457SAndroid Build Coastguard Worker }
36*4bdc9457SAndroid Build Coastguard Worker return ukernel;
37*4bdc9457SAndroid Build Coastguard Worker }
38*4bdc9457SAndroid Build Coastguard Worker
xnn_is_hmp_gemm_ukernel(struct xnn_hmp_gemm_ukernel ukernel)39*4bdc9457SAndroid Build Coastguard Worker static inline bool xnn_is_hmp_gemm_ukernel(struct xnn_hmp_gemm_ukernel ukernel) {
40*4bdc9457SAndroid Build Coastguard Worker #if XNN_MAX_UARCH_TYPES == 1
41*4bdc9457SAndroid Build Coastguard Worker return false;
42*4bdc9457SAndroid Build Coastguard Worker #else
43*4bdc9457SAndroid Build Coastguard Worker uintptr_t default_function = (uintptr_t) ukernel.function[XNN_UARCH_DEFAULT];
44*4bdc9457SAndroid Build Coastguard Worker uintptr_t difference = 0;
45*4bdc9457SAndroid Build Coastguard Worker for (size_t i = 1; i < XNN_MAX_UARCH_TYPES; i++) {
46*4bdc9457SAndroid Build Coastguard Worker difference |= (default_function ^ (uintptr_t) ukernel.function[i]);
47*4bdc9457SAndroid Build Coastguard Worker }
48*4bdc9457SAndroid Build Coastguard Worker return difference != 0;
49*4bdc9457SAndroid Build Coastguard Worker #endif
50*4bdc9457SAndroid Build Coastguard Worker }
51*4bdc9457SAndroid Build Coastguard Worker
52*4bdc9457SAndroid Build Coastguard Worker struct xnn_hmp_igemm_ukernel {
53*4bdc9457SAndroid Build Coastguard Worker xnn_igemm_ukernel_function function[XNN_MAX_UARCH_TYPES];
54*4bdc9457SAndroid Build Coastguard Worker #if XNN_PLATFORM_JIT
55*4bdc9457SAndroid Build Coastguard Worker size_t generated_code_offset[XNN_MAX_UARCH_TYPES];
56*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_PLATFORM_JIT
57*4bdc9457SAndroid Build Coastguard Worker };
58*4bdc9457SAndroid Build Coastguard Worker
xnn_init_hmp_igemm_ukernel(xnn_igemm_ukernel_function function)59*4bdc9457SAndroid Build Coastguard Worker static inline struct xnn_hmp_igemm_ukernel xnn_init_hmp_igemm_ukernel(xnn_igemm_ukernel_function function) {
60*4bdc9457SAndroid Build Coastguard Worker struct xnn_hmp_igemm_ukernel ukernel = {{ function }};
61*4bdc9457SAndroid Build Coastguard Worker for (size_t i = 1; i < XNN_MAX_UARCH_TYPES; i++) {
62*4bdc9457SAndroid Build Coastguard Worker ukernel.function[i] = function;
63*4bdc9457SAndroid Build Coastguard Worker #if XNN_PLATFORM_JIT
64*4bdc9457SAndroid Build Coastguard Worker ukernel.generated_code_offset[i] = SIZE_MAX;
65*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_PLATFORM_JIT
66*4bdc9457SAndroid Build Coastguard Worker }
67*4bdc9457SAndroid Build Coastguard Worker return ukernel;
68*4bdc9457SAndroid Build Coastguard Worker }
69*4bdc9457SAndroid Build Coastguard Worker
xnn_is_hmp_igemm_ukernel(struct xnn_hmp_igemm_ukernel ukernel)70*4bdc9457SAndroid Build Coastguard Worker static inline bool xnn_is_hmp_igemm_ukernel(struct xnn_hmp_igemm_ukernel ukernel) {
71*4bdc9457SAndroid Build Coastguard Worker #if XNN_MAX_UARCH_TYPES == 1
72*4bdc9457SAndroid Build Coastguard Worker return false;
73*4bdc9457SAndroid Build Coastguard Worker #else
74*4bdc9457SAndroid Build Coastguard Worker uintptr_t default_function = (uintptr_t) ukernel.function[XNN_UARCH_DEFAULT];
75*4bdc9457SAndroid Build Coastguard Worker uintptr_t difference = 0;
76*4bdc9457SAndroid Build Coastguard Worker for (size_t i = 1; i < XNN_MAX_UARCH_TYPES; i++) {
77*4bdc9457SAndroid Build Coastguard Worker difference |= (default_function ^ (uintptr_t) ukernel.function[i]);
78*4bdc9457SAndroid Build Coastguard Worker }
79*4bdc9457SAndroid Build Coastguard Worker return difference != 0;
80*4bdc9457SAndroid Build Coastguard Worker #endif
81*4bdc9457SAndroid Build Coastguard Worker }
82*4bdc9457SAndroid Build Coastguard Worker
83*4bdc9457SAndroid Build Coastguard Worker // Largest GEMM/IGEMM MR used in init.c is 7 (x86 AVX512).
84*4bdc9457SAndroid Build Coastguard Worker // Largest GEMM/IGEMM MR is 8 in e2e benchmarks.
85*4bdc9457SAndroid Build Coastguard Worker #define XNN_MAX_MR 8
86*4bdc9457SAndroid Build Coastguard Worker
87*4bdc9457SAndroid Build Coastguard Worker struct gemm_fused_ukernels {
88*4bdc9457SAndroid Build Coastguard Worker struct xnn_hmp_gemm_ukernel gemm[XNN_MAX_MR];
89*4bdc9457SAndroid Build Coastguard Worker struct xnn_hmp_igemm_ukernel igemm[XNN_MAX_MR];
90*4bdc9457SAndroid Build Coastguard Worker };
91*4bdc9457SAndroid Build Coastguard Worker
92*4bdc9457SAndroid Build Coastguard Worker struct transpose_parameters {
93*4bdc9457SAndroid Build Coastguard Worker union {
94*4bdc9457SAndroid Build Coastguard Worker xnn_transposec_ukernel_function const_size_ukernel;
95*4bdc9457SAndroid Build Coastguard Worker xnn_transposev_ukernel_function variable_size_ukernel;
96*4bdc9457SAndroid Build Coastguard Worker };
97*4bdc9457SAndroid Build Coastguard Worker // Maximum number of elements to process per ukernel call.
98*4bdc9457SAndroid Build Coastguard Worker uint8_t tile_size;
99*4bdc9457SAndroid Build Coastguard Worker };
100*4bdc9457SAndroid Build Coastguard Worker
101*4bdc9457SAndroid Build Coastguard Worker #if XNN_PLATFORM_JIT
102*4bdc9457SAndroid Build Coastguard Worker struct xnn_hmp_gemm_codegen {
103*4bdc9457SAndroid Build Coastguard Worker xnn_jit_gemm_code_generator_function function[XNN_MAX_UARCH_TYPES];
104*4bdc9457SAndroid Build Coastguard Worker };
105*4bdc9457SAndroid Build Coastguard Worker
xnn_init_hmp_gemm_codegen(xnn_jit_gemm_code_generator_function function)106*4bdc9457SAndroid Build Coastguard Worker static inline struct xnn_hmp_gemm_codegen xnn_init_hmp_gemm_codegen(xnn_jit_gemm_code_generator_function function) {
107*4bdc9457SAndroid Build Coastguard Worker struct xnn_hmp_gemm_codegen ukernel = {{ function }};
108*4bdc9457SAndroid Build Coastguard Worker for (size_t i = 1; i < XNN_MAX_UARCH_TYPES; i++) {
109*4bdc9457SAndroid Build Coastguard Worker ukernel.function[i] = function;
110*4bdc9457SAndroid Build Coastguard Worker }
111*4bdc9457SAndroid Build Coastguard Worker return ukernel;
112*4bdc9457SAndroid Build Coastguard Worker }
113*4bdc9457SAndroid Build Coastguard Worker
xnn_is_hmp_gemm_codegen(struct xnn_hmp_gemm_codegen ukernel)114*4bdc9457SAndroid Build Coastguard Worker static inline bool xnn_is_hmp_gemm_codegen(struct xnn_hmp_gemm_codegen ukernel) {
115*4bdc9457SAndroid Build Coastguard Worker #if XNN_MAX_UARCH_TYPES == 1
116*4bdc9457SAndroid Build Coastguard Worker return false;
117*4bdc9457SAndroid Build Coastguard Worker #else
118*4bdc9457SAndroid Build Coastguard Worker uintptr_t default_function = (uintptr_t) ukernel.function[XNN_UARCH_DEFAULT];
119*4bdc9457SAndroid Build Coastguard Worker uintptr_t difference = 0;
120*4bdc9457SAndroid Build Coastguard Worker for (size_t i = 1; i < XNN_MAX_UARCH_TYPES; i++) {
121*4bdc9457SAndroid Build Coastguard Worker difference |= (default_function ^ (uintptr_t) ukernel.function[i]);
122*4bdc9457SAndroid Build Coastguard Worker }
123*4bdc9457SAndroid Build Coastguard Worker return difference != 0;
124*4bdc9457SAndroid Build Coastguard Worker #endif
125*4bdc9457SAndroid Build Coastguard Worker }
126*4bdc9457SAndroid Build Coastguard Worker
127*4bdc9457SAndroid Build Coastguard Worker struct xnn_hmp_igemm_codegen {
128*4bdc9457SAndroid Build Coastguard Worker xnn_jit_igemm_code_generator_function function[XNN_MAX_UARCH_TYPES];
129*4bdc9457SAndroid Build Coastguard Worker };
130*4bdc9457SAndroid Build Coastguard Worker
xnn_init_hmp_igemm_codegen(xnn_jit_igemm_code_generator_function function)131*4bdc9457SAndroid Build Coastguard Worker static inline struct xnn_hmp_igemm_codegen xnn_init_hmp_igemm_codegen(xnn_jit_igemm_code_generator_function function) {
132*4bdc9457SAndroid Build Coastguard Worker struct xnn_hmp_igemm_codegen ukernel = {{ function }};
133*4bdc9457SAndroid Build Coastguard Worker for (size_t i = 1; i < XNN_MAX_UARCH_TYPES; i++) {
134*4bdc9457SAndroid Build Coastguard Worker ukernel.function[i] = function;
135*4bdc9457SAndroid Build Coastguard Worker }
136*4bdc9457SAndroid Build Coastguard Worker return ukernel;
137*4bdc9457SAndroid Build Coastguard Worker }
138*4bdc9457SAndroid Build Coastguard Worker
xnn_is_hmp_igemm_codegen(struct xnn_hmp_igemm_codegen ukernel)139*4bdc9457SAndroid Build Coastguard Worker static inline bool xnn_is_hmp_igemm_codegen(struct xnn_hmp_igemm_codegen ukernel) {
140*4bdc9457SAndroid Build Coastguard Worker #if XNN_MAX_UARCH_TYPES == 1
141*4bdc9457SAndroid Build Coastguard Worker return false;
142*4bdc9457SAndroid Build Coastguard Worker #else
143*4bdc9457SAndroid Build Coastguard Worker uintptr_t default_function = (uintptr_t) ukernel.function[XNN_UARCH_DEFAULT];
144*4bdc9457SAndroid Build Coastguard Worker uintptr_t difference = 0;
145*4bdc9457SAndroid Build Coastguard Worker for (size_t i = 1; i < XNN_MAX_UARCH_TYPES; i++) {
146*4bdc9457SAndroid Build Coastguard Worker difference |= (default_function ^ (uintptr_t) ukernel.function[i]);
147*4bdc9457SAndroid Build Coastguard Worker }
148*4bdc9457SAndroid Build Coastguard Worker return difference != 0;
149*4bdc9457SAndroid Build Coastguard Worker #endif
150*4bdc9457SAndroid Build Coastguard Worker }
151*4bdc9457SAndroid Build Coastguard Worker
152*4bdc9457SAndroid Build Coastguard Worker struct gemm_codegens {
153*4bdc9457SAndroid Build Coastguard Worker struct xnn_hmp_gemm_codegen gemm;
154*4bdc9457SAndroid Build Coastguard Worker struct xnn_hmp_igemm_codegen igemm;
155*4bdc9457SAndroid Build Coastguard Worker // Optional JIT GEMM and IGEMM micro-kernels with MR=1 and the same NR and KR parameters.
156*4bdc9457SAndroid Build Coastguard Worker struct xnn_hmp_gemm_codegen gemm1;
157*4bdc9457SAndroid Build Coastguard Worker struct xnn_hmp_igemm_codegen igemm1;
158*4bdc9457SAndroid Build Coastguard Worker };
159*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_PLATFORM_JIT
160*4bdc9457SAndroid Build Coastguard Worker
161*4bdc9457SAndroid Build Coastguard Worker struct gemm_parameters {
162*4bdc9457SAndroid Build Coastguard Worker struct gemm_fused_ukernels minmax;
163*4bdc9457SAndroid Build Coastguard Worker struct gemm_fused_ukernels relu;
164*4bdc9457SAndroid Build Coastguard Worker struct gemm_fused_ukernels linear;
165*4bdc9457SAndroid Build Coastguard Worker #if XNN_PLATFORM_JIT
166*4bdc9457SAndroid Build Coastguard Worker struct gemm_codegens generator;
167*4bdc9457SAndroid Build Coastguard Worker #endif // XNN_PLATFORM_JIT
168*4bdc9457SAndroid Build Coastguard Worker union {
169*4bdc9457SAndroid Build Coastguard Worker xnn_init_qc8_conv_minmax_params_fn qc8;
170*4bdc9457SAndroid Build Coastguard Worker xnn_init_qs8_conv_minmax_params_fn qs8;
171*4bdc9457SAndroid Build Coastguard Worker xnn_init_qu8_conv_minmax_params_fn qu8;
172*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_minmax_params_fn f16;
173*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_minmax_params_fn f32;
174*4bdc9457SAndroid Build Coastguard Worker } init;
175*4bdc9457SAndroid Build Coastguard Worker uint8_t mr;
176*4bdc9457SAndroid Build Coastguard Worker uint8_t nr;
177*4bdc9457SAndroid Build Coastguard Worker uint8_t log2_kr;
178*4bdc9457SAndroid Build Coastguard Worker uint8_t log2_sr;
179*4bdc9457SAndroid Build Coastguard Worker };
180*4bdc9457SAndroid Build Coastguard Worker
181*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters {
182*4bdc9457SAndroid Build Coastguard Worker xnn_vunary_ukernel_function ukernel;
183*4bdc9457SAndroid Build Coastguard Worker union {
184*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_f32_cvt_params_fn f16_f32_cvt;
185*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_abs_params_fn f16_abs;
186*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_elu_params_fn f16_elu;
187*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_hswish_params_fn f16_hswish;
188*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_lrelu_params_fn f16_lrelu;
189*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_neg_params_fn f16_neg;
190*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_minmax_params_fn f16_minmax;
191*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_sigmoid_params_fn f16_sigmoid;
192*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_sqrt_params_fn f16_sqrt;
193*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_abs_params_fn f32_abs;
194*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_default_params_fn f32_default;
195*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_elu_params_fn f32_elu;
196*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_f16_cvt_params_fn f32_f16_cvt;
197*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_hswish_params_fn f32_hswish;
198*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_lrelu_params_fn f32_lrelu;
199*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_minmax_params_fn f32_minmax;
200*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_neg_params_fn f32_neg;
201*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_qs8_cvt_params_fn f32_qs8_cvt;
202*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_qu8_cvt_params_fn f32_qu8_cvt;
203*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_rnd_params_fn f32_rnd;
204*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_sigmoid_params_fn f32_sigmoid;
205*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_sqrt_params_fn f32_sqrt;
206*4bdc9457SAndroid Build Coastguard Worker xnn_init_qs8_cvt_params_fn qs8_cvt;
207*4bdc9457SAndroid Build Coastguard Worker xnn_init_qs8_f32_cvt_params_fn qs8_f32_cvt;
208*4bdc9457SAndroid Build Coastguard Worker xnn_init_qs8_lrelu_params_fn qs8_lrelu;
209*4bdc9457SAndroid Build Coastguard Worker xnn_init_qu8_cvt_params_fn qu8_cvt;
210*4bdc9457SAndroid Build Coastguard Worker xnn_init_qu8_f32_cvt_params_fn qu8_f32_cvt;
211*4bdc9457SAndroid Build Coastguard Worker xnn_init_qu8_lrelu_params_fn qu8_lrelu;
212*4bdc9457SAndroid Build Coastguard Worker xnn_init_s8_minmax_params_fn s8_minmax;
213*4bdc9457SAndroid Build Coastguard Worker xnn_init_u8_minmax_params_fn u8_minmax;
214*4bdc9457SAndroid Build Coastguard Worker } init;
215*4bdc9457SAndroid Build Coastguard Worker // Number of elements in a tile.
216*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, micro-kernel must process a multiple of this number of elements in each call.
217*4bdc9457SAndroid Build Coastguard Worker uint8_t element_tile;
218*4bdc9457SAndroid Build Coastguard Worker };
219*4bdc9457SAndroid Build Coastguard Worker
220*4bdc9457SAndroid Build Coastguard Worker struct vbinary_fused_ukernels {
221*4bdc9457SAndroid Build Coastguard Worker xnn_vbinary_ukernel_function op_ukernel;
222*4bdc9457SAndroid Build Coastguard Worker xnn_vbinary_ukernel_function opc_ukernel;
223*4bdc9457SAndroid Build Coastguard Worker xnn_vbinary_ukernel_function ropc_ukernel;
224*4bdc9457SAndroid Build Coastguard Worker };
225*4bdc9457SAndroid Build Coastguard Worker
226*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters {
227*4bdc9457SAndroid Build Coastguard Worker struct vbinary_fused_ukernels minmax;
228*4bdc9457SAndroid Build Coastguard Worker struct vbinary_fused_ukernels linear;
229*4bdc9457SAndroid Build Coastguard Worker union {
230*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_minmax_params_fn f16_minmax;
231*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_default_params_fn f32_default;
232*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_minmax_params_fn f32_minmax;
233*4bdc9457SAndroid Build Coastguard Worker xnn_init_qs8_add_minmax_params_fn qs8_add;
234*4bdc9457SAndroid Build Coastguard Worker xnn_init_qs8_mul_minmax_params_fn qs8_mul;
235*4bdc9457SAndroid Build Coastguard Worker xnn_init_qu8_add_minmax_params_fn qu8_add;
236*4bdc9457SAndroid Build Coastguard Worker xnn_init_qu8_mul_minmax_params_fn qu8_mul;
237*4bdc9457SAndroid Build Coastguard Worker } init;
238*4bdc9457SAndroid Build Coastguard Worker // Number of elements in a tile.
239*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, micro-kernel must process a multiple of this number of elements in each call.
240*4bdc9457SAndroid Build Coastguard Worker uint8_t element_tile;
241*4bdc9457SAndroid Build Coastguard Worker };
242*4bdc9457SAndroid Build Coastguard Worker
243*4bdc9457SAndroid Build Coastguard Worker struct spmm_parameters {
244*4bdc9457SAndroid Build Coastguard Worker xnn_spmm_ukernel_function ukernel;
245*4bdc9457SAndroid Build Coastguard Worker // Number of M-dimension elements in a tile.
246*4bdc9457SAndroid Build Coastguard Worker // Corresponds to a block of pixels in 1x1 Convolution and a block of batch size in Fully Connected operator.
247*4bdc9457SAndroid Build Coastguard Worker uint8_t mr;
248*4bdc9457SAndroid Build Coastguard Worker // Number of N-dimension elements in a tile.
249*4bdc9457SAndroid Build Coastguard Worker // Corresponds to a block of output channels/features in 1x1 Convolution and Fully Connected operator.
250*4bdc9457SAndroid Build Coastguard Worker uint8_t nr;
251*4bdc9457SAndroid Build Coastguard Worker };
252*4bdc9457SAndroid Build Coastguard Worker
253*4bdc9457SAndroid Build Coastguard Worker struct conv_hwc2chw_parameters {
254*4bdc9457SAndroid Build Coastguard Worker xnn_conv_hwc2chw_ukernel_function ukernel_with_symm_padding;
255*4bdc9457SAndroid Build Coastguard Worker // Number of output channels in a tile.
256*4bdc9457SAndroid Build Coastguard Worker // This parameter must be passed as is to weight packing function.
257*4bdc9457SAndroid Build Coastguard Worker uint8_t output_channel_tile;
258*4bdc9457SAndroid Build Coastguard Worker // Number of output height pixels in a tile.
259*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, micro-kernel must produce a multiple of this number of rows in each call.
260*4bdc9457SAndroid Build Coastguard Worker uint8_t output_height_tile;
261*4bdc9457SAndroid Build Coastguard Worker // Number of output width pixels in a tile.
262*4bdc9457SAndroid Build Coastguard Worker uint8_t output_width_tile;
263*4bdc9457SAndroid Build Coastguard Worker };
264*4bdc9457SAndroid Build Coastguard Worker
265*4bdc9457SAndroid Build Coastguard Worker struct dwconv2d_chw_parameters {
266*4bdc9457SAndroid Build Coastguard Worker xnn_dwconv2d_chw_ukernel_function ukernel;
267*4bdc9457SAndroid Build Coastguard Worker // Number of output width pixels in a tile.
268*4bdc9457SAndroid Build Coastguard Worker uint8_t output_width_tile;
269*4bdc9457SAndroid Build Coastguard Worker // Number of output height pixels in a tile.
270*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, micro-kernel must produce a multiple of this number of rows in each call.
271*4bdc9457SAndroid Build Coastguard Worker uint8_t output_height_tile;
272*4bdc9457SAndroid Build Coastguard Worker };
273*4bdc9457SAndroid Build Coastguard Worker
274*4bdc9457SAndroid Build Coastguard Worker struct gavgpool_cw_parameters {
275*4bdc9457SAndroid Build Coastguard Worker xnn_gavgpool_cw_ukernel_function ukernel;
276*4bdc9457SAndroid Build Coastguard Worker // Number of channels in a tile.
277*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, micro-kernel must process a multiple of this number of channels in each call.
278*4bdc9457SAndroid Build Coastguard Worker uint8_t channel_tile;
279*4bdc9457SAndroid Build Coastguard Worker };
280*4bdc9457SAndroid Build Coastguard Worker
281*4bdc9457SAndroid Build Coastguard Worker union dwconv_fused_ukernels {
282*4bdc9457SAndroid Build Coastguard Worker xnn_dwconv_unipass_ukernel_function unipass;
283*4bdc9457SAndroid Build Coastguard Worker xnn_dwconv_multipass_ukernel_function multipass;
284*4bdc9457SAndroid Build Coastguard Worker };
285*4bdc9457SAndroid Build Coastguard Worker
286*4bdc9457SAndroid Build Coastguard Worker struct dwconv_parameters {
287*4bdc9457SAndroid Build Coastguard Worker union dwconv_fused_ukernels minmax;
288*4bdc9457SAndroid Build Coastguard Worker union dwconv_fused_ukernels linear;
289*4bdc9457SAndroid Build Coastguard Worker union {
290*4bdc9457SAndroid Build Coastguard Worker xnn_init_qc8_conv_minmax_params_fn qc8;
291*4bdc9457SAndroid Build Coastguard Worker xnn_init_qs8_conv_minmax_params_fn qs8;
292*4bdc9457SAndroid Build Coastguard Worker xnn_init_qu8_conv_minmax_params_fn qu8;
293*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_minmax_params_fn f16;
294*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_minmax_params_fn f32;
295*4bdc9457SAndroid Build Coastguard Worker } init;
296*4bdc9457SAndroid Build Coastguard Worker uint8_t channel_tile;
297*4bdc9457SAndroid Build Coastguard Worker uint8_t primary_tile;
298*4bdc9457SAndroid Build Coastguard Worker uint8_t incremental_tile;
299*4bdc9457SAndroid Build Coastguard Worker };
300*4bdc9457SAndroid Build Coastguard Worker
301*4bdc9457SAndroid Build Coastguard Worker struct gavgpool_parameters {
302*4bdc9457SAndroid Build Coastguard Worker xnn_gavgpool_unipass_ukernel_function unipass;
303*4bdc9457SAndroid Build Coastguard Worker xnn_gavgpool_multipass_ukernel_function multipass;
304*4bdc9457SAndroid Build Coastguard Worker union {
305*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_scaleminmax_params_fn f16;
306*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_scaleminmax_params_fn f32;
307*4bdc9457SAndroid Build Coastguard Worker xnn_init_qs8_avgpool_minmax_params_fn qs8;
308*4bdc9457SAndroid Build Coastguard Worker xnn_init_qu8_avgpool_minmax_params_fn qu8;
309*4bdc9457SAndroid Build Coastguard Worker } init;
310*4bdc9457SAndroid Build Coastguard Worker union {
311*4bdc9457SAndroid Build Coastguard Worker xnn_update_f16_scaleminmax_params_fn f16;
312*4bdc9457SAndroid Build Coastguard Worker xnn_update_f32_scaleminmax_params_fn f32;
313*4bdc9457SAndroid Build Coastguard Worker xnn_update_qs8_avgpool_minmax_params_fn qs8;
314*4bdc9457SAndroid Build Coastguard Worker xnn_update_qu8_avgpool_minmax_params_fn qu8;
315*4bdc9457SAndroid Build Coastguard Worker } update;
316*4bdc9457SAndroid Build Coastguard Worker // Number of rows in a tile.
317*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, micro-kernel must produce a multiple of this number of rows in each call.
318*4bdc9457SAndroid Build Coastguard Worker uint16_t row_tile;
319*4bdc9457SAndroid Build Coastguard Worker // Number of channels in a tile.
320*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, micro-kernel must process a multiple of this number of channels in each call.
321*4bdc9457SAndroid Build Coastguard Worker uint16_t channel_tile;
322*4bdc9457SAndroid Build Coastguard Worker };
323*4bdc9457SAndroid Build Coastguard Worker
324*4bdc9457SAndroid Build Coastguard Worker struct avgpool_parameters {
325*4bdc9457SAndroid Build Coastguard Worker xnn_avgpool_unipass_ukernel_function unipass;
326*4bdc9457SAndroid Build Coastguard Worker xnn_avgpool_multipass_ukernel_function multipass;
327*4bdc9457SAndroid Build Coastguard Worker union {
328*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_scaleminmax_params_fn f16;
329*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_scaleminmax_params_fn f32;
330*4bdc9457SAndroid Build Coastguard Worker xnn_init_qu8_avgpool_minmax_params_fn qu8;
331*4bdc9457SAndroid Build Coastguard Worker } init;
332*4bdc9457SAndroid Build Coastguard Worker // Number of rows in a primary tile.
333*4bdc9457SAndroid Build Coastguard Worker // Unipass micro-kernel must be called with this number of rows, or fewer.
334*4bdc9457SAndroid Build Coastguard Worker // Multipass micro-kernel must be called with more than this number of rows.
335*4bdc9457SAndroid Build Coastguard Worker uint8_t primary_tile;
336*4bdc9457SAndroid Build Coastguard Worker // Number of rows in an incremental tile.
337*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, multipass micro-kernel must process the number of rows in the primary tile plus a multiple
338*4bdc9457SAndroid Build Coastguard Worker // of this number of rows in each call. This number has no meaning for the unipass micro-kernel.
339*4bdc9457SAndroid Build Coastguard Worker uint8_t incremental_tile;
340*4bdc9457SAndroid Build Coastguard Worker // Number of channels in a tile.
341*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, micro-kernel must process a multiple of this number of channels in each call.
342*4bdc9457SAndroid Build Coastguard Worker uint16_t channel_tile;
343*4bdc9457SAndroid Build Coastguard Worker };
344*4bdc9457SAndroid Build Coastguard Worker
345*4bdc9457SAndroid Build Coastguard Worker struct pavgpool_parameters {
346*4bdc9457SAndroid Build Coastguard Worker xnn_pavgpool_unipass_ukernel_function unipass;
347*4bdc9457SAndroid Build Coastguard Worker xnn_pavgpool_multipass_ukernel_function multipass;
348*4bdc9457SAndroid Build Coastguard Worker union {
349*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_minmax_params_fn f16;
350*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_minmax_params_fn f32;
351*4bdc9457SAndroid Build Coastguard Worker } init;
352*4bdc9457SAndroid Build Coastguard Worker // Number of rows in a primary tile.
353*4bdc9457SAndroid Build Coastguard Worker // Unipass micro-kernel must be called with this number of rows, or fewer.
354*4bdc9457SAndroid Build Coastguard Worker // Multipass micro-kernel must be called with more than this number of rows.
355*4bdc9457SAndroid Build Coastguard Worker uint8_t primary_tile;
356*4bdc9457SAndroid Build Coastguard Worker // Number of rows in an incremental tile.
357*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, multipass micro-kernel must process the number of rows in the primary tile plus a multiple
358*4bdc9457SAndroid Build Coastguard Worker // of this number of rows in each call. This number has no meaning for the unipass micro-kernel.
359*4bdc9457SAndroid Build Coastguard Worker uint8_t incremental_tile;
360*4bdc9457SAndroid Build Coastguard Worker // Number of channels in a tile.
361*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, micro-kernel must process a multiple of this number of channels in each call.
362*4bdc9457SAndroid Build Coastguard Worker uint16_t channel_tile;
363*4bdc9457SAndroid Build Coastguard Worker };
364*4bdc9457SAndroid Build Coastguard Worker
365*4bdc9457SAndroid Build Coastguard Worker struct argmaxpool_parameters {
366*4bdc9457SAndroid Build Coastguard Worker union {
367*4bdc9457SAndroid Build Coastguard Worker xnn_argmaxpool_unipass_ukernel_function up;
368*4bdc9457SAndroid Build Coastguard Worker xnn_argmaxpool_multipass_ukernel_function mp;
369*4bdc9457SAndroid Build Coastguard Worker };
370*4bdc9457SAndroid Build Coastguard Worker uint8_t mr;
371*4bdc9457SAndroid Build Coastguard Worker uint8_t qr;
372*4bdc9457SAndroid Build Coastguard Worker };
373*4bdc9457SAndroid Build Coastguard Worker
374*4bdc9457SAndroid Build Coastguard Worker struct maxpool_parameters {
375*4bdc9457SAndroid Build Coastguard Worker xnn_maxpool_ukernel_function ukernel;
376*4bdc9457SAndroid Build Coastguard Worker union {
377*4bdc9457SAndroid Build Coastguard Worker xnn_init_s8_minmax_params_fn s8;
378*4bdc9457SAndroid Build Coastguard Worker xnn_init_u8_minmax_params_fn u8;
379*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_minmax_params_fn f32;
380*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_minmax_params_fn f16;
381*4bdc9457SAndroid Build Coastguard Worker } init;
382*4bdc9457SAndroid Build Coastguard Worker uint8_t mr;
383*4bdc9457SAndroid Build Coastguard Worker uint8_t qr;
384*4bdc9457SAndroid Build Coastguard Worker };
385*4bdc9457SAndroid Build Coastguard Worker
386*4bdc9457SAndroid Build Coastguard Worker struct ibilinear_parameters {
387*4bdc9457SAndroid Build Coastguard Worker xnn_ibilinear_ukernel_function ukernel;
388*4bdc9457SAndroid Build Coastguard Worker // Number of output pixels in a tile.
389*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, micro-kernel must produce a multiple of this number of pixels in each call.
390*4bdc9457SAndroid Build Coastguard Worker uint8_t pixel_tile;
391*4bdc9457SAndroid Build Coastguard Worker // Number of channels in a tile.
392*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, micro-kernel must process a multiple of this number of channels in each call.
393*4bdc9457SAndroid Build Coastguard Worker uint8_t channel_tile;
394*4bdc9457SAndroid Build Coastguard Worker };
395*4bdc9457SAndroid Build Coastguard Worker
396*4bdc9457SAndroid Build Coastguard Worker struct ibilinear_chw_parameters {
397*4bdc9457SAndroid Build Coastguard Worker xnn_ibilinear_chw_ukernel_function ukernel;
398*4bdc9457SAndroid Build Coastguard Worker // Number of output pixels in a tile.
399*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, micro-kernel must produce a multiple of this number of pixels in each call.
400*4bdc9457SAndroid Build Coastguard Worker uint8_t pixel_tile;
401*4bdc9457SAndroid Build Coastguard Worker // Number of channels in a tile.
402*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, micro-kernel must process a multiple of this number of channels in each call.
403*4bdc9457SAndroid Build Coastguard Worker uint8_t channel_tile;
404*4bdc9457SAndroid Build Coastguard Worker };
405*4bdc9457SAndroid Build Coastguard Worker
406*4bdc9457SAndroid Build Coastguard Worker struct zip_parameters {
407*4bdc9457SAndroid Build Coastguard Worker xnn_zipc_ukernel_function x2;
408*4bdc9457SAndroid Build Coastguard Worker xnn_zipc_ukernel_function x3;
409*4bdc9457SAndroid Build Coastguard Worker xnn_zipc_ukernel_function x4;
410*4bdc9457SAndroid Build Coastguard Worker xnn_zipv_ukernel_function xm;
411*4bdc9457SAndroid Build Coastguard Worker };
412*4bdc9457SAndroid Build Coastguard Worker
413*4bdc9457SAndroid Build Coastguard Worker struct prelu_parameters {
414*4bdc9457SAndroid Build Coastguard Worker xnn_prelu_ukernel_function ukernel;
415*4bdc9457SAndroid Build Coastguard Worker uint16_t row_tile;
416*4bdc9457SAndroid Build Coastguard Worker uint16_t channel_tile;
417*4bdc9457SAndroid Build Coastguard Worker };
418*4bdc9457SAndroid Build Coastguard Worker
419*4bdc9457SAndroid Build Coastguard Worker struct raddstoreexpminusmax_parameters {
420*4bdc9457SAndroid Build Coastguard Worker xnn_raddstoreexpminusmax_ukernel_function ukernel;
421*4bdc9457SAndroid Build Coastguard Worker union {
422*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_expminus_params_fn f16;
423*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_expminus_params_fn f32;
424*4bdc9457SAndroid Build Coastguard Worker } init;
425*4bdc9457SAndroid Build Coastguard Worker // Number of elements in a tile.
426*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, micro-kernel must process a multiple of this number of elements in each call.
427*4bdc9457SAndroid Build Coastguard Worker uint8_t element_tile;
428*4bdc9457SAndroid Build Coastguard Worker };
429*4bdc9457SAndroid Build Coastguard Worker
430*4bdc9457SAndroid Build Coastguard Worker struct fill_parameters {
431*4bdc9457SAndroid Build Coastguard Worker xnn_fill_ukernel_function ukernel;
432*4bdc9457SAndroid Build Coastguard Worker // Number of rows of inputs processed in one tile.
433*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, micro-kernel must produce a multiple of this number of rows in each call.
434*4bdc9457SAndroid Build Coastguard Worker uint8_t row_tile;
435*4bdc9457SAndroid Build Coastguard Worker };
436*4bdc9457SAndroid Build Coastguard Worker
437*4bdc9457SAndroid Build Coastguard Worker struct pad_parameters {
438*4bdc9457SAndroid Build Coastguard Worker xnn_pad_ukernel_function ukernel;
439*4bdc9457SAndroid Build Coastguard Worker // Number of rows of inputs processed in one tile.
440*4bdc9457SAndroid Build Coastguard Worker // For best efficiency, micro-kernel must produce a multiple of this number of rows in each call.
441*4bdc9457SAndroid Build Coastguard Worker uint8_t row_tile;
442*4bdc9457SAndroid Build Coastguard Worker };
443*4bdc9457SAndroid Build Coastguard Worker
444*4bdc9457SAndroid Build Coastguard Worker struct vmulcaddc_parameters {
445*4bdc9457SAndroid Build Coastguard Worker xnn_vmulcaddc_ukernel_function ukernel;
446*4bdc9457SAndroid Build Coastguard Worker union {
447*4bdc9457SAndroid Build Coastguard Worker xnn_init_f16_minmax_params_fn f16;
448*4bdc9457SAndroid Build Coastguard Worker xnn_init_f32_minmax_params_fn f32;
449*4bdc9457SAndroid Build Coastguard Worker } init;
450*4bdc9457SAndroid Build Coastguard Worker uint8_t channel_tile;
451*4bdc9457SAndroid Build Coastguard Worker uint8_t row_tile;
452*4bdc9457SAndroid Build Coastguard Worker };
453*4bdc9457SAndroid Build Coastguard Worker
454*4bdc9457SAndroid Build Coastguard Worker #define XNN_MAX_QC8_DWCONV_UKERNELS 3
455*4bdc9457SAndroid Build Coastguard Worker #define XNN_MAX_QS8_DWCONV_UKERNELS 2
456*4bdc9457SAndroid Build Coastguard Worker #define XNN_MAX_QU8_DWCONV_UKERNELS 2
457*4bdc9457SAndroid Build Coastguard Worker #define XNN_MAX_F16_DWCONV_UKERNELS 4
458*4bdc9457SAndroid Build Coastguard Worker #define XNN_MAX_F32_DWCONV_UKERNELS 4
459*4bdc9457SAndroid Build Coastguard Worker #define XNN_MAX_F32_ARGMAXPOOL_UKERNELS 3
460*4bdc9457SAndroid Build Coastguard Worker
461*4bdc9457SAndroid Build Coastguard Worker // Indicates that XNNPACK as a whole has initialized.
462*4bdc9457SAndroid Build Coastguard Worker // This does not guarantee that any particular microkernels are available.
463*4bdc9457SAndroid Build Coastguard Worker #define XNN_INIT_FLAG_XNNPACK 0x00000001
464*4bdc9457SAndroid Build Coastguard Worker // Indicates that F32 XNNPACK microkernels are available for use.
465*4bdc9457SAndroid Build Coastguard Worker #define XNN_INIT_FLAG_F32 0x00000002
466*4bdc9457SAndroid Build Coastguard Worker // Indicates that X32 XNNPACK microkernels are available for use.
467*4bdc9457SAndroid Build Coastguard Worker #define XNN_INIT_FLAG_X32 0x00000004
468*4bdc9457SAndroid Build Coastguard Worker // Indicates that F16 XNNPACK microkernels are available for use.
469*4bdc9457SAndroid Build Coastguard Worker #define XNN_INIT_FLAG_F16 0x00000008
470*4bdc9457SAndroid Build Coastguard Worker // Indicates that F16 XNNPACK microkernels are natively supported by the hardware.
471*4bdc9457SAndroid Build Coastguard Worker #define XNN_INIT_FLAG_F16_NATIVE 0x00000010
472*4bdc9457SAndroid Build Coastguard Worker // Indicates that X16 XNNPACK microkernels are available for use.
473*4bdc9457SAndroid Build Coastguard Worker #define XNN_INIT_FLAG_X16 0x00000020
474*4bdc9457SAndroid Build Coastguard Worker // Indicates that QC8 XNNPACK microkernels are available for use.
475*4bdc9457SAndroid Build Coastguard Worker #define XNN_INIT_FLAG_QC8 0x00000040
476*4bdc9457SAndroid Build Coastguard Worker // Indicates that QS8 XNNPACK microkernels are available for use.
477*4bdc9457SAndroid Build Coastguard Worker #define XNN_INIT_FLAG_QS8 0x00000080
478*4bdc9457SAndroid Build Coastguard Worker // Indicates that QU8 XNNPACK microkernels are available for use.
479*4bdc9457SAndroid Build Coastguard Worker #define XNN_INIT_FLAG_QU8 0x00000100
480*4bdc9457SAndroid Build Coastguard Worker // Indicates that S8 XNNPACK microkernels are available for use.
481*4bdc9457SAndroid Build Coastguard Worker #define XNN_INIT_FLAG_S8 0x00000200
482*4bdc9457SAndroid Build Coastguard Worker // Indicates that U8 XNNPACK microkernels are available for use.
483*4bdc9457SAndroid Build Coastguard Worker #define XNN_INIT_FLAG_U8 0x00000400
484*4bdc9457SAndroid Build Coastguard Worker // Indicates that X8 XNNPACK microkernels are available for use.
485*4bdc9457SAndroid Build Coastguard Worker #define XNN_INIT_FLAG_X8 0x00000800
486*4bdc9457SAndroid Build Coastguard Worker // Indicates that XX XNNPACK microkernels are available for use.
487*4bdc9457SAndroid Build Coastguard Worker #define XNN_INIT_FLAG_XX 0x00001000
488*4bdc9457SAndroid Build Coastguard Worker // Indicates that VCVT XNNPACK microkernels are available for use.
489*4bdc9457SAndroid Build Coastguard Worker #define XNN_INIT_FLAG_VCVT 0x00002000
490*4bdc9457SAndroid Build Coastguard Worker // Indicates that CHW XNNPACK microkernels are optimized for the host platform.
491*4bdc9457SAndroid Build Coastguard Worker #define XNN_INIT_FLAG_CHW_OPT 0x00004000
492*4bdc9457SAndroid Build Coastguard Worker
493*4bdc9457SAndroid Build Coastguard Worker struct xnn_parameters {
494*4bdc9457SAndroid Build Coastguard Worker // Bitwise combination of XNN_INIT_FLAG_* flags
495*4bdc9457SAndroid Build Coastguard Worker uint32_t init_flags;
496*4bdc9457SAndroid Build Coastguard Worker struct xnn_allocator allocator;
497*4bdc9457SAndroid Build Coastguard Worker size_t page_size;
498*4bdc9457SAndroid Build Coastguard Worker struct {
499*4bdc9457SAndroid Build Coastguard Worker struct gemm_parameters gemm;
500*4bdc9457SAndroid Build Coastguard Worker struct dwconv_parameters dwconv[XNN_MAX_QC8_DWCONV_UKERNELS];
501*4bdc9457SAndroid Build Coastguard Worker } qc8;
502*4bdc9457SAndroid Build Coastguard Worker struct {
503*4bdc9457SAndroid Build Coastguard Worker struct gemm_parameters gemm;
504*4bdc9457SAndroid Build Coastguard Worker struct dwconv_parameters dwconv[XNN_MAX_QS8_DWCONV_UKERNELS];
505*4bdc9457SAndroid Build Coastguard Worker struct gavgpool_parameters gavgpool;
506*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vadd;
507*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vmul;
508*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters lrelu;
509*4bdc9457SAndroid Build Coastguard Worker } qs8;
510*4bdc9457SAndroid Build Coastguard Worker struct {
511*4bdc9457SAndroid Build Coastguard Worker struct gemm_parameters gemm;
512*4bdc9457SAndroid Build Coastguard Worker struct dwconv_parameters dwconv[XNN_MAX_QU8_DWCONV_UKERNELS];
513*4bdc9457SAndroid Build Coastguard Worker struct avgpool_parameters avgpool;
514*4bdc9457SAndroid Build Coastguard Worker struct gavgpool_parameters gavgpool;
515*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vadd;
516*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vmul;
517*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters lrelu;
518*4bdc9457SAndroid Build Coastguard Worker } qu8;
519*4bdc9457SAndroid Build Coastguard Worker struct {
520*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters clamp;
521*4bdc9457SAndroid Build Coastguard Worker // Bilinear interpolation (2D).
522*4bdc9457SAndroid Build Coastguard Worker struct ibilinear_parameters ibilinear;
523*4bdc9457SAndroid Build Coastguard Worker struct maxpool_parameters maxpool;
524*4bdc9457SAndroid Build Coastguard Worker } s8;
525*4bdc9457SAndroid Build Coastguard Worker struct {
526*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters clamp;
527*4bdc9457SAndroid Build Coastguard Worker // Bilinear interpolation (2D).
528*4bdc9457SAndroid Build Coastguard Worker struct ibilinear_parameters ibilinear;
529*4bdc9457SAndroid Build Coastguard Worker struct maxpool_parameters maxpool;
530*4bdc9457SAndroid Build Coastguard Worker xnn_u8_lut32norm_ukernel_function lut32norm;
531*4bdc9457SAndroid Build Coastguard Worker xnn_u8_rmax_ukernel_function rmax;
532*4bdc9457SAndroid Build Coastguard Worker } u8;
533*4bdc9457SAndroid Build Coastguard Worker struct {
534*4bdc9457SAndroid Build Coastguard Worker xnn_x8_lut_ukernel_function lut;
535*4bdc9457SAndroid Build Coastguard Worker struct zip_parameters zip;
536*4bdc9457SAndroid Build Coastguard Worker struct transpose_parameters transpose;
537*4bdc9457SAndroid Build Coastguard Worker } x8;
538*4bdc9457SAndroid Build Coastguard Worker struct {
539*4bdc9457SAndroid Build Coastguard Worker struct transpose_parameters transpose;
540*4bdc9457SAndroid Build Coastguard Worker } x16;
541*4bdc9457SAndroid Build Coastguard Worker struct {
542*4bdc9457SAndroid Build Coastguard Worker struct gemm_parameters gemm;
543*4bdc9457SAndroid Build Coastguard Worker struct gemm_parameters gemm2;
544*4bdc9457SAndroid Build Coastguard Worker struct dwconv_parameters dwconv[XNN_MAX_F16_DWCONV_UKERNELS];
545*4bdc9457SAndroid Build Coastguard Worker struct avgpool_parameters avgpool;
546*4bdc9457SAndroid Build Coastguard Worker struct pavgpool_parameters pavgpool;
547*4bdc9457SAndroid Build Coastguard Worker struct gavgpool_parameters gavgpool;
548*4bdc9457SAndroid Build Coastguard Worker struct maxpool_parameters maxpool;
549*4bdc9457SAndroid Build Coastguard Worker // Bilinear interpolation (2D).
550*4bdc9457SAndroid Build Coastguard Worker struct ibilinear_parameters ibilinear;
551*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters abs;
552*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters clamp;
553*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters elu;
554*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters hswish;
555*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters lrelu;
556*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters neg;
557*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters rndne;
558*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters rndz;
559*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters rndu;
560*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters rndd;
561*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters sigmoid;
562*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters sqr;
563*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters sqrt;
564*4bdc9457SAndroid Build Coastguard Worker struct prelu_parameters prelu;
565*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vadd;
566*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vdiv;
567*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vmax;
568*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vmin;
569*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vmul;
570*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vsub;
571*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vsqrdiff;
572*4bdc9457SAndroid Build Coastguard Worker struct vmulcaddc_parameters vmulcaddc;
573*4bdc9457SAndroid Build Coastguard Worker struct raddstoreexpminusmax_parameters raddstoreexpminusmax;
574*4bdc9457SAndroid Build Coastguard Worker xnn_rmax_ukernel_function rmax;
575*4bdc9457SAndroid Build Coastguard Worker // Sparse Matrix-Dense Matrix Multiplication (NR=1 block).
576*4bdc9457SAndroid Build Coastguard Worker struct spmm_parameters spmm;
577*4bdc9457SAndroid Build Coastguard Worker // Direct 3x3 stride-2 Convolution with 3 input channels and HWC->CHW layout conversion.
578*4bdc9457SAndroid Build Coastguard Worker struct conv_hwc2chw_parameters conv_hwc2chw_3x3c3s2;
579*4bdc9457SAndroid Build Coastguard Worker // Direct 3x3 stride-1 Convolution with padding 1 on left and right in CHW layout.
580*4bdc9457SAndroid Build Coastguard Worker struct dwconv2d_chw_parameters dwconv2d_chw_3x3;
581*4bdc9457SAndroid Build Coastguard Worker // Direct 3x3 stride-2 Convolution with padding 1 on left and right in CHW layout.
582*4bdc9457SAndroid Build Coastguard Worker struct dwconv2d_chw_parameters dwconv2d_chw_3x3s2;
583*4bdc9457SAndroid Build Coastguard Worker // Direct 5x5 stride-1 Convolution with padding 2 on left and right in CHW layout.
584*4bdc9457SAndroid Build Coastguard Worker struct dwconv2d_chw_parameters dwconv2d_chw_5x5;
585*4bdc9457SAndroid Build Coastguard Worker // Direct 5x5 stride-2 Convolution with padding 2 on left and right in CHW layout.
586*4bdc9457SAndroid Build Coastguard Worker struct dwconv2d_chw_parameters dwconv2d_chw_5x5s2;
587*4bdc9457SAndroid Build Coastguard Worker // Global Average Pooling in CW layout.
588*4bdc9457SAndroid Build Coastguard Worker struct gavgpool_cw_parameters gavgpool_cw;
589*4bdc9457SAndroid Build Coastguard Worker // Bilinear interpolation (2D) in CHW layout.
590*4bdc9457SAndroid Build Coastguard Worker struct ibilinear_chw_parameters ibilinear_chw;
591*4bdc9457SAndroid Build Coastguard Worker } f16;
592*4bdc9457SAndroid Build Coastguard Worker struct {
593*4bdc9457SAndroid Build Coastguard Worker struct gemm_parameters gemm;
594*4bdc9457SAndroid Build Coastguard Worker struct gemm_parameters gemm2;
595*4bdc9457SAndroid Build Coastguard Worker struct dwconv_parameters dwconv[XNN_MAX_F32_DWCONV_UKERNELS];
596*4bdc9457SAndroid Build Coastguard Worker struct avgpool_parameters avgpool;
597*4bdc9457SAndroid Build Coastguard Worker struct pavgpool_parameters pavgpool;
598*4bdc9457SAndroid Build Coastguard Worker struct gavgpool_parameters gavgpool;
599*4bdc9457SAndroid Build Coastguard Worker struct maxpool_parameters maxpool;
600*4bdc9457SAndroid Build Coastguard Worker struct argmaxpool_parameters argmaxpool[XNN_MAX_F32_ARGMAXPOOL_UKERNELS];
601*4bdc9457SAndroid Build Coastguard Worker // Bilinear interpolation (2D).
602*4bdc9457SAndroid Build Coastguard Worker struct ibilinear_parameters ibilinear;
603*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters abs;
604*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters clamp;
605*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters elu;
606*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters hswish;
607*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters lrelu;
608*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters neg;
609*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters relu;
610*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters rndne;
611*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters rndz;
612*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters rndu;
613*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters rndd;
614*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters sigmoid;
615*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters sqr;
616*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters sqrt;
617*4bdc9457SAndroid Build Coastguard Worker struct prelu_parameters prelu;
618*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vadd;
619*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vdiv;
620*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vmax;
621*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vmin;
622*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vmul;
623*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vsub;
624*4bdc9457SAndroid Build Coastguard Worker struct vbinary_parameters vsqrdiff;
625*4bdc9457SAndroid Build Coastguard Worker struct vmulcaddc_parameters vmulcaddc;
626*4bdc9457SAndroid Build Coastguard Worker struct raddstoreexpminusmax_parameters raddstoreexpminusmax;
627*4bdc9457SAndroid Build Coastguard Worker xnn_rmax_ukernel_function rmax;
628*4bdc9457SAndroid Build Coastguard Worker // Sparse Matrix-Dense Matrix Multiplication (NR=1 block).
629*4bdc9457SAndroid Build Coastguard Worker struct spmm_parameters spmm;
630*4bdc9457SAndroid Build Coastguard Worker // Sparse Matrix-Dense Matrix Multiplication (NR=2 block).
631*4bdc9457SAndroid Build Coastguard Worker struct spmm_parameters spmm2;
632*4bdc9457SAndroid Build Coastguard Worker // Sparse Matrix-Dense Matrix Multiplication (NR=4 block).
633*4bdc9457SAndroid Build Coastguard Worker struct spmm_parameters spmm4;
634*4bdc9457SAndroid Build Coastguard Worker // Direct 3x3 stride-2 Convolution with 3 input channels and HWC->CHW layout conversion.
635*4bdc9457SAndroid Build Coastguard Worker struct conv_hwc2chw_parameters conv_hwc2chw_3x3c3s2;
636*4bdc9457SAndroid Build Coastguard Worker // Direct 3x3 stride-1 Convolution with padding 1 on left and right in CHW layout.
637*4bdc9457SAndroid Build Coastguard Worker struct dwconv2d_chw_parameters dwconv2d_chw_3x3;
638*4bdc9457SAndroid Build Coastguard Worker // Direct 3x3 stride-2 Convolution with padding 1 on left and right in CHW layout.
639*4bdc9457SAndroid Build Coastguard Worker struct dwconv2d_chw_parameters dwconv2d_chw_3x3s2;
640*4bdc9457SAndroid Build Coastguard Worker // Direct 5x5 stride-1 Convolution with padding 2 on left and right in CHW layout.
641*4bdc9457SAndroid Build Coastguard Worker struct dwconv2d_chw_parameters dwconv2d_chw_5x5;
642*4bdc9457SAndroid Build Coastguard Worker // Direct 5x5 stride-2 Convolution with padding 2 on left and right in CHW layout.
643*4bdc9457SAndroid Build Coastguard Worker struct dwconv2d_chw_parameters dwconv2d_chw_5x5s2;
644*4bdc9457SAndroid Build Coastguard Worker // Global Average Pooling in CW layout.
645*4bdc9457SAndroid Build Coastguard Worker struct gavgpool_cw_parameters gavgpool_cw;
646*4bdc9457SAndroid Build Coastguard Worker // Bilinear interpolation (2D) in CHW layout.
647*4bdc9457SAndroid Build Coastguard Worker struct ibilinear_chw_parameters ibilinear_chw;
648*4bdc9457SAndroid Build Coastguard Worker } f32;
649*4bdc9457SAndroid Build Coastguard Worker struct {
650*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters f16_to_f32;
651*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters f32_to_f16;
652*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters f32_to_qs8;
653*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters f32_to_qu8;
654*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters qs8;
655*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters qs8_to_f32;
656*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters qu8;
657*4bdc9457SAndroid Build Coastguard Worker struct vunary_parameters qu8_to_f32;
658*4bdc9457SAndroid Build Coastguard Worker } vcvt;
659*4bdc9457SAndroid Build Coastguard Worker struct {
660*4bdc9457SAndroid Build Coastguard Worker xnn_unpool_ukernel_function unpool;
661*4bdc9457SAndroid Build Coastguard Worker struct zip_parameters zip;
662*4bdc9457SAndroid Build Coastguard Worker struct transpose_parameters transpose;
663*4bdc9457SAndroid Build Coastguard Worker } x32;
664*4bdc9457SAndroid Build Coastguard Worker struct {
665*4bdc9457SAndroid Build Coastguard Worker xnn_vunary_ukernel_function copy;
666*4bdc9457SAndroid Build Coastguard Worker struct fill_parameters fill;
667*4bdc9457SAndroid Build Coastguard Worker struct pad_parameters pad;
668*4bdc9457SAndroid Build Coastguard Worker struct transpose_parameters transpose;
669*4bdc9457SAndroid Build Coastguard Worker } xx;
670*4bdc9457SAndroid Build Coastguard Worker };
671*4bdc9457SAndroid Build Coastguard Worker
672*4bdc9457SAndroid Build Coastguard Worker #ifdef __cplusplus
673*4bdc9457SAndroid Build Coastguard Worker extern "C" XNN_INTERNAL struct xnn_parameters xnn_params;
674*4bdc9457SAndroid Build Coastguard Worker #else
675*4bdc9457SAndroid Build Coastguard Worker extern XNN_INTERNAL struct xnn_parameters xnn_params;
676*4bdc9457SAndroid Build Coastguard Worker #endif
677