xref: /aosp_15_r20/external/XNNPACK/src/operators/global-average-pooling-nwc.c (revision 4bdc94577ba0e567308109d787f7fec7b531ce36)
1*4bdc9457SAndroid Build Coastguard Worker // Copyright (c) Facebook, Inc. and its affiliates.
2*4bdc9457SAndroid Build Coastguard Worker // All rights reserved.
3*4bdc9457SAndroid Build Coastguard Worker //
4*4bdc9457SAndroid Build Coastguard Worker // Copyright 2019 Google LLC
5*4bdc9457SAndroid Build Coastguard Worker //
6*4bdc9457SAndroid Build Coastguard Worker // This source code is licensed under the BSD-style license found in the
7*4bdc9457SAndroid Build Coastguard Worker // LICENSE file in the root directory of this source tree.
8*4bdc9457SAndroid Build Coastguard Worker 
9*4bdc9457SAndroid Build Coastguard Worker #include <assert.h>
10*4bdc9457SAndroid Build Coastguard Worker #include <math.h>
11*4bdc9457SAndroid Build Coastguard Worker #include <stddef.h>
12*4bdc9457SAndroid Build Coastguard Worker #include <stdint.h>
13*4bdc9457SAndroid Build Coastguard Worker #include <stdlib.h>
14*4bdc9457SAndroid Build Coastguard Worker 
15*4bdc9457SAndroid Build Coastguard Worker #include <fp16.h>
16*4bdc9457SAndroid Build Coastguard Worker 
17*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack.h>
18*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/allocator.h>
19*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/log.h>
20*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/operator.h>
21*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/microparams-init.h>
22*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/params.h>
23*4bdc9457SAndroid Build Coastguard Worker 
24*4bdc9457SAndroid Build Coastguard Worker 
// Common constructor used by the datatype-specific
// xnn_create_global_average_pooling_nwc_* functions in this file.
//
// Steps, in order:
//   1. fail with xnn_status_uninitialized unless XNN_INIT_FLAG_XNNPACK is set
//      in xnn_params.init_flags;
//   2. fail with xnn_status_unsupported_hardware unless at least one bit of
//      datatype_init_flags is set in xnn_params.init_flags;
//   3. fail with xnn_status_invalid_parameter when channels is zero or when
//      either stride is smaller than channels;
//   4. obtain the operator descriptor and a buffer of
//      (channels << log2_element_size) + XNN_EXTRA_BYTES bytes from
//      xnn_allocate_zero_simd_memory, failing with xnn_status_out_of_memory
//      when either call returns NULL;
//   5. copy params_size bytes from params to byte offset params_offset inside
//      the descriptor and record channels, strides, operator type and flags.
//
// On success the operator is stored in *global_average_pooling_op_out and
// xnn_status_success is returned. On any failure the (possibly NULL) operator
// is handed to xnn_delete_operator, *global_average_pooling_op_out is not
// written, and the status of the failed step is returned.
static enum xnn_status create_global_average_pooling_nwc(
    size_t channels,
    size_t input_stride,
    size_t output_stride,
    uint32_t flags,
    uint32_t log2_element_size,
    size_t params_offset,
    const void* params,
    size_t params_size,
    uint32_t datatype_init_flags,
    enum xnn_operator_type operator_type,
    xnn_operator_t* global_average_pooling_op_out)
{
  xnn_operator_t op = NULL;
  enum xnn_status status;

  // Library-state checks.
  if ((xnn_params.init_flags & XNN_INIT_FLAG_XNNPACK) == 0) {
    status = xnn_status_uninitialized;
    xnn_log_error("failed to create %s operator: XNNPACK is not initialized",
      xnn_operator_type_to_string(operator_type));
    goto error;
  }

  if ((xnn_params.init_flags & datatype_init_flags) == 0) {
    status = xnn_status_unsupported_hardware;
    xnn_log_error("failed to create %s operator: operations on data type are not supported",
      xnn_operator_type_to_string(operator_type));
    goto error;
  }

  // Argument checks.
  if (channels == 0) {
    status = xnn_status_invalid_parameter;
    xnn_log_error(
      "failed to create %s operator with %zu channels: number of channels must be non-zero",
      xnn_operator_type_to_string(operator_type), channels);
    goto error;
  }

  if (input_stride < channels) {
    status = xnn_status_invalid_parameter;
    xnn_log_error(
      "failed to create %s operator with input element stride of %zu: "
      "stride must be at least as large as the number of channels (%zu)",
      xnn_operator_type_to_string(operator_type), input_stride, channels);
    goto error;
  }

  if (output_stride < channels) {
    status = xnn_status_invalid_parameter;
    xnn_log_error(
      "failed to create %s operator with output element stride of %zu: "
      "stride must be at least as large as the number of channels (%zu)",
      xnn_operator_type_to_string(operator_type), output_stride, channels);
    goto error;
  }

  // Allocations.
  op = xnn_allocate_zero_simd_memory(sizeof(struct xnn_operator));
  if (op == NULL) {
    status = xnn_status_out_of_memory;
    xnn_log_error(
      "failed to allocate %zu bytes for %s operator descriptor",
      sizeof(struct xnn_operator), xnn_operator_type_to_string(operator_type));
    goto error;
  }

  const size_t zero_bytes = (channels << log2_element_size) + XNN_EXTRA_BYTES;
  op->zero_buffer = xnn_allocate_zero_simd_memory(zero_bytes);
  if (op->zero_buffer == NULL) {
    status = xnn_status_out_of_memory;
    xnn_log_error(
      "failed to allocate %zu bytes for %s operator zero padding",
      zero_bytes, xnn_operator_type_to_string(operator_type));
    goto error;
  }

  // Fill in the descriptor.
  op->type = operator_type;
  op->flags = flags;
  op->channels = channels;
  op->input_pixel_stride = input_stride;
  op->output_pixel_stride = output_stride;
  // The caller picks which params member of the descriptor receives the
  // pre-initialized microkernel parameters by passing its byte offset.
  memcpy((char*) op + params_offset, params, params_size);

  // The operator is not runnable until one of the setup functions succeeds.
  op->state = xnn_run_state_invalid;

  *global_average_pooling_op_out = op;
  return xnn_status_success;

error:
  xnn_delete_operator(op);
  return status;
}
117*4bdc9457SAndroid Build Coastguard Worker 
// Common setup routine for global average pooling operators in NWC layout.
//
// Checks that the operator has the expected type, that XNNPACK is initialized
// and that the data type is supported, then binds the input/output pointers
// and the batch/width dimensions to the operator and fills in its 1D
// parallelization descriptor (one task per batch element).
//
// gavgpool supplies row_tile and the unipass/multipass microkernels: the
// unipass path is selected when width <= row_tile, the multipass path
// otherwise. update_params is invoked with the operator and width before the
// compute context is built. params/params_size describe the microkernel
// parameters that are copied into the compute context.
//
// Returns:
//   xnn_status_invalid_parameter    - operator type mismatch, or width == 0
//   xnn_status_uninitialized        - XNN_INIT_FLAG_XNNPACK is not set
//   xnn_status_unsupported_hardware - none of datatype_init_flags is set
//   xnn_status_success              - otherwise; the operator state is
//                                     xnn_run_state_skip when batch_size == 0
//                                     and xnn_run_state_ready in all other
//                                     successful cases
static enum xnn_status setup_global_average_pooling_nwc(
    xnn_operator_t global_average_pooling_op,
    size_t batch_size,
    size_t width,
    const void* input,
    void* output,
    size_t log2_element_size,
    const struct gavgpool_parameters gavgpool[restrict XNN_MIN_ELEMENTS(1)],
    uint32_t datatype_init_flags,
    enum xnn_operator_type expected_operator_type,
    const void* params,
    size_t params_size,
    void (*update_params)(xnn_operator_t, size_t),
    pthreadpool_t threadpool)
{
  xnn_operator_t op = global_average_pooling_op;

  if (op->type != expected_operator_type) {
    xnn_log_error("failed to setup operator: operator type mismatch (expected %s, got %s)",
      xnn_operator_type_to_string(expected_operator_type),
      xnn_operator_type_to_string(op->type));
    return xnn_status_invalid_parameter;
  }

  // From here on, any early exit leaves the operator marked as not runnable.
  op->state = xnn_run_state_invalid;

  if ((xnn_params.init_flags & XNN_INIT_FLAG_XNNPACK) == 0) {
    xnn_log_error("failed to setup %s operator: XNNPACK is not initialized",
      xnn_operator_type_to_string(op->type));
    return xnn_status_uninitialized;
  }

  if ((xnn_params.init_flags & datatype_init_flags) == 0) {
    xnn_log_error("failed to setup %s operator: operations on data type are not supported",
      xnn_operator_type_to_string(op->type));
    return xnn_status_unsupported_hardware;
  }

  if (width == 0) {
    xnn_log_error("failed to setup %s operator with width %zu: width must be non-zero",
      xnn_operator_type_to_string(op->type), width);
    return xnn_status_invalid_parameter;
  }

  // An empty batch is valid: there is nothing to compute.
  if (batch_size == 0) {
    op->state = xnn_run_state_skip;
    return xnn_status_success;
  }

  op->input = input;
  op->output = output;
  op->batch_size = batch_size;
  op->input_width = width;

  // Datatype-specific hook, called once the dimensions are recorded.
  update_params(op, width);

  assert(gavgpool->row_tile != 0);

  // Strides are stored in elements on the operator and in bytes in the context.
  const size_t pixel_stride_bytes = op->input_pixel_stride << log2_element_size;
  struct global_average_pooling_nwc_context* context = &op->context.global_average_pooling_nwc;
  *context = (struct global_average_pooling_nwc_context) {
    .input = input,
    .zero = op->zero_buffer,
    .input_pixel_stride = pixel_stride_bytes,
    .input_batch_stride = pixel_stride_bytes * width,
    .input_elements = width,
    .channels = op->channels,
    .output = output,
    .output_batch_stride = op->output_pixel_stride << log2_element_size,
  };
  // Must follow the assignment above, which overwrites the whole context.
  memcpy(&context->params, params, params_size);

  op->compute.type = xnn_parallelization_type_1d;
  op->compute.range[0] = batch_size;

  if (width > gavgpool->row_tile) {
    op->compute.task_1d = (pthreadpool_task_1d_t) xnn_compute_global_average_pooling_nwc_multipass;
    context->multipass_ukernel = gavgpool->multipass;
  } else {
    op->compute.task_1d = (pthreadpool_task_1d_t) xnn_compute_global_average_pooling_nwc_unipass;
    context->unipass_ukernel = gavgpool->unipass;
  }

  op->state = xnn_run_state_ready;
  return xnn_status_success;
}
200*4bdc9457SAndroid Build Coastguard Worker 
// Creates a global average pooling operator for unsigned 8-bit quantized data
// in NWC layout.
//
// Rejects, with xnn_status_invalid_parameter, an input or output scale that is
// not positive and normal, and an output range where output_min >= output_max.
// Rejects, with xnn_status_unsupported_parameter, an input-to-output scale
// ratio outside [2**-8, 2**8). Otherwise forwards to
// create_global_average_pooling_nwc and, when that succeeds, records the input
// zero point and both scales on the new operator.
enum xnn_status xnn_create_global_average_pooling_nwc_qu8(
    size_t channels,
    size_t input_stride,
    size_t output_stride,
    uint8_t input_zero_point,
    float input_scale,
    uint8_t output_zero_point,
    float output_scale,
    uint8_t output_min,
    uint8_t output_max,
    uint32_t flags,
    xnn_operator_t* global_average_pooling_op_out)
{
  if (!isnormal(input_scale) || input_scale <= 0.0f) {
    xnn_log_error(
      "failed to create %s operator with %.7g input scale: scale must be finite, normalized, and positive",
      xnn_operator_type_to_string(xnn_operator_type_global_average_pooling_nwc_qu8), input_scale);
    return xnn_status_invalid_parameter;
  }

  if (!isnormal(output_scale) || output_scale <= 0.0f) {
    xnn_log_error(
      "failed to create %s operator with %.7g output scale: scale must be finite, normalized, and positive",
      xnn_operator_type_to_string(xnn_operator_type_global_average_pooling_nwc_qu8), output_scale);
    return xnn_status_invalid_parameter;
  }

  if (output_max <= output_min) {
    xnn_log_error(
      "failed to create %s operator with [%" PRIu8 ", %" PRIu8 "] output range: range min must be below range max",
      xnn_operator_type_to_string(xnn_operator_type_global_average_pooling_nwc_qu8), output_min, output_max);
    return xnn_status_invalid_parameter;
  }

  const float scale_ratio = input_scale / output_scale;
  if (scale_ratio >= 0x1.0p+8f || scale_ratio < 0x1.0p-8f) {
    xnn_log_error(
      "failed to create %s operator with %.7g input-to-output scale ratio: scale ratio must be in [2**-8, 2**8) range",
      xnn_operator_type_to_string(xnn_operator_type_global_average_pooling_nwc_qu8), scale_ratio);
    return xnn_status_unsupported_parameter;
  }

  // Microkernel parameters are created with zero bias and unit scale here;
  // only the output zero point and clamping bounds come from the caller.
  union xnn_qu8_avgpool_minmax_params minmax_params;
  if (xnn_params.qu8.gavgpool.init.qu8 != NULL) {
    xnn_params.qu8.gavgpool.init.qu8(
      &minmax_params,
      0 /* bias */,
      1.0f /* scale */,
      output_zero_point,
      output_min,
      output_max);
  }

  const enum xnn_status create_status = create_global_average_pooling_nwc(
    channels,
    input_stride,
    output_stride,
    flags,
    0 /* log2(sizeof(uint8_t)) */,
    offsetof(struct xnn_operator, params.qu8_gavgpool),
    &minmax_params,
    sizeof(minmax_params),
    XNN_INIT_FLAG_QU8,
    xnn_operator_type_global_average_pooling_nwc_qu8,
    global_average_pooling_op_out);
  if (create_status != xnn_status_success) {
    return create_status;
  }

  // Keep the quantization parameters on the operator itself.
  xnn_operator_t created_op = *global_average_pooling_op_out;
  created_op->input_zero_point = (int32_t) (uint32_t) input_zero_point;
  created_op->input_scale = input_scale;
  created_op->output_scale = output_scale;
  return xnn_status_success;
}
264*4bdc9457SAndroid Build Coastguard Worker 
// Creates a global average pooling operator for signed 8-bit quantized data
// in NWC layout.
//
// Rejects, with xnn_status_invalid_parameter, an input or output scale that is
// not positive and normal, and an output range where output_min >= output_max.
// Rejects, with xnn_status_unsupported_parameter, an input-to-output scale
// ratio outside [2**-8, 2**8). Otherwise forwards to
// create_global_average_pooling_nwc and, when that succeeds, records the input
// zero point and both scales on the new operator.
enum xnn_status xnn_create_global_average_pooling_nwc_qs8(
    size_t channels,
    size_t input_stride,
    size_t output_stride,
    int8_t input_zero_point,
    float input_scale,
    int8_t output_zero_point,
    float output_scale,
    int8_t output_min,
    int8_t output_max,
    uint32_t flags,
    xnn_operator_t* global_average_pooling_op_out)
{
  if (!isnormal(input_scale) || input_scale <= 0.0f) {
    xnn_log_error(
      "failed to create %s operator with %.7g input scale: scale must be finite, normalized, and positive",
      xnn_operator_type_to_string(xnn_operator_type_global_average_pooling_nwc_qs8), input_scale);
    return xnn_status_invalid_parameter;
  }

  if (!isnormal(output_scale) || output_scale <= 0.0f) {
    xnn_log_error(
      "failed to create %s operator with %.7g output scale: scale must be finite, normalized, and positive",
      xnn_operator_type_to_string(xnn_operator_type_global_average_pooling_nwc_qs8), output_scale);
    return xnn_status_invalid_parameter;
  }

  if (output_max <= output_min) {
    xnn_log_error(
      "failed to create %s operator with [%" PRId8 ", %" PRId8 "] output range: range min must be below range max",
      xnn_operator_type_to_string(xnn_operator_type_global_average_pooling_nwc_qs8), output_min, output_max);
    return xnn_status_invalid_parameter;
  }

  const float scale_ratio = input_scale / output_scale;
  if (scale_ratio >= 0x1.0p+8f || scale_ratio < 0x1.0p-8f) {
    xnn_log_error(
      "failed to create %s operator with %.7g input-to-output scale ratio: scale ratio must be in [2**-8, 2**8) range",
      xnn_operator_type_to_string(xnn_operator_type_global_average_pooling_nwc_qs8), scale_ratio);
    return xnn_status_unsupported_parameter;
  }

  // Microkernel parameters are created with zero bias and unit scale here;
  // only the output zero point and clamping bounds come from the caller.
  union xnn_qs8_avgpool_minmax_params minmax_params;
  if (xnn_params.qs8.gavgpool.init.qs8 != NULL) {
    xnn_params.qs8.gavgpool.init.qs8(
      &minmax_params,
      0 /* bias */,
      1.0f /* scale */,
      output_zero_point,
      output_min,
      output_max);
  }

  const enum xnn_status create_status = create_global_average_pooling_nwc(
    channels,
    input_stride,
    output_stride,
    flags,
    0 /* log2(sizeof(int8_t)) */,
    offsetof(struct xnn_operator, params.qs8_gavgpool),
    &minmax_params,
    sizeof(minmax_params),
    XNN_INIT_FLAG_QS8,
    xnn_operator_type_global_average_pooling_nwc_qs8,
    global_average_pooling_op_out);
  if (create_status != xnn_status_success) {
    return create_status;
  }

  // Keep the quantization parameters on the operator itself.
  xnn_operator_t created_op = *global_average_pooling_op_out;
  created_op->input_zero_point = (int32_t) input_zero_point;
  created_op->input_scale = input_scale;
  created_op->output_scale = output_scale;
  return xnn_status_success;
}
328*4bdc9457SAndroid Build Coastguard Worker 
// Creates a global average pooling operator for half-precision (F16) data in
// NWC layout.
//
// output_min and output_max are supplied as single-precision values. Both must
// be non-NaN, and after conversion to half precision and back the lower bound
// must still be strictly below the upper bound; otherwise
// xnn_status_invalid_parameter is returned. The half-precision bit patterns of
// the bounds are what gets passed to the microkernel parameter initializer.
// The remaining work is delegated to create_global_average_pooling_nwc, whose
// status is returned unchanged.
enum xnn_status xnn_create_global_average_pooling_nwc_f16(
    size_t channels,
    size_t input_stride,
    size_t output_stride,
    float output_min,
    float output_max,
    uint32_t flags,
    xnn_operator_t* global_average_pooling_op_out)
{
  if (isnan(output_min)) {
    xnn_log_error(
      "failed to create %s operator with NaN output lower bound: lower bound must be non-NaN",
      xnn_operator_type_to_string(xnn_operator_type_global_average_pooling_nwc_f16));
    return xnn_status_invalid_parameter;
  }

  if (isnan(output_max)) {
    xnn_log_error(
      "failed to create %s operator with NaN output upper bound: upper bound must be non-NaN",
      xnn_operator_type_to_string(xnn_operator_type_global_average_pooling_nwc_f16));
    return xnn_status_invalid_parameter;
  }

  // Compare the bounds as the half-precision kernel will see them: two
  // distinct fp32 values may collapse to the same fp16 value.
  const uint16_t output_min_as_half = fp16_ieee_from_fp32_value(output_min);
  const uint16_t output_max_as_half = fp16_ieee_from_fp32_value(output_max);
  const float rounded_output_min = fp16_ieee_to_fp32_value(output_min_as_half);
  const float rounded_output_max = fp16_ieee_to_fp32_value(output_max_as_half);
  if (rounded_output_min >= rounded_output_max) {
    xnn_log_error(
      "failed to create %s operator with [%.7g, %.7g] output range: lower bound must be below upper bound",
      xnn_operator_type_to_string(xnn_operator_type_global_average_pooling_nwc_f16),
      rounded_output_min,
      rounded_output_max);
    return xnn_status_invalid_parameter;
  }

  union xnn_f16_scaleminmax_params scaleminmax_params;
  if (xnn_params.f16.gavgpool.init.f16 != NULL) {
    xnn_params.f16.gavgpool.init.f16(
      &scaleminmax_params,
      0 /* scale */,
      output_min_as_half,
      output_max_as_half);
  }

  return create_global_average_pooling_nwc(
    channels,
    input_stride,
    output_stride,
    flags,
    1 /* log2(sizeof(uint16_t)) */,
    offsetof(struct xnn_operator, params.f16_scaleminmax),
    &scaleminmax_params,
    sizeof(scaleminmax_params),
    XNN_INIT_FLAG_F16,
    xnn_operator_type_global_average_pooling_nwc_f16,
    global_average_pooling_op_out);
}
375*4bdc9457SAndroid Build Coastguard Worker 
// Creates an operator of type xnn_operator_type_global_average_pooling_nwc_f32.
//
// Returns xnn_status_invalid_parameter (after logging an error) when either
// bound is NaN or when output_min is not strictly below output_max. Otherwise
// forwards to create_global_average_pooling_nwc and returns its status.
enum xnn_status xnn_create_global_average_pooling_nwc_f32(
    size_t channels,
    size_t input_stride,
    size_t output_stride,
    float output_min,
    float output_max,
    uint32_t flags,
    xnn_operator_t* global_average_pooling_op_out)
{
  const enum xnn_operator_type operator_type = xnn_operator_type_global_average_pooling_nwc_f32;

  // Validate the lower bound first, then the upper bound.
  if (isnan(output_min)) {
    xnn_log_error(
      "failed to create %s operator with NaN output lower bound: lower bound must be non-NaN",
      xnn_operator_type_to_string(operator_type));
    return xnn_status_invalid_parameter;
  }
  if (isnan(output_max)) {
    xnn_log_error(
      "failed to create %s operator with NaN output upper bound: upper bound must be non-NaN",
      xnn_operator_type_to_string(operator_type));
    return xnn_status_invalid_parameter;
  }

  // Neither bound is NaN here, so this is the same test as output_min >= output_max.
  if (!(output_min < output_max)) {
    xnn_log_error(
      "failed to create %s operator with [%.7g, %.7g] output range: lower bound must be below upper bound",
      xnn_operator_type_to_string(operator_type), output_min, output_max);
    return xnn_status_invalid_parameter;
  }

  // The microkernel parameters are only filled in when an init function is registered.
  union xnn_f32_scaleminmax_params params;
  if (xnn_params.f32.gavgpool.init.f32 != NULL) {
    xnn_params.f32.gavgpool.init.f32(&params, 0.0f /* scale */, output_min, output_max);
  }

  const uint32_t log2_element_size = 2;  // log2(sizeof(float))
  const size_t params_offset = offsetof(struct xnn_operator, params.f32_scaleminmax);
  const enum xnn_status status = create_global_average_pooling_nwc(
    channels, input_stride, output_stride, flags,
    log2_element_size,
    params_offset,
    &params, sizeof(params),
    XNN_INIT_FLAG_F32,
    operator_type,
    global_average_pooling_op_out);
  return status;
}
420*4bdc9457SAndroid Build Coastguard Worker 
// Recomputes the QU8 gavgpool parameters for the given width:
//   bias  = -(width * input_zero_point)
//   scale = input_scale / (output_scale * width)
// and hands both to the registered qu8 update function.
static void update_params_qu8(
  xnn_operator_t global_average_pooling_op,
  size_t width)
{
  const int32_t width_i32 = (int32_t) width;
  const float width_f32 = (float) width;

  const int32_t bias = -(width_i32 * global_average_pooling_op->input_zero_point);
  const float scale = global_average_pooling_op->input_scale / (global_average_pooling_op->output_scale * width_f32);

  xnn_params.qu8.gavgpool.update.qu8(
    &global_average_pooling_op->params.qu8_gavgpool,
    bias,
    scale);
}
429*4bdc9457SAndroid Build Coastguard Worker 
// QU8 entry point for operator setup.
//
// Forwards to setup_global_average_pooling_nwc with the QU8-specific
// arguments (xnn_params.qu8.gavgpool, XNN_INIT_FLAG_QU8, the operator's
// qu8_gavgpool parameters and update_params_qu8) and returns its status.
enum xnn_status xnn_setup_global_average_pooling_nwc_qu8(
    xnn_operator_t global_average_pooling_op,
    size_t batch_size,
    size_t width,
    const uint8_t* input,
    uint8_t* output,
    pthreadpool_t threadpool)
{
  void* const params = &global_average_pooling_op->params.qu8_gavgpool;
  const size_t params_size = sizeof(global_average_pooling_op->params.qu8_gavgpool);

  const enum xnn_status status = setup_global_average_pooling_nwc(
    global_average_pooling_op,
    batch_size, width,
    input, output,
    0 /* log2(sizeof(uint8_t)) */,
    &xnn_params.qu8.gavgpool,
    XNN_INIT_FLAG_QU8,
    xnn_operator_type_global_average_pooling_nwc_qu8,
    params,
    params_size,
    update_params_qu8,
    threadpool);
  return status;
}
451*4bdc9457SAndroid Build Coastguard Worker 
// Recomputes the QS8 gavgpool parameters for the given width:
//   bias  = -(width * input_zero_point)
//   scale = input_scale / (output_scale * width)
// and hands both to the registered qs8 update function.
static void update_params_qs8(
  xnn_operator_t global_average_pooling_op,
  size_t width)
{
  const int32_t width_i32 = (int32_t) width;
  const float width_f32 = (float) width;

  const int32_t bias = -(width_i32 * global_average_pooling_op->input_zero_point);
  const float scale = global_average_pooling_op->input_scale / (global_average_pooling_op->output_scale * width_f32);

  xnn_params.qs8.gavgpool.update.qs8(
    &global_average_pooling_op->params.qs8_gavgpool,
    bias,
    scale);
}
460*4bdc9457SAndroid Build Coastguard Worker 
// QS8 entry point for operator setup.
//
// Forwards to setup_global_average_pooling_nwc with the QS8-specific
// arguments (xnn_params.qs8.gavgpool, XNN_INIT_FLAG_QS8, the operator's
// qs8_gavgpool parameters and update_params_qs8) and returns its status.
enum xnn_status xnn_setup_global_average_pooling_nwc_qs8(
    xnn_operator_t global_average_pooling_op,
    size_t batch_size,
    size_t width,
    const int8_t* input,
    int8_t* output,
    pthreadpool_t threadpool)
{
  void* const params = &global_average_pooling_op->params.qs8_gavgpool;
  const size_t params_size = sizeof(global_average_pooling_op->params.qs8_gavgpool);

  const enum xnn_status status = setup_global_average_pooling_nwc(
    global_average_pooling_op,
    batch_size, width,
    input, output,
    0 /* log2(sizeof(int8_t)) */,
    &xnn_params.qs8.gavgpool,
    XNN_INIT_FLAG_QS8,
    xnn_operator_type_global_average_pooling_nwc_qs8,
    params,
    params_size,
    update_params_qs8,
    threadpool);
  return status;
}
482*4bdc9457SAndroid Build Coastguard Worker 
// Passes 1/width, converted from fp32 to IEEE fp16 bits, to the registered
// f16 update function for the operator's f16_scaleminmax parameters.
static void update_params_f16(
  xnn_operator_t global_average_pooling_op,
  size_t width)
{
  const float reciprocal_width = 1.0f / (float) width;
  xnn_params.f16.gavgpool.update.f16(
    &global_average_pooling_op->params.f16_scaleminmax,
    fp16_ieee_from_fp32_value(reciprocal_width));
}
491*4bdc9457SAndroid Build Coastguard Worker 
// F16 entry point for operator setup.
//
// Forwards to setup_global_average_pooling_nwc with the F16-specific
// arguments (xnn_params.f16.gavgpool, XNN_INIT_FLAG_F16, the operator's
// f16_scaleminmax parameters and update_params_f16) and returns its status.
enum xnn_status xnn_setup_global_average_pooling_nwc_f16(
    xnn_operator_t global_average_pooling_op,
    size_t batch_size,
    size_t width,
    const void* input,
    void* output,
    pthreadpool_t threadpool)
{
  void* const params = &global_average_pooling_op->params.f16_scaleminmax;
  const size_t params_size = sizeof(global_average_pooling_op->params.f16_scaleminmax);

  const enum xnn_status status = setup_global_average_pooling_nwc(
    global_average_pooling_op,
    batch_size, width,
    input, output,
    1 /* log2(sizeof(uint16_t)) */,
    &xnn_params.f16.gavgpool,
    XNN_INIT_FLAG_F16,
    xnn_operator_type_global_average_pooling_nwc_f16,
    params,
    params_size,
    update_params_f16,
    threadpool);
  return status;
}
513*4bdc9457SAndroid Build Coastguard Worker 
// Passes 1/width to the registered f32 update function for the operator's
// f32_scaleminmax parameters.
static void update_params_f32(
  xnn_operator_t global_average_pooling_op,
  size_t width)
{
  const float reciprocal_width = 1.0f / (float) width;
  xnn_params.f32.gavgpool.update.f32(
    &global_average_pooling_op->params.f32_scaleminmax,
    reciprocal_width);
}
520*4bdc9457SAndroid Build Coastguard Worker 
// F32 entry point for operator setup.
//
// Forwards to setup_global_average_pooling_nwc with the F32-specific
// arguments (xnn_params.f32.gavgpool, XNN_INIT_FLAG_F32, the operator's
// f32_scaleminmax parameters and update_params_f32) and returns its status.
enum xnn_status xnn_setup_global_average_pooling_nwc_f32(
    xnn_operator_t global_average_pooling_op,
    size_t batch_size,
    size_t width,
    const float* input,
    float* output,
    pthreadpool_t threadpool)
{
  void* const params = &global_average_pooling_op->params.f32_scaleminmax;
  const size_t params_size = sizeof(global_average_pooling_op->params.f32_scaleminmax);

  const enum xnn_status status = setup_global_average_pooling_nwc(
    global_average_pooling_op,
    batch_size, width,
    input, output,
    2 /* log2(sizeof(float)) */,
    &xnn_params.f32.gavgpool,
    XNN_INIT_FLAG_F32,
    xnn_operator_type_global_average_pooling_nwc_f32,
    params,
    params_size,
    update_params_f32,
    threadpool);
  return status;
}
542