xref: /aosp_15_r20/external/XNNPACK/test/convolution-test-helpers.cc (revision 4bdc94577ba0e567308109d787f7fec7b531ce36)
1*4bdc9457SAndroid Build Coastguard Worker // Copyright 2022 Google LLC
2*4bdc9457SAndroid Build Coastguard Worker //
3*4bdc9457SAndroid Build Coastguard Worker // This source code is licensed under the BSD-style license found in the
4*4bdc9457SAndroid Build Coastguard Worker // LICENSE file in the root directory of this source tree.
5*4bdc9457SAndroid Build Coastguard Worker 
6*4bdc9457SAndroid Build Coastguard Worker #include "convolution-test-helpers.h"
7*4bdc9457SAndroid Build Coastguard Worker 
8*4bdc9457SAndroid Build Coastguard Worker #include <algorithm>
9*4bdc9457SAndroid Build Coastguard Worker #include <cstdint>
10*4bdc9457SAndroid Build Coastguard Worker #include <cstddef>
11*4bdc9457SAndroid Build Coastguard Worker #include <vector>
12*4bdc9457SAndroid Build Coastguard Worker 
13*4bdc9457SAndroid Build Coastguard Worker namespace xnnpack{
14*4bdc9457SAndroid Build Coastguard Worker 
compute_convolution_qs8_reference_results(size_t batch_size,size_t output_height,size_t output_width,size_t input_height,size_t input_width,size_t input_padding_top,size_t input_padding_right,size_t input_padding_bottom,size_t input_padding_left,size_t kernel_height,size_t kernel_width,size_t subsampling_height,size_t subsampling_width,size_t dilation_height,size_t dilation_width,size_t groups,size_t group_input_channels,size_t group_output_channels,size_t input_channel_stride,int8_t input_zero_point,const std::vector<int8_t> & input,const std::vector<int8_t> & filter,std::vector<int32_t> & accumulators,bool has_bias,const std::vector<int32_t> & bias)15*4bdc9457SAndroid Build Coastguard Worker void compute_convolution_qs8_reference_results(
16*4bdc9457SAndroid Build Coastguard Worker     size_t batch_size,
17*4bdc9457SAndroid Build Coastguard Worker     size_t output_height,
18*4bdc9457SAndroid Build Coastguard Worker     size_t output_width,
19*4bdc9457SAndroid Build Coastguard Worker     size_t input_height,
20*4bdc9457SAndroid Build Coastguard Worker     size_t input_width,
21*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_top,
22*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_right,
23*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_bottom,
24*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_left,
25*4bdc9457SAndroid Build Coastguard Worker     size_t kernel_height,
26*4bdc9457SAndroid Build Coastguard Worker     size_t kernel_width,
27*4bdc9457SAndroid Build Coastguard Worker     size_t subsampling_height,
28*4bdc9457SAndroid Build Coastguard Worker     size_t subsampling_width,
29*4bdc9457SAndroid Build Coastguard Worker     size_t dilation_height,
30*4bdc9457SAndroid Build Coastguard Worker     size_t dilation_width,
31*4bdc9457SAndroid Build Coastguard Worker     size_t groups,
32*4bdc9457SAndroid Build Coastguard Worker     size_t group_input_channels,
33*4bdc9457SAndroid Build Coastguard Worker     size_t group_output_channels,
34*4bdc9457SAndroid Build Coastguard Worker     size_t input_channel_stride,
35*4bdc9457SAndroid Build Coastguard Worker     int8_t input_zero_point,
36*4bdc9457SAndroid Build Coastguard Worker     const std::vector<int8_t>& input,
37*4bdc9457SAndroid Build Coastguard Worker     const std::vector<int8_t>& filter,
38*4bdc9457SAndroid Build Coastguard Worker     std::vector<int32_t>& accumulators,
39*4bdc9457SAndroid Build Coastguard Worker     bool has_bias,
40*4bdc9457SAndroid Build Coastguard Worker     const std::vector<int32_t>& bias)
41*4bdc9457SAndroid Build Coastguard Worker {
42*4bdc9457SAndroid Build Coastguard Worker   if (!has_bias) {
43*4bdc9457SAndroid Build Coastguard Worker     std::fill(accumulators.begin(), accumulators.end(), 0);
44*4bdc9457SAndroid Build Coastguard Worker   }
45*4bdc9457SAndroid Build Coastguard Worker 
46*4bdc9457SAndroid Build Coastguard Worker   for (size_t i = 0; i < batch_size; i++) {
47*4bdc9457SAndroid Build Coastguard Worker     for (size_t oy = 0; oy < output_height; oy++) {
48*4bdc9457SAndroid Build Coastguard Worker       for (size_t ox = 0; ox < output_width; ox++) {
49*4bdc9457SAndroid Build Coastguard Worker         // Initialize Bias
50*4bdc9457SAndroid Build Coastguard Worker         if (has_bias) {
51*4bdc9457SAndroid Build Coastguard Worker           for (size_t g = 0; g < groups; g++) {
52*4bdc9457SAndroid Build Coastguard Worker             for (size_t oc = 0; oc < group_output_channels; oc++) {
53*4bdc9457SAndroid Build Coastguard Worker               accumulators[(((i * output_height + oy) * output_width + ox) * groups + g) * group_output_channels + oc] =
54*4bdc9457SAndroid Build Coastguard Worker                   bias[g * group_output_channels + oc];
55*4bdc9457SAndroid Build Coastguard Worker             }
56*4bdc9457SAndroid Build Coastguard Worker           }
57*4bdc9457SAndroid Build Coastguard Worker         }
58*4bdc9457SAndroid Build Coastguard Worker         // Compute reference results.
59*4bdc9457SAndroid Build Coastguard Worker         for (size_t ky = 0; ky < kernel_height; ky++) {
60*4bdc9457SAndroid Build Coastguard Worker           const size_t iy = oy * subsampling_height + ky * dilation_height - input_padding_top;
61*4bdc9457SAndroid Build Coastguard Worker           if (iy < input_height) {
62*4bdc9457SAndroid Build Coastguard Worker             for (size_t kx = 0; kx < kernel_width; kx++) {
63*4bdc9457SAndroid Build Coastguard Worker               const size_t ix = ox * subsampling_width + kx * dilation_width - input_padding_left;
64*4bdc9457SAndroid Build Coastguard Worker               if (ix < input_width) {
65*4bdc9457SAndroid Build Coastguard Worker                 for (size_t g = 0; g < groups; g++) {
66*4bdc9457SAndroid Build Coastguard Worker                   for (size_t oc = 0; oc < group_output_channels; oc++) {
67*4bdc9457SAndroid Build Coastguard Worker                     for (size_t ic = 0; ic < group_input_channels; ic++) {
68*4bdc9457SAndroid Build Coastguard Worker                       accumulators[(((i * output_height + oy) * output_width + ox) * groups + g) * group_output_channels + oc] +=
69*4bdc9457SAndroid Build Coastguard Worker                         (int32_t(input[((i * input_height + iy) * input_width + ix) * input_channel_stride +
70*4bdc9457SAndroid Build Coastguard Worker                                     g * group_input_channels + ic]) -
71*4bdc9457SAndroid Build Coastguard Worker                          int32_t(input_zero_point)) *
72*4bdc9457SAndroid Build Coastguard Worker                         int32_t(filter[(((g * group_output_channels + oc) * kernel_height + ky) * kernel_width + kx) * group_input_channels + ic]);
73*4bdc9457SAndroid Build Coastguard Worker                     }
74*4bdc9457SAndroid Build Coastguard Worker                   }
75*4bdc9457SAndroid Build Coastguard Worker                 }
76*4bdc9457SAndroid Build Coastguard Worker               }
77*4bdc9457SAndroid Build Coastguard Worker             }
78*4bdc9457SAndroid Build Coastguard Worker           }
79*4bdc9457SAndroid Build Coastguard Worker         }
80*4bdc9457SAndroid Build Coastguard Worker       }
81*4bdc9457SAndroid Build Coastguard Worker     }
82*4bdc9457SAndroid Build Coastguard Worker   }
83*4bdc9457SAndroid Build Coastguard Worker }
84*4bdc9457SAndroid Build Coastguard Worker 
compute_convolution_qs8_reference_results(size_t batch_size,size_t output_height,size_t output_width,size_t input_height,size_t input_width,size_t input_padding_top,size_t input_padding_right,size_t input_padding_bottom,size_t input_padding_left,size_t kernel_height,size_t kernel_width,size_t subsampling_height,size_t subsampling_width,size_t dilation_height,size_t dilation_width,size_t groups,size_t group_input_channels,size_t group_output_channels,int8_t input_zero_point,const std::vector<int8_t> & input,const std::vector<int8_t> & filter,std::vector<int32_t> & accumulators,bool has_bias,const std::vector<int32_t> & bias)85*4bdc9457SAndroid Build Coastguard Worker void compute_convolution_qs8_reference_results(
86*4bdc9457SAndroid Build Coastguard Worker     size_t batch_size,
87*4bdc9457SAndroid Build Coastguard Worker     size_t output_height,
88*4bdc9457SAndroid Build Coastguard Worker     size_t output_width,
89*4bdc9457SAndroid Build Coastguard Worker     size_t input_height,
90*4bdc9457SAndroid Build Coastguard Worker     size_t input_width,
91*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_top,
92*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_right,
93*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_bottom,
94*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_left,
95*4bdc9457SAndroid Build Coastguard Worker     size_t kernel_height,
96*4bdc9457SAndroid Build Coastguard Worker     size_t kernel_width,
97*4bdc9457SAndroid Build Coastguard Worker     size_t subsampling_height,
98*4bdc9457SAndroid Build Coastguard Worker     size_t subsampling_width,
99*4bdc9457SAndroid Build Coastguard Worker     size_t dilation_height,
100*4bdc9457SAndroid Build Coastguard Worker     size_t dilation_width,
101*4bdc9457SAndroid Build Coastguard Worker     size_t groups,
102*4bdc9457SAndroid Build Coastguard Worker     size_t group_input_channels,
103*4bdc9457SAndroid Build Coastguard Worker     size_t group_output_channels,
104*4bdc9457SAndroid Build Coastguard Worker     int8_t input_zero_point,
105*4bdc9457SAndroid Build Coastguard Worker     const std::vector<int8_t>& input,
106*4bdc9457SAndroid Build Coastguard Worker     const std::vector<int8_t>& filter,
107*4bdc9457SAndroid Build Coastguard Worker     std::vector<int32_t>& accumulators,
108*4bdc9457SAndroid Build Coastguard Worker     bool has_bias,
109*4bdc9457SAndroid Build Coastguard Worker     const std::vector<int32_t>& bias)
110*4bdc9457SAndroid Build Coastguard Worker {
111*4bdc9457SAndroid Build Coastguard Worker   compute_convolution_qs8_reference_results(
112*4bdc9457SAndroid Build Coastguard Worker       batch_size,
113*4bdc9457SAndroid Build Coastguard Worker       output_height,
114*4bdc9457SAndroid Build Coastguard Worker       output_width,
115*4bdc9457SAndroid Build Coastguard Worker       input_height,
116*4bdc9457SAndroid Build Coastguard Worker       input_width,
117*4bdc9457SAndroid Build Coastguard Worker       input_padding_top,
118*4bdc9457SAndroid Build Coastguard Worker       input_padding_right,
119*4bdc9457SAndroid Build Coastguard Worker       input_padding_bottom,
120*4bdc9457SAndroid Build Coastguard Worker       input_padding_left,
121*4bdc9457SAndroid Build Coastguard Worker       kernel_height,
122*4bdc9457SAndroid Build Coastguard Worker       kernel_width,
123*4bdc9457SAndroid Build Coastguard Worker       subsampling_height,
124*4bdc9457SAndroid Build Coastguard Worker       subsampling_width,
125*4bdc9457SAndroid Build Coastguard Worker       dilation_height,
126*4bdc9457SAndroid Build Coastguard Worker       dilation_width,
127*4bdc9457SAndroid Build Coastguard Worker       groups,
128*4bdc9457SAndroid Build Coastguard Worker       group_input_channels,
129*4bdc9457SAndroid Build Coastguard Worker       group_output_channels,
130*4bdc9457SAndroid Build Coastguard Worker       groups * group_input_channels,
131*4bdc9457SAndroid Build Coastguard Worker       input_zero_point,
132*4bdc9457SAndroid Build Coastguard Worker       input,
133*4bdc9457SAndroid Build Coastguard Worker       filter,
134*4bdc9457SAndroid Build Coastguard Worker       accumulators,
135*4bdc9457SAndroid Build Coastguard Worker       has_bias,
136*4bdc9457SAndroid Build Coastguard Worker       bias);
137*4bdc9457SAndroid Build Coastguard Worker }
138*4bdc9457SAndroid Build Coastguard Worker 
compute_convolution_qu8_reference_results(size_t batch_size,size_t output_height,size_t output_width,size_t input_height,size_t input_width,size_t input_padding_top,size_t input_padding_right,size_t input_padding_bottom,size_t input_padding_left,size_t kernel_height,size_t kernel_width,size_t subsampling_height,size_t subsampling_width,size_t dilation_height,size_t dilation_width,size_t groups,size_t group_input_channels,size_t group_output_channels,size_t input_channel_stride,uint8_t input_zero_point,uint8_t kernel_zero_point,const std::vector<uint8_t> & input,const std::vector<uint8_t> & filter,std::vector<int32_t> & accumulators,bool has_bias,const std::vector<int32_t> & bias)139*4bdc9457SAndroid Build Coastguard Worker void compute_convolution_qu8_reference_results(
140*4bdc9457SAndroid Build Coastguard Worker     size_t batch_size,
141*4bdc9457SAndroid Build Coastguard Worker     size_t output_height,
142*4bdc9457SAndroid Build Coastguard Worker     size_t output_width,
143*4bdc9457SAndroid Build Coastguard Worker     size_t input_height,
144*4bdc9457SAndroid Build Coastguard Worker     size_t input_width,
145*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_top,
146*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_right,
147*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_bottom,
148*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_left,
149*4bdc9457SAndroid Build Coastguard Worker     size_t kernel_height,
150*4bdc9457SAndroid Build Coastguard Worker     size_t kernel_width,
151*4bdc9457SAndroid Build Coastguard Worker     size_t subsampling_height,
152*4bdc9457SAndroid Build Coastguard Worker     size_t subsampling_width,
153*4bdc9457SAndroid Build Coastguard Worker     size_t dilation_height,
154*4bdc9457SAndroid Build Coastguard Worker     size_t dilation_width,
155*4bdc9457SAndroid Build Coastguard Worker     size_t groups,
156*4bdc9457SAndroid Build Coastguard Worker     size_t group_input_channels,
157*4bdc9457SAndroid Build Coastguard Worker     size_t group_output_channels,
158*4bdc9457SAndroid Build Coastguard Worker     size_t input_channel_stride,
159*4bdc9457SAndroid Build Coastguard Worker     uint8_t input_zero_point,
160*4bdc9457SAndroid Build Coastguard Worker     uint8_t kernel_zero_point,
161*4bdc9457SAndroid Build Coastguard Worker     const std::vector<uint8_t>& input,
162*4bdc9457SAndroid Build Coastguard Worker     const std::vector<uint8_t>& filter,
163*4bdc9457SAndroid Build Coastguard Worker     std::vector<int32_t>& accumulators,
164*4bdc9457SAndroid Build Coastguard Worker     bool has_bias,
165*4bdc9457SAndroid Build Coastguard Worker     const std::vector<int32_t>& bias)
166*4bdc9457SAndroid Build Coastguard Worker {
167*4bdc9457SAndroid Build Coastguard Worker   if (!has_bias) {
168*4bdc9457SAndroid Build Coastguard Worker     std::fill(accumulators.begin(), accumulators.end(), 0);
169*4bdc9457SAndroid Build Coastguard Worker   }
170*4bdc9457SAndroid Build Coastguard Worker 
171*4bdc9457SAndroid Build Coastguard Worker   for (size_t i = 0; i < batch_size; i++) {
172*4bdc9457SAndroid Build Coastguard Worker     for (size_t oy = 0; oy < output_height; oy++) {
173*4bdc9457SAndroid Build Coastguard Worker       for (size_t ox = 0; ox < output_width; ox++) {
174*4bdc9457SAndroid Build Coastguard Worker         // Initialize Bias
175*4bdc9457SAndroid Build Coastguard Worker         if (has_bias) {
176*4bdc9457SAndroid Build Coastguard Worker           for (size_t g = 0; g < groups; g++) {
177*4bdc9457SAndroid Build Coastguard Worker             for (size_t oc = 0; oc < group_output_channels; oc++) {
178*4bdc9457SAndroid Build Coastguard Worker               accumulators[(((i * output_height + oy) * output_width + ox) * groups + g) * group_output_channels + oc] =
179*4bdc9457SAndroid Build Coastguard Worker                   bias[g * group_output_channels + oc];
180*4bdc9457SAndroid Build Coastguard Worker             }
181*4bdc9457SAndroid Build Coastguard Worker           }
182*4bdc9457SAndroid Build Coastguard Worker         }
183*4bdc9457SAndroid Build Coastguard Worker         // Compute reference results.
184*4bdc9457SAndroid Build Coastguard Worker         for (size_t ky = 0; ky < kernel_height; ky++) {
185*4bdc9457SAndroid Build Coastguard Worker           const size_t iy = oy * subsampling_height + ky * dilation_height - input_padding_top;
186*4bdc9457SAndroid Build Coastguard Worker           if (iy < input_height) {
187*4bdc9457SAndroid Build Coastguard Worker             for (size_t kx = 0; kx < kernel_width; kx++) {
188*4bdc9457SAndroid Build Coastguard Worker               const size_t ix = ox * subsampling_width + kx * dilation_width - input_padding_left;
189*4bdc9457SAndroid Build Coastguard Worker               if (ix < input_width) {
190*4bdc9457SAndroid Build Coastguard Worker                 for (size_t g = 0; g < groups; g++) {
191*4bdc9457SAndroid Build Coastguard Worker                   for (size_t oc = 0; oc < group_output_channels; oc++) {
192*4bdc9457SAndroid Build Coastguard Worker                     for (size_t ic = 0; ic < group_input_channels; ic++) {
193*4bdc9457SAndroid Build Coastguard Worker                       accumulators[(((i * output_height + oy) * output_width + ox) * groups + g) * group_output_channels + oc] +=
194*4bdc9457SAndroid Build Coastguard Worker                         (int32_t(input[((i * input_height + iy) * input_width + ix) * input_channel_stride + g * group_input_channels + ic]) -
195*4bdc9457SAndroid Build Coastguard Worker                          int32_t(input_zero_point)) *
196*4bdc9457SAndroid Build Coastguard Worker                         (int32_t(filter[(((g * group_output_channels + oc) * kernel_height + ky) * kernel_width + kx) * group_input_channels + ic]) - int32_t(kernel_zero_point));
197*4bdc9457SAndroid Build Coastguard Worker                     }
198*4bdc9457SAndroid Build Coastguard Worker                   }
199*4bdc9457SAndroid Build Coastguard Worker                 }
200*4bdc9457SAndroid Build Coastguard Worker               }
201*4bdc9457SAndroid Build Coastguard Worker             }
202*4bdc9457SAndroid Build Coastguard Worker           }
203*4bdc9457SAndroid Build Coastguard Worker         }
204*4bdc9457SAndroid Build Coastguard Worker       }
205*4bdc9457SAndroid Build Coastguard Worker     }
206*4bdc9457SAndroid Build Coastguard Worker   }
207*4bdc9457SAndroid Build Coastguard Worker }
208*4bdc9457SAndroid Build Coastguard Worker 
compute_convolution_qu8_reference_results(size_t batch_size,size_t output_height,size_t output_width,size_t input_height,size_t input_width,size_t input_padding_top,size_t input_padding_right,size_t input_padding_bottom,size_t input_padding_left,size_t kernel_height,size_t kernel_width,size_t subsampling_height,size_t subsampling_width,size_t dilation_height,size_t dilation_width,size_t groups,size_t group_input_channels,size_t group_output_channels,uint8_t input_zero_point,uint8_t kernel_zero_point,const std::vector<uint8_t> & input,const std::vector<uint8_t> & filter,std::vector<int32_t> & accumulators,bool has_bias,const std::vector<int32_t> & bias)209*4bdc9457SAndroid Build Coastguard Worker void compute_convolution_qu8_reference_results(
210*4bdc9457SAndroid Build Coastguard Worker     size_t batch_size,
211*4bdc9457SAndroid Build Coastguard Worker     size_t output_height,
212*4bdc9457SAndroid Build Coastguard Worker     size_t output_width,
213*4bdc9457SAndroid Build Coastguard Worker     size_t input_height,
214*4bdc9457SAndroid Build Coastguard Worker     size_t input_width,
215*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_top,
216*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_right,
217*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_bottom,
218*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_left,
219*4bdc9457SAndroid Build Coastguard Worker     size_t kernel_height,
220*4bdc9457SAndroid Build Coastguard Worker     size_t kernel_width,
221*4bdc9457SAndroid Build Coastguard Worker     size_t subsampling_height,
222*4bdc9457SAndroid Build Coastguard Worker     size_t subsampling_width,
223*4bdc9457SAndroid Build Coastguard Worker     size_t dilation_height,
224*4bdc9457SAndroid Build Coastguard Worker     size_t dilation_width,
225*4bdc9457SAndroid Build Coastguard Worker     size_t groups,
226*4bdc9457SAndroid Build Coastguard Worker     size_t group_input_channels,
227*4bdc9457SAndroid Build Coastguard Worker     size_t group_output_channels,
228*4bdc9457SAndroid Build Coastguard Worker     uint8_t input_zero_point,
229*4bdc9457SAndroid Build Coastguard Worker     uint8_t kernel_zero_point,
230*4bdc9457SAndroid Build Coastguard Worker     const std::vector<uint8_t>& input,
231*4bdc9457SAndroid Build Coastguard Worker     const std::vector<uint8_t>& filter,
232*4bdc9457SAndroid Build Coastguard Worker     std::vector<int32_t>& accumulators,
233*4bdc9457SAndroid Build Coastguard Worker     bool has_bias,
234*4bdc9457SAndroid Build Coastguard Worker     const std::vector<int32_t>& bias)
235*4bdc9457SAndroid Build Coastguard Worker {
236*4bdc9457SAndroid Build Coastguard Worker   compute_convolution_qu8_reference_results(
237*4bdc9457SAndroid Build Coastguard Worker       batch_size,
238*4bdc9457SAndroid Build Coastguard Worker       output_height,
239*4bdc9457SAndroid Build Coastguard Worker       output_width,
240*4bdc9457SAndroid Build Coastguard Worker       input_height,
241*4bdc9457SAndroid Build Coastguard Worker       input_width,
242*4bdc9457SAndroid Build Coastguard Worker       input_padding_top,
243*4bdc9457SAndroid Build Coastguard Worker       input_padding_right,
244*4bdc9457SAndroid Build Coastguard Worker       input_padding_bottom,
245*4bdc9457SAndroid Build Coastguard Worker       input_padding_left,
246*4bdc9457SAndroid Build Coastguard Worker       kernel_height,
247*4bdc9457SAndroid Build Coastguard Worker       kernel_width,
248*4bdc9457SAndroid Build Coastguard Worker       subsampling_height,
249*4bdc9457SAndroid Build Coastguard Worker       subsampling_width,
250*4bdc9457SAndroid Build Coastguard Worker       dilation_height,
251*4bdc9457SAndroid Build Coastguard Worker       dilation_width,
252*4bdc9457SAndroid Build Coastguard Worker       groups,
253*4bdc9457SAndroid Build Coastguard Worker       group_input_channels,
254*4bdc9457SAndroid Build Coastguard Worker       group_output_channels,
255*4bdc9457SAndroid Build Coastguard Worker       groups * group_input_channels,
256*4bdc9457SAndroid Build Coastguard Worker       input_zero_point,
257*4bdc9457SAndroid Build Coastguard Worker       kernel_zero_point,
258*4bdc9457SAndroid Build Coastguard Worker       input,
259*4bdc9457SAndroid Build Coastguard Worker       filter,
260*4bdc9457SAndroid Build Coastguard Worker       accumulators,
261*4bdc9457SAndroid Build Coastguard Worker       has_bias,
262*4bdc9457SAndroid Build Coastguard Worker       bias);
263*4bdc9457SAndroid Build Coastguard Worker }
264*4bdc9457SAndroid Build Coastguard Worker 
compute_depthwise_convolution_qs8_reference_results(size_t batch_size,size_t output_height,size_t output_width,size_t input_height,size_t input_width,size_t input_padding_top,size_t input_padding_right,size_t input_padding_bottom,size_t input_padding_left,size_t kernel_height,size_t kernel_width,size_t subsampling_height,size_t subsampling_width,size_t dilation_height,size_t dilation_width,size_t input_channels,size_t depth_multiplier,size_t input_channel_stride,int8_t input_zero_point,const std::vector<int8_t> & input,const std::vector<int8_t> & filter,std::vector<int32_t> & accumulators,bool has_bias,const std::vector<int32_t> & bias)265*4bdc9457SAndroid Build Coastguard Worker void compute_depthwise_convolution_qs8_reference_results(
266*4bdc9457SAndroid Build Coastguard Worker     size_t batch_size,
267*4bdc9457SAndroid Build Coastguard Worker     size_t output_height,
268*4bdc9457SAndroid Build Coastguard Worker     size_t output_width,
269*4bdc9457SAndroid Build Coastguard Worker     size_t input_height,
270*4bdc9457SAndroid Build Coastguard Worker     size_t input_width,
271*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_top,
272*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_right,
273*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_bottom,
274*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_left,
275*4bdc9457SAndroid Build Coastguard Worker     size_t kernel_height,
276*4bdc9457SAndroid Build Coastguard Worker     size_t kernel_width,
277*4bdc9457SAndroid Build Coastguard Worker     size_t subsampling_height,
278*4bdc9457SAndroid Build Coastguard Worker     size_t subsampling_width,
279*4bdc9457SAndroid Build Coastguard Worker     size_t dilation_height,
280*4bdc9457SAndroid Build Coastguard Worker     size_t dilation_width,
281*4bdc9457SAndroid Build Coastguard Worker     size_t input_channels,
282*4bdc9457SAndroid Build Coastguard Worker     size_t depth_multiplier,
283*4bdc9457SAndroid Build Coastguard Worker     size_t input_channel_stride,
284*4bdc9457SAndroid Build Coastguard Worker     int8_t input_zero_point,
285*4bdc9457SAndroid Build Coastguard Worker     const std::vector<int8_t>& input,
286*4bdc9457SAndroid Build Coastguard Worker     const std::vector<int8_t>& filter,
287*4bdc9457SAndroid Build Coastguard Worker     std::vector<int32_t>& accumulators,
288*4bdc9457SAndroid Build Coastguard Worker     bool has_bias,
289*4bdc9457SAndroid Build Coastguard Worker     const std::vector<int32_t>& bias)
290*4bdc9457SAndroid Build Coastguard Worker {
291*4bdc9457SAndroid Build Coastguard Worker   if (!has_bias) {
292*4bdc9457SAndroid Build Coastguard Worker     std::fill(accumulators.begin(), accumulators.end(), 0);
293*4bdc9457SAndroid Build Coastguard Worker   }
294*4bdc9457SAndroid Build Coastguard Worker 
295*4bdc9457SAndroid Build Coastguard Worker   for (size_t i = 0; i < batch_size; i++) {
296*4bdc9457SAndroid Build Coastguard Worker     for (size_t oy = 0; oy < output_height; oy++) {
297*4bdc9457SAndroid Build Coastguard Worker       for (size_t ox = 0; ox < output_width; ox++) {
298*4bdc9457SAndroid Build Coastguard Worker         // Initialize Bias
299*4bdc9457SAndroid Build Coastguard Worker         if (has_bias) {
300*4bdc9457SAndroid Build Coastguard Worker           for (size_t g = 0; g < input_channels; g++) {
301*4bdc9457SAndroid Build Coastguard Worker             for (size_t oc = 0; oc < depth_multiplier; oc++) {
302*4bdc9457SAndroid Build Coastguard Worker               accumulators[(((i * output_height + oy) * output_width + ox) * input_channels + g) * depth_multiplier + oc] =
303*4bdc9457SAndroid Build Coastguard Worker                   bias[g * depth_multiplier + oc];
304*4bdc9457SAndroid Build Coastguard Worker             }
305*4bdc9457SAndroid Build Coastguard Worker           }
306*4bdc9457SAndroid Build Coastguard Worker         }
307*4bdc9457SAndroid Build Coastguard Worker         // Compute reference results.
308*4bdc9457SAndroid Build Coastguard Worker         for (size_t ky = 0; ky < kernel_height; ky++) {
309*4bdc9457SAndroid Build Coastguard Worker           const size_t iy = oy * subsampling_height + ky * dilation_height - input_padding_top;
310*4bdc9457SAndroid Build Coastguard Worker           if (iy < input_height) {
311*4bdc9457SAndroid Build Coastguard Worker             for (size_t kx = 0; kx < kernel_width; kx++) {
312*4bdc9457SAndroid Build Coastguard Worker               const size_t ix = ox * subsampling_width + kx * dilation_width - input_padding_left;
313*4bdc9457SAndroid Build Coastguard Worker               if (ix < input_width) {
314*4bdc9457SAndroid Build Coastguard Worker                 for (size_t g = 0; g < input_channels; g++) {
315*4bdc9457SAndroid Build Coastguard Worker                   for (size_t oc = 0; oc < depth_multiplier; oc++) {
316*4bdc9457SAndroid Build Coastguard Worker                     accumulators[(((i * output_height + oy) * output_width + ox) * input_channels + g) * depth_multiplier + oc] +=
317*4bdc9457SAndroid Build Coastguard Worker                         (int32_t(input[((i * input_height + iy) * input_width + ix) * input_channel_stride + g]) - int32_t(input_zero_point)) *
318*4bdc9457SAndroid Build Coastguard Worker                         int32_t(filter[((ky * kernel_width + kx) * input_channels + g) * depth_multiplier + oc]);
319*4bdc9457SAndroid Build Coastguard Worker                   }
320*4bdc9457SAndroid Build Coastguard Worker                 }
321*4bdc9457SAndroid Build Coastguard Worker               }
322*4bdc9457SAndroid Build Coastguard Worker             }
323*4bdc9457SAndroid Build Coastguard Worker           }
324*4bdc9457SAndroid Build Coastguard Worker         }
325*4bdc9457SAndroid Build Coastguard Worker       }
326*4bdc9457SAndroid Build Coastguard Worker     }
327*4bdc9457SAndroid Build Coastguard Worker   }
328*4bdc9457SAndroid Build Coastguard Worker }
329*4bdc9457SAndroid Build Coastguard Worker 
compute_depthwise_convolution_qs8_reference_results(size_t batch_size,size_t output_height,size_t output_width,size_t input_height,size_t input_width,size_t input_padding_top,size_t input_padding_right,size_t input_padding_bottom,size_t input_padding_left,size_t kernel_height,size_t kernel_width,size_t subsampling_height,size_t subsampling_width,size_t dilation_height,size_t dilation_width,size_t input_channels,size_t depth_multiplier,int8_t input_zero_point,const std::vector<int8_t> & input,const std::vector<int8_t> & filter,std::vector<int32_t> & accumulators,bool has_bias,const std::vector<int32_t> & bias)330*4bdc9457SAndroid Build Coastguard Worker void compute_depthwise_convolution_qs8_reference_results(
331*4bdc9457SAndroid Build Coastguard Worker     size_t batch_size,
332*4bdc9457SAndroid Build Coastguard Worker     size_t output_height,
333*4bdc9457SAndroid Build Coastguard Worker     size_t output_width,
334*4bdc9457SAndroid Build Coastguard Worker     size_t input_height,
335*4bdc9457SAndroid Build Coastguard Worker     size_t input_width,
336*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_top,
337*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_right,
338*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_bottom,
339*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_left,
340*4bdc9457SAndroid Build Coastguard Worker     size_t kernel_height,
341*4bdc9457SAndroid Build Coastguard Worker     size_t kernel_width,
342*4bdc9457SAndroid Build Coastguard Worker     size_t subsampling_height,
343*4bdc9457SAndroid Build Coastguard Worker     size_t subsampling_width,
344*4bdc9457SAndroid Build Coastguard Worker     size_t dilation_height,
345*4bdc9457SAndroid Build Coastguard Worker     size_t dilation_width,
346*4bdc9457SAndroid Build Coastguard Worker     size_t input_channels,
347*4bdc9457SAndroid Build Coastguard Worker     size_t depth_multiplier,
348*4bdc9457SAndroid Build Coastguard Worker     int8_t input_zero_point,
349*4bdc9457SAndroid Build Coastguard Worker     const std::vector<int8_t>& input,
350*4bdc9457SAndroid Build Coastguard Worker     const std::vector<int8_t>& filter,
351*4bdc9457SAndroid Build Coastguard Worker     std::vector<int32_t>& accumulators,
352*4bdc9457SAndroid Build Coastguard Worker     bool has_bias,
353*4bdc9457SAndroid Build Coastguard Worker     const std::vector<int32_t>& bias)
354*4bdc9457SAndroid Build Coastguard Worker {
355*4bdc9457SAndroid Build Coastguard Worker   compute_depthwise_convolution_qs8_reference_results(
356*4bdc9457SAndroid Build Coastguard Worker     batch_size,
357*4bdc9457SAndroid Build Coastguard Worker     output_height,
358*4bdc9457SAndroid Build Coastguard Worker     output_width,
359*4bdc9457SAndroid Build Coastguard Worker     input_height,
360*4bdc9457SAndroid Build Coastguard Worker     input_width,
361*4bdc9457SAndroid Build Coastguard Worker     input_padding_top,
362*4bdc9457SAndroid Build Coastguard Worker     input_padding_right,
363*4bdc9457SAndroid Build Coastguard Worker     input_padding_bottom,
364*4bdc9457SAndroid Build Coastguard Worker     input_padding_left,
365*4bdc9457SAndroid Build Coastguard Worker     kernel_height,
366*4bdc9457SAndroid Build Coastguard Worker     kernel_width,
367*4bdc9457SAndroid Build Coastguard Worker     subsampling_height,
368*4bdc9457SAndroid Build Coastguard Worker     subsampling_width,
369*4bdc9457SAndroid Build Coastguard Worker     dilation_height,
370*4bdc9457SAndroid Build Coastguard Worker     dilation_width,
371*4bdc9457SAndroid Build Coastguard Worker     input_channels,
372*4bdc9457SAndroid Build Coastguard Worker     depth_multiplier,
373*4bdc9457SAndroid Build Coastguard Worker     input_channels,
374*4bdc9457SAndroid Build Coastguard Worker     input_zero_point,
375*4bdc9457SAndroid Build Coastguard Worker     input,
376*4bdc9457SAndroid Build Coastguard Worker     filter,
377*4bdc9457SAndroid Build Coastguard Worker     accumulators,
378*4bdc9457SAndroid Build Coastguard Worker     has_bias,
379*4bdc9457SAndroid Build Coastguard Worker     bias);
380*4bdc9457SAndroid Build Coastguard Worker }
381*4bdc9457SAndroid Build Coastguard Worker 
compute_depthwise_convolution_qu8_reference_results(size_t batch_size,size_t output_height,size_t output_width,size_t input_height,size_t input_width,size_t input_padding_top,size_t input_padding_right,size_t input_padding_bottom,size_t input_padding_left,size_t kernel_height,size_t kernel_width,size_t subsampling_height,size_t subsampling_width,size_t dilation_height,size_t dilation_width,size_t input_channels,size_t depth_multiplier,size_t input_channel_stride,uint8_t input_zero_point,uint8_t kernel_zero_point,const std::vector<uint8_t> & input,const std::vector<uint8_t> & filter,std::vector<int32_t> & accumulators,bool has_bias,const std::vector<int32_t> & bias)382*4bdc9457SAndroid Build Coastguard Worker void compute_depthwise_convolution_qu8_reference_results(
383*4bdc9457SAndroid Build Coastguard Worker     size_t batch_size,
384*4bdc9457SAndroid Build Coastguard Worker     size_t output_height,
385*4bdc9457SAndroid Build Coastguard Worker     size_t output_width,
386*4bdc9457SAndroid Build Coastguard Worker     size_t input_height,
387*4bdc9457SAndroid Build Coastguard Worker     size_t input_width,
388*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_top,
389*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_right,
390*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_bottom,
391*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_left,
392*4bdc9457SAndroid Build Coastguard Worker     size_t kernel_height,
393*4bdc9457SAndroid Build Coastguard Worker     size_t kernel_width,
394*4bdc9457SAndroid Build Coastguard Worker     size_t subsampling_height,
395*4bdc9457SAndroid Build Coastguard Worker     size_t subsampling_width,
396*4bdc9457SAndroid Build Coastguard Worker     size_t dilation_height,
397*4bdc9457SAndroid Build Coastguard Worker     size_t dilation_width,
398*4bdc9457SAndroid Build Coastguard Worker     size_t input_channels,
399*4bdc9457SAndroid Build Coastguard Worker     size_t depth_multiplier,
400*4bdc9457SAndroid Build Coastguard Worker     size_t input_channel_stride,
401*4bdc9457SAndroid Build Coastguard Worker     uint8_t input_zero_point,
402*4bdc9457SAndroid Build Coastguard Worker     uint8_t kernel_zero_point,
403*4bdc9457SAndroid Build Coastguard Worker     const std::vector<uint8_t>& input,
404*4bdc9457SAndroid Build Coastguard Worker     const std::vector<uint8_t>& filter,
405*4bdc9457SAndroid Build Coastguard Worker     std::vector<int32_t>& accumulators,
406*4bdc9457SAndroid Build Coastguard Worker     bool has_bias,
407*4bdc9457SAndroid Build Coastguard Worker     const std::vector<int32_t>& bias)
408*4bdc9457SAndroid Build Coastguard Worker {
409*4bdc9457SAndroid Build Coastguard Worker   if (!has_bias) {
410*4bdc9457SAndroid Build Coastguard Worker     std::fill(accumulators.begin(), accumulators.end(), 0);
411*4bdc9457SAndroid Build Coastguard Worker   }
412*4bdc9457SAndroid Build Coastguard Worker 
413*4bdc9457SAndroid Build Coastguard Worker   for (size_t i = 0; i < batch_size; i++) {
414*4bdc9457SAndroid Build Coastguard Worker     for (size_t oy = 0; oy < output_height; oy++) {
415*4bdc9457SAndroid Build Coastguard Worker       for (size_t ox = 0; ox < output_width; ox++) {
416*4bdc9457SAndroid Build Coastguard Worker         // Initialize Bias
417*4bdc9457SAndroid Build Coastguard Worker         if (has_bias) {
418*4bdc9457SAndroid Build Coastguard Worker           for (size_t g = 0; g < input_channels; g++) {
419*4bdc9457SAndroid Build Coastguard Worker             for (size_t oc = 0; oc < depth_multiplier; oc++) {
420*4bdc9457SAndroid Build Coastguard Worker               accumulators[(((i * output_height + oy) * output_width + ox) * input_channels + g) * depth_multiplier + oc] =
421*4bdc9457SAndroid Build Coastguard Worker                   bias[g * depth_multiplier + oc];
422*4bdc9457SAndroid Build Coastguard Worker             }
423*4bdc9457SAndroid Build Coastguard Worker           }
424*4bdc9457SAndroid Build Coastguard Worker         }
425*4bdc9457SAndroid Build Coastguard Worker         // Compute reference results.
426*4bdc9457SAndroid Build Coastguard Worker         for (size_t ky = 0; ky < kernel_height; ky++) {
427*4bdc9457SAndroid Build Coastguard Worker           const size_t iy = oy * subsampling_height + ky * dilation_height - input_padding_top;
428*4bdc9457SAndroid Build Coastguard Worker           if (iy < input_height) {
429*4bdc9457SAndroid Build Coastguard Worker             for (size_t kx = 0; kx < kernel_width; kx++) {
430*4bdc9457SAndroid Build Coastguard Worker               const size_t ix = ox * subsampling_width + kx * dilation_width - input_padding_left;
431*4bdc9457SAndroid Build Coastguard Worker               if (ix < input_width) {
432*4bdc9457SAndroid Build Coastguard Worker                 for (size_t g = 0; g < input_channels; g++) {
433*4bdc9457SAndroid Build Coastguard Worker                   for (size_t oc = 0; oc < depth_multiplier; oc++) {
434*4bdc9457SAndroid Build Coastguard Worker                     accumulators[(((i * output_height + oy) * output_width + ox) * input_channels + g) * depth_multiplier + oc] +=
435*4bdc9457SAndroid Build Coastguard Worker                         (int32_t(input[((i * input_height + iy) * input_width + ix) * input_channel_stride + g]) - int32_t(input_zero_point)) *
436*4bdc9457SAndroid Build Coastguard Worker                         (int32_t(filter[((ky * kernel_width + kx) * input_channels + g) * depth_multiplier + oc]) - int32_t(kernel_zero_point));
437*4bdc9457SAndroid Build Coastguard Worker                   }
438*4bdc9457SAndroid Build Coastguard Worker                 }
439*4bdc9457SAndroid Build Coastguard Worker               }
440*4bdc9457SAndroid Build Coastguard Worker             }
441*4bdc9457SAndroid Build Coastguard Worker           }
442*4bdc9457SAndroid Build Coastguard Worker         }
443*4bdc9457SAndroid Build Coastguard Worker       }
444*4bdc9457SAndroid Build Coastguard Worker     }
445*4bdc9457SAndroid Build Coastguard Worker   }
446*4bdc9457SAndroid Build Coastguard Worker }
447*4bdc9457SAndroid Build Coastguard Worker 
compute_depthwise_convolution_qu8_reference_results(size_t batch_size,size_t output_height,size_t output_width,size_t input_height,size_t input_width,size_t input_padding_top,size_t input_padding_right,size_t input_padding_bottom,size_t input_padding_left,size_t kernel_height,size_t kernel_width,size_t subsampling_height,size_t subsampling_width,size_t dilation_height,size_t dilation_width,size_t input_channels,size_t depth_multiplier,uint8_t input_zero_point,uint8_t kernel_zero_point,const std::vector<uint8_t> & input,const std::vector<uint8_t> & filter,std::vector<int32_t> & accumulators,bool has_bias,const std::vector<int32_t> & bias)448*4bdc9457SAndroid Build Coastguard Worker void compute_depthwise_convolution_qu8_reference_results(
449*4bdc9457SAndroid Build Coastguard Worker     size_t batch_size,
450*4bdc9457SAndroid Build Coastguard Worker     size_t output_height,
451*4bdc9457SAndroid Build Coastguard Worker     size_t output_width,
452*4bdc9457SAndroid Build Coastguard Worker     size_t input_height,
453*4bdc9457SAndroid Build Coastguard Worker     size_t input_width,
454*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_top,
455*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_right,
456*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_bottom,
457*4bdc9457SAndroid Build Coastguard Worker     size_t input_padding_left,
458*4bdc9457SAndroid Build Coastguard Worker     size_t kernel_height,
459*4bdc9457SAndroid Build Coastguard Worker     size_t kernel_width,
460*4bdc9457SAndroid Build Coastguard Worker     size_t subsampling_height,
461*4bdc9457SAndroid Build Coastguard Worker     size_t subsampling_width,
462*4bdc9457SAndroid Build Coastguard Worker     size_t dilation_height,
463*4bdc9457SAndroid Build Coastguard Worker     size_t dilation_width,
464*4bdc9457SAndroid Build Coastguard Worker     size_t input_channels,
465*4bdc9457SAndroid Build Coastguard Worker     size_t depth_multiplier,
466*4bdc9457SAndroid Build Coastguard Worker     uint8_t input_zero_point,
467*4bdc9457SAndroid Build Coastguard Worker     uint8_t kernel_zero_point,
468*4bdc9457SAndroid Build Coastguard Worker     const std::vector<uint8_t>& input,
469*4bdc9457SAndroid Build Coastguard Worker     const std::vector<uint8_t>& filter,
470*4bdc9457SAndroid Build Coastguard Worker     std::vector<int32_t>& accumulators,
471*4bdc9457SAndroid Build Coastguard Worker     bool has_bias,
472*4bdc9457SAndroid Build Coastguard Worker     const std::vector<int32_t>& bias)
473*4bdc9457SAndroid Build Coastguard Worker {
474*4bdc9457SAndroid Build Coastguard Worker   compute_depthwise_convolution_qu8_reference_results(
475*4bdc9457SAndroid Build Coastguard Worker     batch_size,
476*4bdc9457SAndroid Build Coastguard Worker     output_height,
477*4bdc9457SAndroid Build Coastguard Worker     output_width,
478*4bdc9457SAndroid Build Coastguard Worker     input_height,
479*4bdc9457SAndroid Build Coastguard Worker     input_width,
480*4bdc9457SAndroid Build Coastguard Worker     input_padding_top,
481*4bdc9457SAndroid Build Coastguard Worker     input_padding_right,
482*4bdc9457SAndroid Build Coastguard Worker     input_padding_bottom,
483*4bdc9457SAndroid Build Coastguard Worker     input_padding_left,
484*4bdc9457SAndroid Build Coastguard Worker     kernel_height,
485*4bdc9457SAndroid Build Coastguard Worker     kernel_width,
486*4bdc9457SAndroid Build Coastguard Worker     subsampling_height,
487*4bdc9457SAndroid Build Coastguard Worker     subsampling_width,
488*4bdc9457SAndroid Build Coastguard Worker     dilation_height,
489*4bdc9457SAndroid Build Coastguard Worker     dilation_width,
490*4bdc9457SAndroid Build Coastguard Worker     input_channels,
491*4bdc9457SAndroid Build Coastguard Worker     depth_multiplier,
492*4bdc9457SAndroid Build Coastguard Worker     input_channels,
493*4bdc9457SAndroid Build Coastguard Worker     input_zero_point,
494*4bdc9457SAndroid Build Coastguard Worker     kernel_zero_point,
495*4bdc9457SAndroid Build Coastguard Worker     input,
496*4bdc9457SAndroid Build Coastguard Worker     filter,
497*4bdc9457SAndroid Build Coastguard Worker     accumulators,
498*4bdc9457SAndroid Build Coastguard Worker     has_bias,
499*4bdc9457SAndroid Build Coastguard Worker     bias);
500*4bdc9457SAndroid Build Coastguard Worker }
501*4bdc9457SAndroid Build Coastguard Worker }
502