Home
last modified time | relevance | path

Searched refs:num_elems_processed_per_iteration (Results 1 – 25 of 38) sorted by relevance

12

/aosp_15_r20/external/ComputeLibrary/src/gpu/cl/kernels/
H A DClIm2ColKernel.cpp58 unsigned int num_elems_processed_per_iteration{}; member
96 …unsigned int num_elems_processed_per_iteration, bool is_padding_required_nchw, unsigned int num_gr… in validate_and_configure_window() argument
117 win = calculate_max_window(*src, Steps(num_elems_processed_per_iteration)); in validate_and_configure_window()
125 … Steps(num_elems_processed_per_iteration * conv_info.stride().first, conv_info.stride().second)); in validate_and_configure_window()
129 …eil_to_multiple(input_width + border.right, kernel_dims.width * num_elems_processed_per_iteration), in validate_and_configure_window()
164 unsigned int num_elems_processed_per_iteration = 1; in configure_opencl_kernel() local
191 num_elems_processed_per_iteration = std::min(2U, input_channel); in configure_opencl_kernel()
213 const unsigned int vec_size = num_elems_processed_per_iteration; in configure_opencl_kernel()
234 num_elems_processed_per_iteration = 4; in configure_opencl_kernel()
240 num_elems_processed_per_iteration = 1; in configure_opencl_kernel()
[all …]
H A DClWidthConcatenate4TensorsKernel.cpp88 const unsigned int num_elems_processed_per_iteration = adjust_vec_size(8, min_dimension); in configure() local
89 …gned int vec_size_leftover = dst->dimension(0) % num_elems_processed_per_iteration; in configure()
94 …uild_opts.add_option("-DVEC_SIZE=" + support::cpp11::to_string(num_elems_processed_per_iteration)); in configure()
97 …t::cpp11::to_string((src1->dimension(0) - vec_size_leftover) % num_elems_processed_per_iteration)); in configure()
98 …src1->dimension(0) + src2->dimension(0) - vec_size_leftover) % num_elems_processed_per_iteration)); in configure()
99 …src2->dimension(0) + src3->dimension(0) - vec_size_leftover) % num_elems_processed_per_iteration)); in configure()
136 Window win = calculate_max_window(*dst, Steps(num_elems_processed_per_iteration)); in configure()
H A DClWidthConcatenate2TensorsKernel.cpp84 const unsigned int num_elems_processed_per_iteration = adjust_vec_size(8, min_dimension); in configure() local
85 …gned int vec_size_leftover = dst->dimension(0) % num_elems_processed_per_iteration; in configure()
90 …uild_opts.add_option("-DVEC_SIZE=" + support::cpp11::to_string(num_elems_processed_per_iteration)); in configure()
93 …t::cpp11::to_string((src1->dimension(0) - vec_size_leftover) % num_elems_processed_per_iteration)); in configure()
123 Window win = calculate_max_window(*dst, Steps(num_elems_processed_per_iteration)); in configure()
H A DClHeightConcatenateKernel.cpp86 const unsigned int num_elems_processed_per_iteration = adjust_vec_size(4, src->dimension(0)); in configure() local
90 …uild_opts.add_option("-DVEC_SIZE=" + support::cpp11::to_string(num_elems_processed_per_iteration)); in configure()
92 …IZE_LEFTOVER=" + support::cpp11::to_string(src->dimension(0) % num_elems_processed_per_iteration)); in configure()
116 Window win = calculate_max_window(*src, Steps(num_elems_processed_per_iteration)); in configure()
H A DClWidthConcatenateKernel.cpp82 const unsigned int num_elems_processed_per_iteration = adjust_vec_size(16, src->dimension(0)); in configure() local
87 …uild_opts.add_option("-DVEC_SIZE=" + support::cpp11::to_string(num_elems_processed_per_iteration)); in configure()
88 …IZE_LEFTOVER=" + support::cpp11::to_string(src->dimension(0) % num_elems_processed_per_iteration)); in configure()
111 Window win = calculate_max_window(*src, Steps(num_elems_processed_per_iteration)); in configure()
H A DClDepthConcatenateKernel.cpp76 …const unsigned int num_elems_processed_per_iteration = adjust_vec_size(16 / src->element_size(), s… in configure() local
81 …uild_opts.add_option("-DVEC_SIZE=" + support::cpp11::to_string(num_elems_processed_per_iteration)); in configure()
82 …IZE_LEFTOVER=" + support::cpp11::to_string(src->dimension(0) % num_elems_processed_per_iteration)); in configure()
103 auto win = calculate_max_window(*dst, Steps(num_elems_processed_per_iteration)); in configure()
H A DClGemmLowpQuantizeDownInt32ScaleByFixedPointKernel.cpp97 const unsigned int num_elems_processed_per_iteration = adjust_vec_size(4, src->dimension(0)); in configure() local
103 …uild_opts.add_option("-DVEC_SIZE=" + support::cpp11::to_string(num_elems_processed_per_iteration)); in configure()
104 …IZE_LEFTOVER=" + support::cpp11::to_string(src->dimension(0) % num_elems_processed_per_iteration)); in configure()
124 auto win = calculate_max_window(*dst, Steps(num_elems_processed_per_iteration)); in configure()
H A DClGemmLowpQuantizeDownInt32ScaleByFloatKernel.cpp100 const unsigned int num_elems_processed_per_iteration = adjust_vec_size(4, src->dimension(0)); in configure() local
107 …uild_opts.add_option("-DVEC_SIZE=" + support::cpp11::to_string(num_elems_processed_per_iteration)); in configure()
108 …IZE_LEFTOVER=" + support::cpp11::to_string(src->dimension(0) % num_elems_processed_per_iteration)); in configure()
125 Window win = calculate_max_window(*src, Steps(num_elems_processed_per_iteration)); in configure()
H A DClBatchConcatenateKernel.cpp76 …const unsigned int num_elems_processed_per_iteration = adjust_vec_size(16 / src->element_size(), s… in configure() local
81 …uild_opts.add_option("-DVEC_SIZE=" + support::cpp11::to_string(num_elems_processed_per_iteration)); in configure()
82 …IZE_LEFTOVER=" + support::cpp11::to_string(src->dimension(0) % num_elems_processed_per_iteration)); in configure()
103 auto win = calculate_max_window(*dst, Steps(num_elems_processed_per_iteration)); in configure()
H A DClGemmLowpQuantizeDownInt32ScaleKernel.cpp97 const unsigned int num_elems_processed_per_iteration = adjust_vec_size(4, src->dimension(0)); in configure() local
103 …uild_opts.add_option("-DVEC_SIZE=" + support::cpp11::to_string(num_elems_processed_per_iteration)); in configure()
104 …IZE_LEFTOVER=" + support::cpp11::to_string(src->dimension(0) % num_elems_processed_per_iteration)); in configure()
124 Window win = calculate_max_window(*src, Steps(num_elems_processed_per_iteration)); in configure()
H A DClCastKernel.cpp96 …const unsigned int num_elems_processed_per_iteration = adjust_vec_size(16 / src->element_size(), s… in configure() local
100 …uild_opts.add_option("-DVEC_SIZE=" + support::cpp11::to_string(num_elems_processed_per_iteration)); in configure()
101 …IZE_LEFTOVER=" + support::cpp11::to_string(src->dimension(0) % num_elems_processed_per_iteration)); in configure()
114 Window win = calculate_max_window(*src, Steps(num_elems_processed_per_iteration)); in configure()
H A DClElementwiseKernel.cpp188 …const unsigned int num_elems_processed_per_iteration = adjust_vec_size(vector_size_byte_opencl / d… in generate_build_options_with_arithmetic_rules() local
191 …IN1=" + support::cpp11::to_string(src1.dimension(0) == 1 ? 1 : num_elems_processed_per_iteration)); in generate_build_options_with_arithmetic_rules()
192 …IN2=" + support::cpp11::to_string(src2.dimension(0) == 1 ? 1 : num_elems_processed_per_iteration)); in generate_build_options_with_arithmetic_rules()
193 …_opts.add_option("-DVEC_SIZE_OUT=" + support::cpp11::to_string(num_elems_processed_per_iteration)); in generate_build_options_with_arithmetic_rules()
194 …SIZE_LEFTOVER=" + support::cpp11::to_string(dst.dimension(0) % num_elems_processed_per_iteration)); in generate_build_options_with_arithmetic_rules()
222 …const unsigned int num_elems_processed_per_iteration = adjust_vec_size(vector_size_byte_opencl / d… in configure_window_arithmetic_common() local
223 … = calculate_max_window(dst, Steps(num_elems_processed_per_iteration)); in configure_window_arithmetic_common()
H A DClGemmLowpOffsetContributionKernel.cpp123 …const unsigned int num_elems_processed_per_iteration = adjust_vec_size(4, mm_result->dimension(0)); in configure() local
127 …uild_opts.add_option("-DVEC_SIZE=" + support::cpp11::to_string(num_elems_processed_per_iteration)); in configure()
128 …FTOVER=" + support::cpp11::to_string(mm_result->dimension(0) % num_elems_processed_per_iteration)); in configure()
152 Window win = calculate_max_window(*mm_result, Steps(num_elems_processed_per_iteration)); in configure()
H A DClActivationKernel.cpp110 …const unsigned int num_elems_processed_per_iteration = adjust_vec_size(16 / src->element_size(), s… in configure() local
130 …uild_opts.add_option("-DVEC_SIZE=" + support::cpp11::to_string(num_elems_processed_per_iteration)); in configure()
131 …IZE_LEFTOVER=" + support::cpp11::to_string(src->dimension(0) % num_elems_processed_per_iteration)); in configure()
209 Window win = calculate_max_window(*src, Steps(num_elems_processed_per_iteration)); in configure()
/aosp_15_r20/external/ComputeLibrary/src/core/CL/kernels/
H A DCLNormalizePlanarYUVLayerKernel.cpp69 const unsigned int num_elems_processed_per_iteration = 16 / input->element_size(); in validate_and_configure_window_nchw() local
71 Window win = calculate_max_window(*input, Steps(num_elems_processed_per_iteration)); in validate_and_configure_window_nchw()
73 AccessWindowHorizontal input_access(input, 0, num_elems_processed_per_iteration); in validate_and_configure_window_nchw()
74 AccessWindowHorizontal output_access(output, 0, num_elems_processed_per_iteration); in validate_and_configure_window_nchw()
113 …const unsigned int num_elems_processed_per_iteration = (data_layout == DataLayout::NHWC) ? adjust_… in configure() local
122 …ld_opts.add_option(("-DVEC_SIZE=" + support::cpp11::to_string(num_elems_processed_per_iteration))); in configure()
123 …R=" + support::cpp11::to_string(input->info()->dimension(0) % num_elems_processed_per_iteration))); in configure()
142 Window win = calculate_max_window(*input->info(), Steps(num_elems_processed_per_iteration)); in configure()
H A DCLBatchNormalizationLayerKernel.cpp86 …const unsigned int num_elems_processed_per_iteration = adjust_vec_size(16 / input->element_size(),… in validate_and_configure_window_nchw() local
89 …indow win = calculate_max_window(*input, Steps(num_elems_processed_per_iteration)); in validate_and_configure_window_nchw()
90 AccessWindowHorizontal input_access(input, 0, num_elems_processed_per_iteration); in validate_and_configure_window_nchw()
95 AccessWindowHorizontal output_access(output, 0, num_elems_processed_per_iteration); in validate_and_configure_window_nchw()
142 …unsigned int num_elems_processed_per_iteration = adjust_vec_size(16 / input->info()->element_size(… in configure() local
147 …uild_opts.add_option("-DVEC_SIZE=" + support::cpp11::to_string(num_elems_processed_per_iteration)); in configure()
148 …ER=" + support::cpp11::to_string(input->info()->dimension(0) % num_elems_processed_per_iteration)); in configure()
181 Window win = calculate_max_window(*input->info(), Steps(num_elems_processed_per_iteration)); in configure()
H A DCLComparisonKernel.cpp79 …const unsigned int num_elems_processed_per_iteration = calculate_num_elems_processed_per_iteration… in validate_and_configure_window() local
84 Window win = calculate_max_window(out_shape, Steps(num_elems_processed_per_iteration)); in validate_and_configure_window()
88 AccessWindowHorizontal input1_access(&input1, 0, num_elems_processed_per_iteration); in validate_and_configure_window()
89 AccessWindowHorizontal input2_access(&input2, 0, num_elems_processed_per_iteration); in validate_and_configure_window()
90 AccessWindowHorizontal output_access(&output, 0, num_elems_processed_per_iteration); in validate_and_configure_window()
220 …const int num_elems_processed_per_iteration = calculate_num_elems_processed_per_iteration(*_input1… in border_size() local
223 …const unsigned int border = std::min<unsigned int>(num_elems_processed_per_iteration - 1U, … in border_size()
H A DCLRangeKernel.cpp85 …unsigned int num_elems_processed_per_iteration = adjust_vec_size(vector_size_byte_opencl / output-… in configure() local
86 … = calculate_max_window(*output->info(), Steps(num_elems_processed_per_iteration)); in configure()
100 …d_opts.add_option("-DVECTOR_SIZE=" + support::cpp11::to_string(num_elems_processed_per_iteration)); in configure()
101 …R=" + support::cpp11::to_string(output->info()->dimension(0) % num_elems_processed_per_iteration)); in configure()
H A DCLQLSTMLayerNormalizationKernel.cpp50 …const uint32_t num_elems_processed_per_iteration = (input->dimension(0) < temp_num_elems_processed… in validate_and_configure_window() local
53 Window win = calculate_max_window(*input, Steps(num_elems_processed_per_iteration)); in validate_and_configure_window()
100 …const uint32_t num_elems_processed_per_iteration = max_cl_vector_width / input->info()->element_si… in configure() local
111 …uild_opts.add_option("-DVEC_SIZE=" + support::cpp11::to_string(num_elems_processed_per_iteration)); in configure()
/aosp_15_r20/external/ComputeLibrary/src/core/NEON/kernels/
H A DNEBitwiseOrKernel.cpp79 constexpr unsigned int num_elems_processed_per_iteration = 16; in configure() local
82 … win = calculate_max_window(*input1->info(), Steps(num_elems_processed_per_iteration)); in configure()
83 AccessWindowHorizontal output_access(output->info(), 0, num_elems_processed_per_iteration); in configure()
86 … AccessWindowHorizontal(input1->info(), 0, num_elems_processed_per_iteration), in configure()
87 … AccessWindowHorizontal(input2->info(), 0, num_elems_processed_per_iteration), in configure()
H A DNEBitwiseXorKernel.cpp79 constexpr unsigned int num_elems_processed_per_iteration = 16; in configure() local
81 … win = calculate_max_window(*input1->info(), Steps(num_elems_processed_per_iteration)); in configure()
82 AccessWindowHorizontal output_access(output->info(), 0, num_elems_processed_per_iteration); in configure()
84 …ndow_and_padding(win, AccessWindowHorizontal(input1->info(), 0, num_elems_processed_per_iteration), in configure()
85 … AccessWindowHorizontal(input2->info(), 0, num_elems_processed_per_iteration), output_access); in configure()
H A DNEBitwiseAndKernel.cpp83 constexpr unsigned int num_elems_processed_per_iteration = 16; in configure() local
86 … win = calculate_max_window(*input1->info(), Steps(num_elems_processed_per_iteration)); in configure()
87 AccessWindowHorizontal output_access(output->info(), 0, num_elems_processed_per_iteration); in configure()
90 … AccessWindowHorizontal(input1->info(), 0, num_elems_processed_per_iteration), in configure()
91 … AccessWindowHorizontal(input2->info(), 0, num_elems_processed_per_iteration), in configure()
H A DNEBitwiseNotKernel.cpp75 constexpr unsigned int num_elems_processed_per_iteration = 16; in configure() local
78 … win = calculate_max_window(*input->info(), Steps(num_elems_processed_per_iteration)); in configure()
79 AccessWindowHorizontal output_access(output->info(), 0, num_elems_processed_per_iteration); in configure()
80 …w_and_padding(win, AccessWindowHorizontal(input->info(), 0, num_elems_processed_per_iteration), ou… in configure()
/aosp_15_r20/external/ComputeLibrary/src/core/CL/
H A DICLSimpleKernel.cpp38 …ure(const ICLTensor *input, ICLTensor *output, unsigned int num_elems_processed_per_iteration, boo… in configure() argument
44 … win = calculate_max_window(*input->info(), Steps(num_elems_processed_per_iteration), bo… in configure()
45 AccessWindowHorizontal output_access(output->info(), 0, num_elems_processed_per_iteration); in configure()
48 … AccessWindowHorizontal(input->info(), 0, num_elems_processed_per_iteration), in configure()
/aosp_15_r20/external/ComputeLibrary/src/cpu/kernels/
H A DCpuPool2dKernel.cpp206 … unsigned int &num_elems_processed_per_iteration, in validate_and_configure_window() argument
232 num_elems_processed_per_iteration = 1; in validate_and_configure_window()
243 num_elems_processed_per_iteration = (pool_stride_x == 2) ? 8 : 15; in validate_and_configure_window()
246 num_elems_processed_per_iteration = (pool_stride_x == 2) ? 7 : 14; in validate_and_configure_window()
254 num_elems_processed_per_iteration = 1; in validate_and_configure_window()
258 num_elems_processed_per_iteration = 1; in validate_and_configure_window()
273 win = calculate_max_window(dst_info, Steps(num_elems_processed_per_iteration)); in validate_and_configure_window()
330 unsigned int num_elems_processed_per_iteration = 0; in validate() local
344 … (indices) ? indices->clone().get() : nullptr, pool_info, num_elems_processed_per_iteration, in validate()

12