xref: /aosp_15_r20/external/ComputeLibrary/src/cpu/kernels/CpuReshapeKernel.cpp (revision c217d954acce2dbc11938adb493fc0abd69584f3)
1 /*
2  * Copyright (c) 2017-2022 Arm Limited.
3  *
4  * SPDX-License-Identifier: MIT
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a copy
7  * of this software and associated documentation files (the "Software"), to
8  * deal in the Software without restriction, including without limitation the
9  * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10  * sell copies of the Software, and to permit persons to whom the Software is
11  * furnished to do so, subject to the following conditions:
12  *
13  * The above copyright notice and this permission notice shall be included in all
14  * copies or substantial portions of the Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22  * SOFTWARE.
23  */
24 #include "src/cpu/kernels/CpuReshapeKernel.h"
25 
26 #include "arm_compute/core/Error.h"
27 #include "arm_compute/core/Helpers.h"
28 #include "arm_compute/core/ITensor.h"
29 #include "arm_compute/core/TensorInfo.h"
30 #include "arm_compute/core/Types.h"
31 #include "arm_compute/core/Validate.h"
32 #include "src/core/CPP/Validate.h"
33 #include "src/core/NEON/INEKernel.h"
34 #include "src/core/helpers/AutoConfiguration.h"
35 #include "src/core/helpers/WindowHelpers.h"
36 
37 #include <cstdint>
38 
39 /** [NEReshapeLayerKernel Kernel] **/
40 namespace arm_compute
41 {
42 namespace cpu
43 {
44 namespace kernels
45 {
46 namespace
47 {
validate_arguments(const ITensorInfo * src,const ITensorInfo * dst)48 Status validate_arguments(const ITensorInfo *src, const ITensorInfo *dst)
49 {
50     ARM_COMPUTE_RETURN_ERROR_ON_NULLPTR(src, dst);
51     // Note: ARM_COMPUTE_RETURN_ERROR_ON_CPU_F16_UNSUPPORTED(src) is not needed here as this kernel doesn't use CPU FP16 instructions.
52     ARM_COMPUTE_RETURN_ERROR_ON(src->data_type() == DataType::UNKNOWN);
53 
54     if(dst->tensor_shape().total_size() != 0)
55     {
56         ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DATA_TYPES(src, dst);
57         ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_QUANTIZATION_INFO(src, dst);
58         ARM_COMPUTE_RETURN_ERROR_ON(src->tensor_shape().total_size() != dst->tensor_shape().total_size());
59     }
60 
61     return Status{};
62 }
63 
64 template <typename T>
reshape_tensor(const Window & window,const ITensor * src,ITensor * dst)65 inline void reshape_tensor(const Window &window, const ITensor *src, ITensor *dst)
66 {
67     const TensorShape &src_shape = src->info()->tensor_shape();
68     const TensorShape &dst_shape = dst->info()->tensor_shape();
69     Coordinates        dst_coord{};
70 
71     Iterator src_it(src, window);
72 
73     execute_window_loop(window, [&](const Coordinates & id)
74     {
75         dst_coord                                              = index2coords(dst_shape, coords2index(src_shape, id));
76         *reinterpret_cast<T *>(dst->ptr_to_element(dst_coord)) = *reinterpret_cast<T *>(src_it.ptr());
77     },
78     src_it);
79 }
80 } // namespace
81 
configure(const ITensorInfo * src,ITensorInfo * dst)82 void CpuReshapeKernel::configure(const ITensorInfo *src, ITensorInfo *dst)
83 {
84     ARM_COMPUTE_ERROR_ON_NULLPTR(src, dst);
85     ARM_COMPUTE_ERROR_THROW_ON(validate_arguments(src, dst));
86     ARM_COMPUTE_UNUSED(dst);
87 
88     // Configure kernel window
89     Window win = calculate_max_window(*src);
90 
91     ICpuKernel::configure(win);
92 }
93 
validate(const ITensorInfo * src,const ITensorInfo * dst)94 Status CpuReshapeKernel::validate(const ITensorInfo *src, const ITensorInfo *dst)
95 {
96     ARM_COMPUTE_RETURN_ON_ERROR(validate_arguments(src, dst));
97 
98     return Status{};
99 }
100 
run_op(ITensorPack & tensors,const Window & window,const ThreadInfo & info)101 void CpuReshapeKernel::run_op(ITensorPack &tensors, const Window &window, const ThreadInfo &info)
102 {
103     ARM_COMPUTE_UNUSED(info);
104     ARM_COMPUTE_ERROR_ON_UNCONFIGURED_KERNEL(this);
105     ARM_COMPUTE_ERROR_ON_INVALID_SUBWINDOW(ICpuKernel::window(), window);
106 
107     const auto src = tensors.get_const_tensor(TensorType::ACL_SRC);
108     auto       dst = tensors.get_tensor(TensorType::ACL_DST);
109 
110     switch(src->info()->data_type())
111     {
112         case DataType::U8:
113         case DataType::S8:
114         case DataType::QASYMM8:
115         case DataType::QASYMM8_SIGNED:
116             reshape_tensor<uint8_t>(window, src, dst);
117             break;
118         case DataType::U16:
119         case DataType::S16:
120         case DataType::F16:
121             reshape_tensor<uint16_t>(window, src, dst);
122             break;
123         case DataType::U32:
124         case DataType::S32:
125         case DataType::F32:
126             reshape_tensor<uint32_t>(window, src, dst);
127             break;
128         default:
129             ARM_COMPUTE_ERROR("Unsupported data type!");
130     }
131 }
132 
name() const133 const char *CpuReshapeKernel::name() const
134 {
135     return "CpuReshapeKernel";
136 }
137 
get_mws(const CPUInfo & platform,size_t thread_count) const138 size_t CpuReshapeKernel::get_mws(const CPUInfo &platform, size_t thread_count) const
139 {
140     ARM_COMPUTE_UNUSED(thread_count);
141     ARM_COMPUTE_UNUSED(platform);
142 
143     return ICPPKernel::default_mws;
144 }
145 
146 } // namespace kernels
147 } // namespace cpu
148 } // namespace arm_compute
149 /** [NEReshapeLayerKernel Kernel] **/
150