xref: /aosp_15_r20/external/ComputeLibrary/src/graph/nodes/DepthwiseConvolutionLayerNode.cpp (revision c217d954acce2dbc11938adb493fc0abd69584f3)
1 /*
2  * Copyright (c) 2018-2019, 2021 Arm Limited.
3  *
4  * SPDX-License-Identifier: MIT
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a copy
7  * of this software and associated documentation files (the "Software"), to
8  * deal in the Software without restriction, including without limitation the
9  * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10  * sell copies of the Software, and to permit persons to whom the Software is
11  * furnished to do so, subject to the following conditions:
12  *
13  * The above copyright notice and this permission notice shall be included in all
14  * copies or substantial portions of the Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22  * SOFTWARE.
23  */
24 #include "arm_compute/graph/nodes/DepthwiseConvolutionLayerNode.h"
25 
26 #include "arm_compute/core/Utils.h"
27 #include "arm_compute/graph/Graph.h"
28 #include "arm_compute/graph/INodeVisitor.h"
29 #include "arm_compute/graph/Utils.h"
30 
31 namespace arm_compute
32 {
33 namespace graph
34 {
DepthwiseConvolutionLayerNode(PadStrideInfo info,int depth_multiplier,DepthwiseConvolutionMethod method,QuantizationInfo out_quant_info)35 DepthwiseConvolutionLayerNode::DepthwiseConvolutionLayerNode(PadStrideInfo info, int depth_multiplier, DepthwiseConvolutionMethod method,
36                                                              QuantizationInfo out_quant_info)
37     : _info(std::move(info)), _depth_multiplier(depth_multiplier), _method(method), _out_quant_info(std::move(out_quant_info)), _fused_activation()
38 {
39     _input_edges.resize(3, EmptyEdgeID);
40     _outputs.resize(1, NullTensorID);
41 }
42 
depth_multiplier() const43 int DepthwiseConvolutionLayerNode::depth_multiplier() const
44 {
45     return _depth_multiplier;
46 }
47 
set_depthwise_convolution_method(DepthwiseConvolutionMethod method)48 void DepthwiseConvolutionLayerNode::set_depthwise_convolution_method(DepthwiseConvolutionMethod method)
49 {
50     _method = method;
51 }
52 
depthwise_convolution_method() const53 DepthwiseConvolutionMethod DepthwiseConvolutionLayerNode::depthwise_convolution_method() const
54 {
55     return _method;
56 }
57 
convolution_info() const58 PadStrideInfo DepthwiseConvolutionLayerNode::convolution_info() const
59 {
60     return _info;
61 }
62 
fused_activation() const63 ActivationLayerInfo DepthwiseConvolutionLayerNode::fused_activation() const
64 {
65     return _fused_activation;
66 }
67 
set_fused_activation(ActivationLayerInfo fused_activation)68 void DepthwiseConvolutionLayerNode::set_fused_activation(ActivationLayerInfo fused_activation)
69 {
70     _fused_activation = fused_activation;
71 }
72 
set_convolution_info(PadStrideInfo info)73 void DepthwiseConvolutionLayerNode::set_convolution_info(PadStrideInfo info)
74 {
75     _info = info;
76 }
77 
/** Derive the output tensor descriptor of a depthwise convolution.
 *
 * The result starts as a copy of @p input_descriptor; only its width, height
 * and channel extents are overwritten. Width and height come from
 * scaled_dimensions() applied to the input and kernel spatial sizes, and the
 * channel extent is the input channel count multiplied by @p depth_multiplier.
 *
 * @param[in] input_descriptor   Descriptor of the input tensor; also provides the data layout.
 * @param[in] weights_descriptor Descriptor of the weights tensor; provides the kernel width and height.
 * @param[in] info               Pad/stride information forwarded to scaled_dimensions().
 * @param[in] depth_multiplier   Factor applied to the input channel count.
 *
 * @return The output tensor descriptor.
 */
TensorDescriptor DepthwiseConvolutionLayerNode::compute_output_descriptor(const TensorDescriptor &input_descriptor,
                                                                          const TensorDescriptor &weights_descriptor,
                                                                          const PadStrideInfo    &info,
                                                                          int                     depth_multiplier)
{
    // Extents read from the input and from the kernel.
    const unsigned int in_w = get_dimension_size(input_descriptor, DataLayoutDimension::WIDTH);
    const unsigned int in_h = get_dimension_size(input_descriptor, DataLayoutDimension::HEIGHT);
    const unsigned int in_c = get_dimension_size(input_descriptor, DataLayoutDimension::CHANNEL);
    const unsigned int k_w  = get_dimension_size(weights_descriptor, DataLayoutDimension::WIDTH);
    const unsigned int k_h  = get_dimension_size(weights_descriptor, DataLayoutDimension::HEIGHT);

    // scaled_dimensions() yields (width, height) as a pair.
    const auto         spatial = scaled_dimensions(in_w, in_h, k_w, k_h, info);
    const unsigned int out_w   = spatial.first;
    const unsigned int out_h   = spatial.second;
    const unsigned int out_c   = in_c * depth_multiplier;

    // Positions of each logical dimension inside the shape depend on the layout.
    const DataLayout layout  = input_descriptor.layout;
    const auto       idx_w   = get_dimension_idx(layout, DataLayoutDimension::WIDTH);
    const auto       idx_h   = get_dimension_idx(layout, DataLayoutDimension::HEIGHT);
    const auto       idx_c   = get_dimension_idx(layout, DataLayoutDimension::CHANNEL);

    // Everything not overwritten below is inherited from the input descriptor.
    TensorDescriptor result = input_descriptor;
    result.shape.set(idx_w, out_w);
    result.shape.set(idx_h, out_h);
    result.shape.set(idx_c, out_c);

    return result;
}
102 
forward_descriptors()103 bool DepthwiseConvolutionLayerNode::forward_descriptors()
104 {
105     if((input_id(0) != NullTensorID) && (input_id(1) != NullTensorID) && (output_id(0) != NullTensorID))
106     {
107         Tensor *dst = output(0);
108         ARM_COMPUTE_ERROR_ON(dst == nullptr);
109         dst->desc() = configure_output(0);
110         return true;
111     }
112     return false;
113 }
114 
configure_output(size_t idx) const115 TensorDescriptor DepthwiseConvolutionLayerNode::configure_output(size_t idx) const
116 {
117     ARM_COMPUTE_UNUSED(idx);
118     const Tensor *src     = input(0);
119     const Tensor *weights = input(1);
120 
121     ARM_COMPUTE_ERROR_ON(src == nullptr || weights == nullptr);
122 
123     TensorDescriptor output_info = compute_output_descriptor(src->desc(), weights->desc(), _info, _depth_multiplier);
124     if(!_out_quant_info.empty())
125     {
126         output_info.quant_info = _out_quant_info;
127     }
128 
129     return output_info;
130 }
131 
type() const132 NodeType DepthwiseConvolutionLayerNode::type() const
133 {
134     return DepthwiseConvolutionLayerNode::node_type;
135 }
136 
accept(INodeVisitor & v)137 void DepthwiseConvolutionLayerNode::accept(INodeVisitor &v)
138 {
139     v.visit(*this);
140 }
141 } // namespace graph
142 } // namespace arm_compute