validation/reference/DepthwiseConvolutionLayer.cpp

*c217d954SCole Faust/*
*c217d954SCole Faust * Copyright (c) 2017-2020 Arm Limited.
*c217d954SCole Faust *
*c217d954SCole Faust * SPDX-License-Identifier: MIT
*c217d954SCole Faust *
*c217d954SCole Faust * Permission is hereby granted, free of charge, to any person obtaining a copy
*c217d954SCole Faust * of this software and associated documentation files (the "Software"), to
*c217d954SCole Faust * deal in the Software without restriction, including without limitation the
*c217d954SCole Faust * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
*c217d954SCole Faust * sell copies of the Software, and to permit persons to whom the Software is
*c217d954SCole Faust * furnished to do so, subject to the following conditions:
*c217d954SCole Faust *
*c217d954SCole Faust * The above copyright notice and this permission notice shall be included in all
*c217d954SCole Faust * copies or substantial portions of the Software.
*c217d954SCole Faust *
*c217d954SCole Faust * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
*c217d954SCole Faust * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
*c217d954SCole Faust * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
*c217d954SCole Faust * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
*c217d954SCole Faust * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
*c217d954SCole Faust * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
*c217d954SCole Faust * SOFTWARE.
*c217d954SCole Faust */
*c217d954SCole Faust#include "DepthwiseConvolutionLayer.h"
*c217d954SCole Faust
*c217d954SCole Faust#include "ConvolutionLayer.h"
*c217d954SCole Faust#include "Utils.h"
*c217d954SCole Faust
*c217d954SCole Faust#include "tests/validation/Helpers.h"
*c217d954SCole Faust#include "tests/validation/reference/Utils.h"
*c217d954SCole Faust#include "tests/validation/reference/UtilsQuantizedAsymm.h"
*c217d954SCole Faust
*c217d954SCole Faust#include "arm_compute/core/utils/quantization/AsymmHelpers.h"
*c217d954SCole Faust
*c217d954SCole Faustnamespace arm_compute
*c217d954SCole Faust{
*c217d954SCole Faustnamespace test
*c217d954SCole Faust{
*c217d954SCole Faustnamespace validation
*c217d954SCole Faust{
*c217d954SCole Faustnamespace reference
*c217d954SCole Faust{
*c217d954SCole Faustnamespace
*c217d954SCole Faust{
*c217d954SCole Faust/** Perform a depthwise convolution for floating-point types
*c217d954SCole Faust *
*c217d954SCole Faust * - Three dimensions tensors
*c217d954SCole Faust * - Third dimention is number of channels
*c217d954SCole Faust * - Depths of input tensor and filter are equals
*c217d954SCole Faust * - Padding, stride and output shape "match"
*c217d954SCole Faust *
*c217d954SCole Faust */
*c217d954SCole Fausttemplate <typename T>
*c217d954SCole FaustSimpleTensor<T> depthwise_convolution_fp(const SimpleTensor<T> &src, const SimpleTensor<T> &weights, const SimpleTensor<T> &biases, const TensorShape &dst_shape, const PadStrideInfo &conv_info,
*c217d954SCole Faust                                         unsigned int depth_multiplier, const Size2D &dilation, const QuantizationInfo &out_quant_info)
*c217d954SCole Faust{
*c217d954SCole Faust    ARM_COMPUTE_UNUSED(out_quant_info);
*c217d954SCole Faust
*c217d954SCole Faust    SimpleTensor<T> dst{ dst_shape, src.data_type(), 1 };
*c217d954SCole Faust
*c217d954SCole Faust    // Compute reference
*c217d954SCole Faust    const int filter_width  = weights.shape().x();
*c217d954SCole Faust    const int filter_height = weights.shape().y();
*c217d954SCole Faust    const int filter_plane  = filter_width * filter_height;
*c217d954SCole Faust    const int input_width   = src.shape().x();
*c217d954SCole Faust    const int input_height  = src.shape().y();
*c217d954SCole Faust    const int input_depth   = src.shape().z();
*c217d954SCole Faust    const int num_batches   = src.shape().total_size() / (input_width * input_height * input_depth);
*c217d954SCole Faust
*c217d954SCole Faust    const int pad_left = conv_info.pad_left();
*c217d954SCole Faust    const int pad_top  = conv_info.pad_top();
*c217d954SCole Faust
*c217d954SCole Faust    const float patch_width  = (filter_width + (dilation.x() - 1) * (filter_width - 1));
*c217d954SCole Faust    const float patch_height = (filter_height + (dilation.y() - 1) * (filter_height - 1));
*c217d954SCole Faust
*c217d954SCole Faust    const int patch_half_width_floor  = patch_width / 2;
*c217d954SCole Faust    const int patch_half_height_floor = patch_height / 2;
*c217d954SCole Faust
*c217d954SCole Faust    const auto patch_half_width_ceil  = static_cast<int>(std::ceil(patch_width / 2));
*c217d954SCole Faust    const auto patch_half_height_ceil = static_cast<int>(std::ceil(patch_height / 2));
*c217d954SCole Faust
*c217d954SCole Faust    const int minimum_x = -pad_left + patch_half_width_floor;
*c217d954SCole Faust    const int minimum_y = -pad_top + patch_half_height_floor;
*c217d954SCole Faust    const int maximum_x = (conv_info.stride().first * (dst_shape[0] - 1));
*c217d954SCole Faust    const int maximum_y = (conv_info.stride().second * (dst_shape[1] - 1));
*c217d954SCole Faust
*c217d954SCole Faust    const T border_value(0);
*c217d954SCole Faust
*c217d954SCole Faust    int out_pos = 0;
*c217d954SCole Faust    for(int r = 0; r < num_batches; ++r)
*c217d954SCole Faust    {
*c217d954SCole Faust        for(int z = 0; z < input_depth; ++z)
*c217d954SCole Faust        {
*c217d954SCole Faust            for(unsigned int m = 0; m < depth_multiplier; ++m)
*c217d954SCole Faust            {
*c217d954SCole Faust                const int out_z = z * depth_multiplier + m;
*c217d954SCole Faust
*c217d954SCole Faust                for(int y = minimum_y; y <= minimum_y + maximum_y; y += conv_info.stride().second)
*c217d954SCole Faust                {
*c217d954SCole Faust                    for(int x = minimum_x; x <= minimum_x + maximum_x; x += conv_info.stride().first)
*c217d954SCole Faust                    {
*c217d954SCole Faust                        Coordinates coords(static_cast<int>(x), static_cast<int>(y), static_cast<int>(z), static_cast<int>(r));
*c217d954SCole Faust                        size_t      filter_offset = filter_plane * out_z;
*c217d954SCole Faust
*c217d954SCole Faust                        T val(0);
*c217d954SCole Faust                        for(int j = y - patch_half_height_floor; j < y + patch_half_height_ceil; j += dilation.y())
*c217d954SCole Faust                        {
*c217d954SCole Faust                            for(int i = x - patch_half_width_floor; i < x + patch_half_width_ceil; i += dilation.x())
*c217d954SCole Faust                            {
*c217d954SCole Faust                                coords.set(0, i);
*c217d954SCole Faust                                coords.set(1, j);
*c217d954SCole Faust                                val += *(weights.data() + filter_offset) * tensor_elem_at(src, coords, BorderMode::CONSTANT, border_value);
*c217d954SCole Faust                                ++filter_offset;
*c217d954SCole Faust                            }
*c217d954SCole Faust                        }
*c217d954SCole Faust
*c217d954SCole Faust                        dst[out_pos++] = saturate_cast<T>(val + *static_cast<const T *>(biases(Coordinates(out_z))));
*c217d954SCole Faust                    }
*c217d954SCole Faust                }
*c217d954SCole Faust            }
*c217d954SCole Faust        }
*c217d954SCole Faust    }
*c217d954SCole Faust
*c217d954SCole Faust    return dst;
*c217d954SCole Faust}
*c217d954SCole Faust
*c217d954SCole Faust/** Perform a quantized depthwise convolution
*c217d954SCole Faust *
*c217d954SCole Faust * - Three dimensions tensors
*c217d954SCole Faust * - Third dimention is number of channels
*c217d954SCole Faust * - Depths of input tensor and filter are equals
*c217d954SCole Faust * - Padding, stride and output shape "match"
*c217d954SCole Faust * - QASYMM8/QASYMM8_SIGNED input, output
*c217d954SCole Faust * - QASYMM8/QASYMM8_SIGNED or QSYMM8_PER_CHANNEL filter
*c217d954SCole Faust *
*c217d954SCole Faust */
*c217d954SCole Fausttemplate <typename T, typename TW, typename TB>
*c217d954SCole FaustSimpleTensor<T> depthwise_convolution_quantized(const SimpleTensor<T> &src, const SimpleTensor<TW> &weights, const SimpleTensor<int32_t> &biases, const TensorShape &dst_shape,
*c217d954SCole Faust                                                const PadStrideInfo &conv_info, unsigned int depth_multiplier, const Size2D &dilation, const QuantizationInfo &out_quant_info)
*c217d954SCole Faust{
*c217d954SCole Faust    // if no explicit quantization has been set you the same as src
*c217d954SCole Faust    const QuantizationInfo &dst_qinfo = out_quant_info.uniform().empty() ? src.quantization_info() : out_quant_info;
*c217d954SCole Faust    SimpleTensor<T>         dst{ dst_shape, src.data_type(), 1, dst_qinfo };
*c217d954SCole Faust
*c217d954SCole Faust    // Create reference
*c217d954SCole Faust    const int   input_offset   = -src.quantization_info().uniform().offset;
*c217d954SCole Faust    const float input_scale    = src.quantization_info().uniform().scale;
*c217d954SCole Faust    const int   weights_offset = -weights.quantization_info().uniform().offset;
*c217d954SCole Faust    const int   output_offset  = dst_qinfo.uniform().offset;
*c217d954SCole Faust    const float output_scale   = dst_qinfo.uniform().scale;
*c217d954SCole Faust
*c217d954SCole Faust    const std::vector<float> weights_scale_vec = weights.quantization_info().scale();
*c217d954SCole Faust
*c217d954SCole Faust    // Compute reference
*c217d954SCole Faust    const int filter_width  = weights.shape().x();
*c217d954SCole Faust    const int filter_height = weights.shape().y();
*c217d954SCole Faust    const int filter_plane  = filter_width * filter_height;
*c217d954SCole Faust    const int input_width   = src.shape().x();
*c217d954SCole Faust    const int input_height  = src.shape().y();
*c217d954SCole Faust    const int input_depth   = src.shape().z();
*c217d954SCole Faust    const int num_batches   = src.shape().total_size() / (input_width * input_height * input_depth);
*c217d954SCole Faust
*c217d954SCole Faust    const int pad_left = conv_info.pad_left();
*c217d954SCole Faust    const int pad_top  = conv_info.pad_top();
*c217d954SCole Faust
*c217d954SCole Faust    const float patch_width  = (filter_width + (dilation.x() - 1) * (filter_width - 1));
*c217d954SCole Faust    const float patch_height = (filter_height + (dilation.y() - 1) * (filter_height - 1));
*c217d954SCole Faust
*c217d954SCole Faust    const int patch_half_width_floor  = patch_width / 2;
*c217d954SCole Faust    const int patch_half_height_floor = patch_height / 2;
*c217d954SCole Faust
*c217d954SCole Faust    const auto patch_half_width_ceil  = static_cast<int>(std::ceil(patch_width / 2));
*c217d954SCole Faust    const auto patch_half_height_ceil = static_cast<int>(std::ceil(patch_height / 2));
*c217d954SCole Faust
*c217d954SCole Faust    const int minimum_x = -pad_left + patch_half_width_floor;
*c217d954SCole Faust    const int minimum_y = -pad_top + patch_half_height_floor;
*c217d954SCole Faust    const int maximum_x = (conv_info.stride().first * (dst_shape[0] - 1));
*c217d954SCole Faust    const int maximum_y = (conv_info.stride().second * (dst_shape[1] - 1));
*c217d954SCole Faust
*c217d954SCole Faust    const bool is_quantized_per_channel = is_data_type_quantized_per_channel(weights.data_type());
*c217d954SCole Faust
*c217d954SCole Faust    const int min = std::numeric_limits<T>::lowest();
*c217d954SCole Faust    const int max = std::numeric_limits<T>::max();
*c217d954SCole Faust
*c217d954SCole Faust    int out_pos = 0;
*c217d954SCole Faust    for(int r = 0; r < num_batches; ++r)
*c217d954SCole Faust    {
*c217d954SCole Faust        for(int z = 0; z < input_depth; ++z)
*c217d954SCole Faust        {
*c217d954SCole Faust            for(unsigned int m = 0; m < depth_multiplier; ++m)
*c217d954SCole Faust            {
*c217d954SCole Faust                const int     out_z    = z * depth_multiplier + m;
*c217d954SCole Faust                const int32_t bias_val = *static_cast<const int32_t *>(biases(Coordinates(out_z)));
*c217d954SCole Faust
*c217d954SCole Faust                int         output_multiplier = 0;
*c217d954SCole Faust                int         output_shift      = 0;
*c217d954SCole Faust                const float weights_scale     = (is_quantized_per_channel) ? weights_scale_vec[out_z] : weights_scale_vec[0];
*c217d954SCole Faust                const float multiplier        = input_scale * weights_scale / output_scale;
*c217d954SCole Faust                arm_compute::quantization::calculate_quantized_multiplier(multiplier, &output_multiplier, &output_shift);
*c217d954SCole Faust
*c217d954SCole Faust                for(int y = minimum_y; y <= minimum_y + maximum_y; y += conv_info.stride().second)
*c217d954SCole Faust                {
*c217d954SCole Faust                    for(int x = minimum_x; x <= minimum_x + maximum_x; x += conv_info.stride().first)
*c217d954SCole Faust                    {
*c217d954SCole Faust                        Coordinates coords(x, y, z, r);
*c217d954SCole Faust                        int         filter_offset = filter_plane * out_z;
*c217d954SCole Faust
*c217d954SCole Faust                        int32_t val = 0;
*c217d954SCole Faust                        for(int j = y - patch_half_height_floor; j < y + patch_half_height_ceil; j += dilation.y())
*c217d954SCole Faust                        {
*c217d954SCole Faust                            for(int i = x - patch_half_width_floor; i < x + patch_half_width_ceil; i += dilation.x())
*c217d954SCole Faust                            {
*c217d954SCole Faust                                coords.set(0, i);
*c217d954SCole Faust                                coords.set(1, j);
*c217d954SCole Faust                                const auto in_val = tensor_elem_at<T>(src, coords, BorderMode::CONSTANT, -input_offset);
*c217d954SCole Faust                                const TW   w_val  = *(weights.data() + filter_offset);
*c217d954SCole Faust                                val += (in_val + input_offset) * (w_val + weights_offset);
*c217d954SCole Faust                                ++filter_offset;
*c217d954SCole Faust                            }
*c217d954SCole Faust                        }
*c217d954SCole Faust                        val += bias_val;
*c217d954SCole Faust                        // Quantize down
*c217d954SCole Faust                        val = quantize_down_scale_by_fixedpoint(val, output_multiplier, output_shift, output_offset, min, max);
*c217d954SCole Faust
*c217d954SCole Faust                        // Store the result
*c217d954SCole Faust                        dst[out_pos++] = val;
*c217d954SCole Faust                    }
*c217d954SCole Faust                }
*c217d954SCole Faust            }
*c217d954SCole Faust        }
*c217d954SCole Faust    }
*c217d954SCole Faust
*c217d954SCole Faust    return dst;
*c217d954SCole Faust}
*c217d954SCole Faust} // namespace
*c217d954SCole Faust
*c217d954SCole Fausttemplate <>
*c217d954SCole FaustSimpleTensor<float> depthwise_convolution(const SimpleTensor<float> &src, const SimpleTensor<float> &weights, const SimpleTensor<float> &biases, const TensorShape &dst_shape,
*c217d954SCole Faust                                          const PadStrideInfo &conv_info, unsigned int depth_multiplier, const Size2D &dilation, const QuantizationInfo &out_quant_info)
*c217d954SCole Faust{
*c217d954SCole Faust    return depthwise_convolution_fp(src, weights, biases, dst_shape, conv_info, depth_multiplier, dilation, out_quant_info);
*c217d954SCole Faust}
*c217d954SCole Faust
*c217d954SCole Fausttemplate <>
*c217d954SCole FaustSimpleTensor<half> depthwise_convolution(const SimpleTensor<half> &src, const SimpleTensor<half> &weights, const SimpleTensor<half> &biases, const TensorShape &dst_shape,
*c217d954SCole Faust                                         const PadStrideInfo &conv_info, unsigned int depth_multiplier, const Size2D &dilation, const QuantizationInfo &out_quant_info)
*c217d954SCole Faust{
*c217d954SCole Faust    return depthwise_convolution_fp(src, weights, biases, dst_shape, conv_info, depth_multiplier, dilation, out_quant_info);
*c217d954SCole Faust}
*c217d954SCole Faust
*c217d954SCole Fausttemplate <>
*c217d954SCole FaustSimpleTensor<uint8_t> depthwise_convolution(const SimpleTensor<uint8_t> &src, const SimpleTensor<uint8_t> &weights, const SimpleTensor<int32_t> &biases, const TensorShape &dst_shape,
*c217d954SCole Faust                                            const PadStrideInfo &conv_info, unsigned int depth_multiplier, const Size2D &dilation, const QuantizationInfo &out_quant_info)
*c217d954SCole Faust{
*c217d954SCole Faust    return depthwise_convolution_quantized<uint8_t, uint8_t, int32_t>(src, weights, biases, dst_shape, conv_info, depth_multiplier, dilation, out_quant_info);
*c217d954SCole Faust}
*c217d954SCole Faust
*c217d954SCole Fausttemplate <>
*c217d954SCole FaustSimpleTensor<uint8_t> depthwise_convolution(const SimpleTensor<uint8_t> &src, const SimpleTensor<int8_t> &weights, const SimpleTensor<int32_t> &biases, const TensorShape &dst_shape,
*c217d954SCole Faust                                            const PadStrideInfo &conv_info, unsigned int depth_multiplier, const Size2D &dilation, const QuantizationInfo &out_quant_info)
*c217d954SCole Faust{
*c217d954SCole Faust    return depthwise_convolution_quantized<uint8_t, int8_t, int32_t>(src, weights, biases, dst_shape, conv_info, depth_multiplier, dilation, out_quant_info);
*c217d954SCole Faust}
*c217d954SCole Faust
*c217d954SCole Fausttemplate <>
*c217d954SCole FaustSimpleTensor<int8_t> depthwise_convolution(const SimpleTensor<int8_t> &src, const SimpleTensor<int8_t> &weights, const SimpleTensor<int32_t> &biases, const TensorShape &dst_shape,
*c217d954SCole Faust                                           const PadStrideInfo &conv_info, unsigned int depth_multiplier, const Size2D &dilation, const QuantizationInfo &out_quant_info)
*c217d954SCole Faust{
*c217d954SCole Faust    return depthwise_convolution_quantized<int8_t, int8_t, int32_t>(src, weights, biases, dst_shape, conv_info, depth_multiplier, dilation, out_quant_info);
*c217d954SCole Faust}
*c217d954SCole Faust} // namespace reference
*c217d954SCole Faust} // namespace validation
*c217d954SCole Faust} // namespace test
*c217d954SCole Faust} // namespace arm_compute