blob: 207e5fc45c49fb3a682263da97ad79e628b968ae [file] [log] [blame]
Giorgio Arena93a690e2017-08-01 16:09:33 +01001/*
Georgios Pinitasf72f9362018-01-12 16:29:45 +00002 * Copyright (c) 2017-2018 ARM Limited.
Giorgio Arena93a690e2017-08-01 16:09:33 +01003 *
4 * SPDX-License-Identifier: MIT
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to
8 * deal in the Software without restriction, including without limitation the
9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10 * sell copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 */
Giorgio Arena04a8f8c2017-11-23 11:45:24 +000024#include "DepthwiseConvolutionLayer.h"
Giorgio Arena93a690e2017-08-01 16:09:33 +010025
26#include "ConvolutionLayer.h"
Giorgio Arena1ed1fc62018-03-26 16:20:05 +010027#include "Permute.h"
Isabella Gottardi1fab09f2017-07-13 15:55:57 +010028#include "Utils.h"
Giorgio Arena93a690e2017-08-01 16:09:33 +010029
Dmitry Savenkod7295b72017-11-20 22:00:08 +070030#include "tests/validation/FixedPoint.h"
Moritz Pflanzera09de0c2017-09-01 20:41:12 +010031#include "tests/validation/Helpers.h"
Georgios Pinitas5a7e7762017-12-01 16:27:29 +000032#include "tests/validation/reference/Utils.h"
33#include "tests/validation/reference/UtilsQuantizedAsymm.h"
Giorgio Arena93a690e2017-08-01 16:09:33 +010034
Dmitry Savenkod7295b72017-11-20 22:00:08 +070035#include "arm_compute/core/utils/quantization/AsymmHelpers.h"
36
Giorgio Arena93a690e2017-08-01 16:09:33 +010037namespace arm_compute
38{
39namespace test
40{
41namespace validation
42{
43namespace reference
44{
45/** Perform a depthwise convolution
46 *
47 * - Three dimensions tensors
48 * - Third dimention is number of channels
49 * - Depths of input tensor and filter are equals
50 * - Padding, stride and output shape "match"
51 *
52 */
Dmitry Savenkod7295b72017-11-20 22:00:08 +070053template <typename T, typename TB>
Giorgio Arena76572242018-04-04 17:44:26 +010054void depthwise_convolution_nchw(const SimpleTensor<T> &src, const SimpleTensor<T> &weights, const SimpleTensor<TB> &biases, SimpleTensor<T> &dst, const PadStrideInfo &conv_info,
55 unsigned int depth_multiplier)
Giorgio Arena93a690e2017-08-01 16:09:33 +010056{
Giorgio Arena93a690e2017-08-01 16:09:33 +010057 // Compute reference
Jaroslaw Rzepeckia1ed41f2017-10-13 11:13:58 +010058 const int filter_width = weights.shape().x();
59 const int filter_height = weights.shape().y();
60 const int filter_plane = filter_width * filter_height;
61 const int input_width = src.shape().x();
62 const int input_height = src.shape().y();
63 const int input_depth = src.shape().z();
64 const int num_batches = src.shape().total_size() / (input_width * input_height * input_depth);
Giorgio Arena93a690e2017-08-01 16:09:33 +010065
Jaroslaw Rzepeckia1ed41f2017-10-13 11:13:58 +010066 const int filter_half_width = filter_width / 2;
67 const int filter_half_height = filter_height / 2;
68
Georgios Pinitas4074c992018-01-30 18:13:46 +000069 const int pad_left = conv_info.pad_left();
70 const int pad_top = conv_info.pad_top();
71 const int pad_right = conv_info.pad_right();
72 const int pad_bottom = conv_info.pad_bottom();
Jaroslaw Rzepeckia1ed41f2017-10-13 11:13:58 +010073
74 const int minimum_x = -pad_left + filter_half_width;
75 const int minimum_y = -pad_top + filter_half_height;
76 const int maximum_x = input_width + pad_left - filter_half_width + pad_right - filter_half_width;
77 const int maximum_y = input_height + pad_top - filter_half_height + pad_bottom - filter_half_height;
Giorgio Arena93a690e2017-08-01 16:09:33 +010078
Giorgio Arena76572242018-04-04 17:44:26 +010079 const T border_value(0);
80
Giorgio Arena93a690e2017-08-01 16:09:33 +010081 int out_pos = 0;
Giorgio Arena9fe41442017-08-23 16:36:24 +010082 for(int r = 0; r < num_batches; ++r)
Giorgio Arena93a690e2017-08-01 16:09:33 +010083 {
Jaroslaw Rzepeckia1ed41f2017-10-13 11:13:58 +010084 for(int z = 0; z < input_depth; ++z)
Giorgio Arena93a690e2017-08-01 16:09:33 +010085 {
Giorgio Arena76572242018-04-04 17:44:26 +010086 for(unsigned int m = 0; m < depth_multiplier; ++m)
Giorgio Arena93a690e2017-08-01 16:09:33 +010087 {
Giorgio Arena76572242018-04-04 17:44:26 +010088 const int out_z = z * depth_multiplier + m;
Giorgio Arena9fe41442017-08-23 16:36:24 +010089
Giorgio Arena76572242018-04-04 17:44:26 +010090 for(int y = minimum_y; y < minimum_y + maximum_y; y += conv_info.stride().second)
91 {
92 for(int x = minimum_x; x < minimum_x + maximum_x; x += conv_info.stride().first)
Giorgio Arena93a690e2017-08-01 16:09:33 +010093 {
Giorgio Arena76572242018-04-04 17:44:26 +010094 Coordinates coords(static_cast<int>(x), static_cast<int>(y), static_cast<int>(z), static_cast<int>(r));
95 size_t filter_offset = filter_plane * out_z;
96
97 T val(0);
98 for(int j = y - filter_half_height; j <= static_cast<int>(y + filter_half_height); ++j)
Giorgio Arena9fe41442017-08-23 16:36:24 +010099 {
Giorgio Arena76572242018-04-04 17:44:26 +0100100 for(int i = x - filter_half_width; i <= static_cast<int>(x + filter_half_width); ++i)
101 {
102 coords.set(0, i);
103 coords.set(1, j);
104
105 val += *(weights.data() + filter_offset) * tensor_elem_at(src, coords, BorderMode::CONSTANT, border_value);
106 ++filter_offset;
107 }
Giorgio Arena9fe41442017-08-23 16:36:24 +0100108 }
Giorgio Arena76572242018-04-04 17:44:26 +0100109
110 dst[out_pos++] = saturate_cast<T>(val + *static_cast<const TB *>(biases(Coordinates(out_z))));
Giorgio Arena93a690e2017-08-01 16:09:33 +0100111 }
112 }
Giorgio Arena93a690e2017-08-01 16:09:33 +0100113 }
114 }
115 }
Giorgio Arena93a690e2017-08-01 16:09:33 +0100116}
117
Giorgio Arena76572242018-04-04 17:44:26 +0100118void depthwise_convolution_nchw(const SimpleTensor<uint8_t> &src, const SimpleTensor<uint8_t> &weights, const SimpleTensor<int32_t> &biases, SimpleTensor<uint8_t> &dst, const PadStrideInfo &conv_info,
119 unsigned int depth_multiplier)
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700120{
121 // Create reference
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700122 const int input_offset = -src.quantization_info().offset;
123 const float input_scale = src.quantization_info().scale;
124 const int weights_offset = -weights.quantization_info().offset;
125 const float weights_scale = weights.quantization_info().scale;
126 const int output_offset = dst.quantization_info().offset;
127 const float output_scale = dst.quantization_info().scale;
128
129 int output_multiplier;
130 int output_shift;
131 const float multiplier = input_scale * weights_scale / output_scale;
132 arm_compute::quantization::calculate_quantized_multiplier_less_than_one(multiplier, &output_multiplier, &output_shift);
133
134 // Compute reference
135 const int filter_width = weights.shape().x();
136 const int filter_height = weights.shape().y();
137 const int filter_plane = filter_width * filter_height;
138 const int input_width = src.shape().x();
139 const int input_height = src.shape().y();
140 const int input_depth = src.shape().z();
Georgios Pinitasb6f182d32017-11-29 10:17:56 +0000141 const int num_batches = src.shape().total_size() / (input_width * input_height * input_depth);
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700142
Georgios Pinitasd05dce42018-01-22 16:29:17 +0000143 const int filter_half_width = filter_width / 2;
144 const int filter_half_height = filter_height / 2;
145
Georgios Pinitas15997872018-02-19 13:58:22 +0000146 const int pad_left = conv_info.pad_left();
147 const int pad_top = conv_info.pad_top();
148 const int pad_right = conv_info.pad_right();
149 const int pad_bottom = conv_info.pad_bottom();
Georgios Pinitasd05dce42018-01-22 16:29:17 +0000150
151 const int minimum_x = -pad_left + filter_half_width;
152 const int minimum_y = -pad_top + filter_half_height;
153 const int maximum_x = input_width + pad_left - filter_half_width + pad_right - filter_half_width;
154 const int maximum_y = input_height + pad_top - filter_half_height + pad_bottom - filter_half_height;
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700155
156 int out_pos = 0;
Georgios Pinitasb6f182d32017-11-29 10:17:56 +0000157 for(int r = 0; r < num_batches; ++r)
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700158 {
Georgios Pinitasb6f182d32017-11-29 10:17:56 +0000159 for(int z = 0; z < input_depth; ++z)
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700160 {
Giorgio Arena76572242018-04-04 17:44:26 +0100161 for(unsigned int m = 0; m < depth_multiplier; ++m)
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700162 {
Giorgio Arena76572242018-04-04 17:44:26 +0100163 const int out_z = z * depth_multiplier + m;
164 const int32_t bias_val = *static_cast<const int32_t *>(biases(Coordinates(out_z)));
165
166 for(int y = minimum_y; y < minimum_y + maximum_y; y += conv_info.stride().second)
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700167 {
Giorgio Arena76572242018-04-04 17:44:26 +0100168 for(int x = minimum_x; x < minimum_x + maximum_x; x += conv_info.stride().first)
Georgios Pinitasb6f182d32017-11-29 10:17:56 +0000169 {
Giorgio Arena76572242018-04-04 17:44:26 +0100170 Coordinates coords(x, y, z, r);
171 int filter_offset = filter_plane * out_z;
Georgios Pinitasb6f182d32017-11-29 10:17:56 +0000172
Giorgio Arena76572242018-04-04 17:44:26 +0100173 int32_t val = 0;
174 for(int j = y - filter_half_height; j <= (y + filter_half_height); ++j)
175 {
176 for(int i = x - filter_half_width; i <= (x + filter_half_width); ++i)
177 {
178 coords.set(0, i);
179 coords.set(1, j);
180 const auto in_val = tensor_elem_at<uint8_t>(src, coords, BorderMode::CONSTANT, -input_offset);
181 const uint8_t w_val = *(weights.data() + filter_offset);
182 val += (in_val + input_offset) * (w_val + weights_offset);
183 ++filter_offset;
184 }
185 }
186 val += bias_val;
187 val = asymm_rounding_divide_by_pow2(asymm_int_mult(val, output_multiplier), output_shift);
188 val += output_offset;
189 val = std::max<int32_t>(val, 0);
190 val = std::min<int32_t>(val, 255);
191
192 // Store the result
193 dst[out_pos++] = val;
194 }
Georgios Pinitasb6f182d32017-11-29 10:17:56 +0000195 }
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700196 }
197 }
198 }
Giorgio Arenadfca60b2018-01-31 10:30:59 +0000199}
200
Giorgio Arena76572242018-04-04 17:44:26 +0100201template <typename T, typename TB>
202SimpleTensor<T> depthwise_convolution(const SimpleTensor<T> &src, const SimpleTensor<T> &weights, const SimpleTensor<TB> &biases, const TensorShape &dst_shape, const PadStrideInfo &conv_info,
203 unsigned int depth_multiplier)
Giorgio Arenadfca60b2018-01-31 10:30:59 +0000204{
Giorgio Arena76572242018-04-04 17:44:26 +0100205 SimpleTensor<T> dst{ dst_shape, src.data_type(), 1, src.fixed_point_position(), src.quantization_info() };
Giorgio Arenadfca60b2018-01-31 10:30:59 +0000206
207 if(src.data_layout() == DataLayout::NHWC)
208 {
Giorgio Arena1ed1fc62018-03-26 16:20:05 +0100209 SimpleTensor<T> src_nchw = reference::permute<T>(src, PermutationVector(1U, 2U, 0U));
210 SimpleTensor<T> weights_nchw = reference::permute<T>(weights, PermutationVector(1U, 2U, 0U));
211 SimpleTensor<T> dst_nchw = reference::permute<T>(dst, PermutationVector(1U, 2U, 0U));
212
Giorgio Arena76572242018-04-04 17:44:26 +0100213 depthwise_convolution_nchw(src_nchw, weights_nchw, biases, dst_nchw, conv_info, depth_multiplier);
Giorgio Arena1ed1fc62018-03-26 16:20:05 +0100214
215 return reference::permute<T>(dst_nchw, PermutationVector(2U, 0U, 1U));
216 }
217
Giorgio Arena76572242018-04-04 17:44:26 +0100218 depthwise_convolution_nchw(src, weights, biases, dst, conv_info, depth_multiplier);
Giorgio Arena1ed1fc62018-03-26 16:20:05 +0100219
220 return dst;
221}
222
Giorgio Arena76572242018-04-04 17:44:26 +0100223template SimpleTensor<uint8_t> depthwise_convolution(const SimpleTensor<uint8_t> &src, const SimpleTensor<uint8_t> &weights, const SimpleTensor<int32_t> &biases, const TensorShape &dst_shape,
224 const PadStrideInfo &conv_info, unsigned int depth_multiplier);
225
Georgios Pinitas81a26ad2017-10-23 20:29:30 +0100226template SimpleTensor<float> depthwise_convolution(const SimpleTensor<float> &src, const SimpleTensor<float> &weights, const SimpleTensor<float> &biases, const TensorShape &dst_shape,
Giorgio Arena76572242018-04-04 17:44:26 +0100227 const PadStrideInfo &conv_info, unsigned int depth_multiplier);
Frank Lei8cdfdb82018-01-02 16:49:33 +0800228
229template SimpleTensor<half> depthwise_convolution(const SimpleTensor<half> &src, const SimpleTensor<half> &weights, const SimpleTensor<half> &biases, const TensorShape &dst_shape,
Giorgio Arena76572242018-04-04 17:44:26 +0100230 const PadStrideInfo &conv_info, unsigned int depth_multiplier);
Giorgio Arena93a690e2017-08-01 16:09:33 +0100231} // namespace reference
232} // namespace validation
233} // namespace test
234} // namespace arm_compute