blob: 229e044783d7473ee566fb9d777165ed93431ab6 [file] [log] [blame]
Giorgio Arena93a690e2017-08-01 16:09:33 +01001/*
2 * Copyright (c) 2017 ARM Limited.
3 *
4 * SPDX-License-Identifier: MIT
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to
8 * deal in the Software without restriction, including without limitation the
9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10 * sell copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 */
24#include "DepthwiseConvolution.h"
25
26#include "ConvolutionLayer.h"
Isabella Gottardi1fab09f2017-07-13 15:55:57 +010027#include "Utils.h"
Giorgio Arena93a690e2017-08-01 16:09:33 +010028
Dmitry Savenkod7295b72017-11-20 22:00:08 +070029#include "tests/validation/CPP/Utils.h"
30#include "tests/validation/CPP/UtilsQuantizedAsymm.h"
31#include "tests/validation/FixedPoint.h"
Moritz Pflanzera09de0c2017-09-01 20:41:12 +010032#include "tests/validation/Helpers.h"
Giorgio Arena93a690e2017-08-01 16:09:33 +010033
Dmitry Savenkod7295b72017-11-20 22:00:08 +070034#include "arm_compute/core/utils/quantization/AsymmHelpers.h"
35
Giorgio Arena93a690e2017-08-01 16:09:33 +010036namespace arm_compute
37{
38namespace test
39{
40namespace validation
41{
42namespace reference
43{
44/** Perform a depthwise convolution
45 *
46 * - Three dimensions tensors
47 * - Third dimention is number of channels
48 * - Depths of input tensor and filter are equals
49 * - Padding, stride and output shape "match"
50 *
51 */
Dmitry Savenkod7295b72017-11-20 22:00:08 +070052template <typename T, typename TB>
53SimpleTensor<T> depthwise_convolution(const SimpleTensor<T> &src, const SimpleTensor<T> &weights, const SimpleTensor<TB> &biases, const TensorShape &dst_shape, const PadStrideInfo &conv_info)
Giorgio Arena93a690e2017-08-01 16:09:33 +010054{
55 // Create reference
56 SimpleTensor<T> dst{ dst_shape, src.data_type(), 1, src.fixed_point_position() };
57
58 // Compute reference
Jaroslaw Rzepeckia1ed41f2017-10-13 11:13:58 +010059 const int filter_width = weights.shape().x();
60 const int filter_height = weights.shape().y();
61 const int filter_plane = filter_width * filter_height;
62 const int input_width = src.shape().x();
63 const int input_height = src.shape().y();
64 const int input_depth = src.shape().z();
65 const int num_batches = src.shape().total_size() / (input_width * input_height * input_depth);
Giorgio Arena93a690e2017-08-01 16:09:33 +010066
Jaroslaw Rzepeckia1ed41f2017-10-13 11:13:58 +010067 const int filter_half_width = filter_width / 2;
68 const int filter_half_height = filter_height / 2;
69
70 const int pad_left = std::min(static_cast<int>(conv_info.pad_left()), filter_half_width);
71 const int pad_top = std::min(static_cast<int>(conv_info.pad_top()), filter_half_height);
72 const int pad_right = std::min(static_cast<int>(conv_info.pad_right()), filter_half_width);
73 const int pad_bottom = std::min(static_cast<int>(conv_info.pad_bottom()), filter_half_height);
74
75 const int minimum_x = -pad_left + filter_half_width;
76 const int minimum_y = -pad_top + filter_half_height;
77 const int maximum_x = input_width + pad_left - filter_half_width + pad_right - filter_half_width;
78 const int maximum_y = input_height + pad_top - filter_half_height + pad_bottom - filter_half_height;
Giorgio Arena93a690e2017-08-01 16:09:33 +010079
80 int out_pos = 0;
Giorgio Arena9fe41442017-08-23 16:36:24 +010081 for(int r = 0; r < num_batches; ++r)
Giorgio Arena93a690e2017-08-01 16:09:33 +010082 {
Jaroslaw Rzepeckia1ed41f2017-10-13 11:13:58 +010083 for(int z = 0; z < input_depth; ++z)
Giorgio Arena93a690e2017-08-01 16:09:33 +010084 {
Jaroslaw Rzepeckia1ed41f2017-10-13 11:13:58 +010085 for(int y = minimum_y; y < minimum_y + maximum_y; y += conv_info.stride().second)
Giorgio Arena93a690e2017-08-01 16:09:33 +010086 {
Jaroslaw Rzepeckia1ed41f2017-10-13 11:13:58 +010087 for(int x = minimum_x; x < minimum_x + maximum_x; x += conv_info.stride().first)
Giorgio Arena93a690e2017-08-01 16:09:33 +010088 {
Giorgio Arena9fe41442017-08-23 16:36:24 +010089 Coordinates coords(static_cast<int>(x), static_cast<int>(y), static_cast<int>(z), static_cast<int>(r));
90 size_t filter_offset = filter_plane * z;
91
92 T val = 0;
93 for(int j = y - filter_half_height; j <= static_cast<int>(y + filter_half_height); ++j)
Giorgio Arena93a690e2017-08-01 16:09:33 +010094 {
Giorgio Arena9fe41442017-08-23 16:36:24 +010095 for(int i = x - filter_half_width; i <= static_cast<int>(x + filter_half_width); ++i)
96 {
97 coords.set(0, i);
98 coords.set(1, j);
99 val += *(weights.data() + filter_offset) * tensor_elem_at(src, coords, BorderMode::CONSTANT, 0.f);
100 ++filter_offset;
101 }
Giorgio Arena93a690e2017-08-01 16:09:33 +0100102 }
Giorgio Arena9fe41442017-08-23 16:36:24 +0100103 coords.set(0, x);
104 coords.set(1, y);
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700105 dst[out_pos++] = saturate_cast<T>(val + *static_cast<const TB *>(biases(Coordinates(z))));
Giorgio Arena93a690e2017-08-01 16:09:33 +0100106 }
Giorgio Arena93a690e2017-08-01 16:09:33 +0100107 }
108 }
109 }
110
111 return dst;
112}
113
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700114template <>
115SimpleTensor<uint8_t> depthwise_convolution(const SimpleTensor<uint8_t> &src, const SimpleTensor<uint8_t> &weights, const SimpleTensor<int32_t> &biases, const TensorShape &dst_shape,
116 const PadStrideInfo &conv_info)
117{
118 // Create reference
119 SimpleTensor<uint8_t> dst{ dst_shape, src.data_type(), 1, src.fixed_point_position(), src.quantization_info() };
120
121 const int input_offset = -src.quantization_info().offset;
122 const float input_scale = src.quantization_info().scale;
123 const int weights_offset = -weights.quantization_info().offset;
124 const float weights_scale = weights.quantization_info().scale;
125 const int output_offset = dst.quantization_info().offset;
126 const float output_scale = dst.quantization_info().scale;
127
128 int output_multiplier;
129 int output_shift;
130 const float multiplier = input_scale * weights_scale / output_scale;
131 arm_compute::quantization::calculate_quantized_multiplier_less_than_one(multiplier, &output_multiplier, &output_shift);
132
133 // Compute reference
134 const int filter_width = weights.shape().x();
135 const int filter_height = weights.shape().y();
136 const int filter_plane = filter_width * filter_height;
137 const int input_width = src.shape().x();
138 const int input_height = src.shape().y();
139 const int input_depth = src.shape().z();
Georgios Pinitasb6f182d32017-11-29 10:17:56 +0000140 const int num_batches = src.shape().total_size() / (input_width * input_height * input_depth);
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700141
142 const int filter_half_size = filter_width / 2;
143 const int pad_x = std::min(filter_half_size, static_cast<int>(conv_info.pad().first));
144 const int pad_y = std::min(filter_half_size, static_cast<int>(conv_info.pad().second));
145 const int minimum_x = -pad_x + filter_half_size;
146 const int minimum_y = -pad_y + filter_half_size;
147
148 int out_pos = 0;
Georgios Pinitasb6f182d32017-11-29 10:17:56 +0000149 for(int r = 0; r < num_batches; ++r)
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700150 {
Georgios Pinitasb6f182d32017-11-29 10:17:56 +0000151 for(int z = 0; z < input_depth; ++z)
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700152 {
Georgios Pinitasb6f182d32017-11-29 10:17:56 +0000153 int32_t bias_val = *static_cast<const int32_t *>(biases(Coordinates(z)));
154 for(int y = minimum_y; y < input_height + pad_y - filter_half_size; y += conv_info.stride().second)
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700155 {
Georgios Pinitasb6f182d32017-11-29 10:17:56 +0000156 for(int x = minimum_x; x < input_width + pad_x - filter_half_size; x += conv_info.stride().first)
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700157 {
Georgios Pinitasb6f182d32017-11-29 10:17:56 +0000158 Coordinates coords(x, y, z);
159 int filter_offset = filter_plane * z;
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700160
Georgios Pinitasb6f182d32017-11-29 10:17:56 +0000161 uint32_t val = 0;
162 for(int j = y - filter_half_size; j <= (y + filter_half_size); ++j)
163 {
164 for(int i = x - filter_half_size; i <= (x + filter_half_size); ++i)
165 {
166 coords.set(0, i);
167 coords.set(1, j);
168 auto in_val = tensor_elem_at<uint8_t>(src, coords, BorderMode::CONSTANT, 0);
169 uint8_t w_val = *(weights.data() + filter_offset);
170 val += (in_val + input_offset) * (w_val + weights_offset);
171 ++filter_offset;
172 }
173 }
174 val += bias_val;
175 val = asymm_rounding_divide_by_pow2(asymm_int_mult(val, output_multiplier), output_shift);
176 val += output_offset;
177 val = std::max<int32_t>(val, 0);
178 val = std::min<int32_t>(val, 255);
179
180 // Store the result
181 dst[out_pos++] = val;
182 }
Dmitry Savenkod7295b72017-11-20 22:00:08 +0700183 }
184 }
185 }
186
187 return dst;
188}
189
Georgios Pinitas81a26ad2017-10-23 20:29:30 +0100190template SimpleTensor<float> depthwise_convolution(const SimpleTensor<float> &src, const SimpleTensor<float> &weights, const SimpleTensor<float> &biases, const TensorShape &dst_shape,
191 const PadStrideInfo &conv_info);
Giorgio Arena93a690e2017-08-01 16:09:33 +0100192} // namespace reference
193} // namespace validation
194} // namespace test
195} // namespace arm_compute