blob: 4e615808fb9cd347e65914717151efc6c231b2a5 [file] [log] [blame]
Anthony Barbier6ff3b192017-09-04 18:44:23 +01001/*
Georgios Pinitasda953f22019-04-02 17:27:03 +01002 * Copyright (c) 2016-2019 ARM Limited.
Anthony Barbier6ff3b192017-09-04 18:44:23 +01003 *
4 * SPDX-License-Identifier: MIT
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to
8 * deal in the Software without restriction, including without limitation the
9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10 * sell copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 */
24#include "arm_compute/runtime/NEON/functions/NEHOGMultiDetection.h"
25
26#include "arm_compute/core/Error.h"
Anthony Barbier6ff3b192017-09-04 18:44:23 +010027#include "arm_compute/core/TensorInfo.h"
Moritz Pflanzerd0ae8b82017-06-29 14:51:57 +010028#include "arm_compute/core/Validate.h"
Anthony Barbier6ff3b192017-09-04 18:44:23 +010029#include "arm_compute/runtime/NEON/NEScheduler.h"
30#include "arm_compute/runtime/Tensor.h"
Moritz Pflanzerd0ae8b82017-06-29 14:51:57 +010031#include "support/ToolchainSupport.h"
Anthony Barbier6ff3b192017-09-04 18:44:23 +010032
33using namespace arm_compute;
34
Georgios Pinitas658039b2017-09-15 16:30:50 +010035NEHOGMultiDetection::NEHOGMultiDetection(std::shared_ptr<IMemoryManager> memory_manager) // NOLINT
36 : _memory_group(std::move(memory_manager)),
37 _gradient_kernel(),
Moritz Pflanzerf4af76e2017-09-06 07:42:43 +010038 _orient_bin_kernel(),
39 _block_norm_kernel(),
40 _hog_detect_kernel(),
41 _non_maxima_kernel(),
42 _hog_space(),
43 _hog_norm_space(),
44 _detection_windows(),
45 _mag(),
46 _phase(),
47 _non_maxima_suppression(false),
48 _num_orient_bin_kernel(0),
49 _num_block_norm_kernel(0),
50 _num_hog_detect_kernel(0)
Anthony Barbier6ff3b192017-09-04 18:44:23 +010051{
52}
53
54void NEHOGMultiDetection::configure(ITensor *input, const IMultiHOG *multi_hog, IDetectionWindowArray *detection_windows, const ISize2DArray *detection_window_strides, BorderMode border_mode,
55 uint8_t constant_border_value, float threshold, bool non_maxima_suppression, float min_distance)
56{
57 ARM_COMPUTE_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(input, 1, DataType::U8);
58 ARM_COMPUTE_ERROR_ON_INVALID_MULTI_HOG(multi_hog);
59 ARM_COMPUTE_ERROR_ON(nullptr == detection_windows);
60 ARM_COMPUTE_ERROR_ON(detection_window_strides->num_values() != multi_hog->num_models());
61
62 const size_t width = input->info()->dimension(Window::DimX);
63 const size_t height = input->info()->dimension(Window::DimY);
64 const TensorShape &shape_img = input->info()->tensor_shape();
65 const size_t num_models = multi_hog->num_models();
66 PhaseType phase_type = multi_hog->model(0)->info()->phase_type();
67
68 size_t prev_num_bins = multi_hog->model(0)->info()->num_bins();
69 Size2D prev_cell_size = multi_hog->model(0)->info()->cell_size();
70 Size2D prev_block_size = multi_hog->model(0)->info()->block_size();
71 Size2D prev_block_stride = multi_hog->model(0)->info()->block_stride();
72
73 /* Check if NEHOGOrientationBinningKernel and NEHOGBlockNormalizationKernel kernels can be skipped for a specific HOG data-object
74 *
75 * 1) NEHOGOrientationBinningKernel and NEHOGBlockNormalizationKernel are skipped if the cell size and the number of bins don't change.
76 * Since "multi_hog" is sorted,it is enough to check the HOG descriptors at level "ith" and level "(i-1)th
77 * 2) NEHOGBlockNormalizationKernel is skipped if the cell size, the number of bins and block size do not change.
78 * Since "multi_hog" is sorted,it is enough to check the HOG descriptors at level "ith" and level "(i-1)th
79 *
80 * @note Since the orientation binning and block normalization kernels can be skipped, we need to keep track of the input to process for each kernel
81 * with "input_orient_bin", "input_hog_detect" and "input_block_norm"
82 */
83 std::vector<size_t> input_orient_bin;
84 std::vector<size_t> input_hog_detect;
85 std::vector<std::pair<size_t, size_t>> input_block_norm;
86
87 input_orient_bin.push_back(0);
88 input_hog_detect.push_back(0);
89 input_block_norm.emplace_back(0, 0);
90
91 for(size_t i = 1; i < num_models; ++i)
92 {
93 size_t cur_num_bins = multi_hog->model(i)->info()->num_bins();
94 Size2D cur_cell_size = multi_hog->model(i)->info()->cell_size();
95 Size2D cur_block_size = multi_hog->model(i)->info()->block_size();
96 Size2D cur_block_stride = multi_hog->model(i)->info()->block_stride();
97
98 if((cur_num_bins != prev_num_bins) || (cur_cell_size.width != prev_cell_size.width) || (cur_cell_size.height != prev_cell_size.height))
99 {
100 prev_num_bins = cur_num_bins;
101 prev_cell_size = cur_cell_size;
102 prev_block_size = cur_block_size;
103 prev_block_stride = cur_block_stride;
104
105 // Compute orientation binning and block normalization kernels. Update input to process
106 input_orient_bin.push_back(i);
107 input_block_norm.emplace_back(i, input_orient_bin.size() - 1);
108 }
109 else if((cur_block_size.width != prev_block_size.width) || (cur_block_size.height != prev_block_size.height) || (cur_block_stride.width != prev_block_stride.width)
110 || (cur_block_stride.height != prev_block_stride.height))
111 {
112 prev_block_size = cur_block_size;
113 prev_block_stride = cur_block_stride;
114
115 // Compute block normalization kernel. Update input to process
116 input_block_norm.emplace_back(i, input_orient_bin.size() - 1);
117 }
118
119 // Update input to process for hog detector kernel
120 input_hog_detect.push_back(input_block_norm.size() - 1);
121 }
122
123 _detection_windows = detection_windows;
124 _non_maxima_suppression = non_maxima_suppression;
125 _num_orient_bin_kernel = input_orient_bin.size(); // Number of NEHOGOrientationBinningKernel kernels to compute
126 _num_block_norm_kernel = input_block_norm.size(); // Number of NEHOGBlockNormalizationKernel kernels to compute
127 _num_hog_detect_kernel = input_hog_detect.size(); // Number of NEHOGDetector functions to compute
128
Georgios Pinitas725b1732019-05-20 19:40:47 +0100129 _orient_bin_kernel.clear();
130 _block_norm_kernel.clear();
131 _hog_detect_kernel.clear();
132 _hog_space.clear();
133 _hog_norm_space.clear();
134
135 _orient_bin_kernel.resize(_num_orient_bin_kernel);
136 _block_norm_kernel.resize(_num_block_norm_kernel);
137 _hog_detect_kernel.resize(_num_hog_detect_kernel);
138 _hog_space.resize(_num_orient_bin_kernel);
139 _hog_norm_space.resize(_num_block_norm_kernel);
140 _non_maxima_kernel = CPPDetectionWindowNonMaximaSuppressionKernel();
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100141
142 // Allocate tensors for magnitude and phase
143 TensorInfo info_mag(shape_img, Format::S16);
144 _mag.allocator()->init(info_mag);
145
146 TensorInfo info_phase(shape_img, Format::U8);
147 _phase.allocator()->init(info_phase);
148
Georgios Pinitas658039b2017-09-15 16:30:50 +0100149 // Manage intermediate buffers
150 _memory_group.manage(&_mag);
151 _memory_group.manage(&_phase);
152
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100153 // Initialise gradient kernel
154 _gradient_kernel.configure(input, &_mag, &_phase, phase_type, border_mode, constant_border_value);
155
156 // Configure NETensor for the HOG space and orientation binning kernel
157 for(size_t i = 0; i < _num_orient_bin_kernel; ++i)
158 {
159 const size_t idx_multi_hog = input_orient_bin[i];
160
161 // Get the corresponding cell size and number of bins
162 const Size2D &cell = multi_hog->model(idx_multi_hog)->info()->cell_size();
163 const size_t num_bins = multi_hog->model(idx_multi_hog)->info()->num_bins();
164
165 // Calculate number of cells along the x and y directions for the hog_space
166 const size_t num_cells_x = width / cell.width;
167 const size_t num_cells_y = height / cell.height;
168
169 // TensorShape of hog space
170 TensorShape shape_hog_space = input->info()->tensor_shape();
171 shape_hog_space.set(Window::DimX, num_cells_x);
172 shape_hog_space.set(Window::DimY, num_cells_y);
173
174 // Allocate HOG space
175 TensorInfo info_space(shape_hog_space, num_bins, DataType::F32);
Georgios Pinitas725b1732019-05-20 19:40:47 +0100176 _hog_space[i].allocator()->init(info_space);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100177
Georgios Pinitas658039b2017-09-15 16:30:50 +0100178 // Manage intermediate buffers
Georgios Pinitas725b1732019-05-20 19:40:47 +0100179 _memory_group.manage(&_hog_space[i]);
Georgios Pinitas658039b2017-09-15 16:30:50 +0100180
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100181 // Initialise orientation binning kernel
Georgios Pinitas725b1732019-05-20 19:40:47 +0100182 _orient_bin_kernel[i].configure(&_mag, &_phase, &_hog_space[i], multi_hog->model(idx_multi_hog)->info());
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100183 }
184
Georgios Pinitas658039b2017-09-15 16:30:50 +0100185 // Allocate intermediate tensors
186 _mag.allocator()->allocate();
187 _phase.allocator()->allocate();
188
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100189 // Configure NETensor for the normalized HOG space and block normalization kernel
190 for(size_t i = 0; i < _num_block_norm_kernel; ++i)
191 {
192 const size_t idx_multi_hog = input_block_norm[i].first;
193 const size_t idx_orient_bin = input_block_norm[i].second;
194
195 // Allocate normalized HOG space
196 TensorInfo tensor_info(*(multi_hog->model(idx_multi_hog)->info()), width, height);
Georgios Pinitas725b1732019-05-20 19:40:47 +0100197 _hog_norm_space[i].allocator()->init(tensor_info);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100198
Georgios Pinitas658039b2017-09-15 16:30:50 +0100199 // Manage intermediate buffers
Georgios Pinitas725b1732019-05-20 19:40:47 +0100200 _memory_group.manage(&_hog_norm_space[i]);
Georgios Pinitas658039b2017-09-15 16:30:50 +0100201
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100202 // Initialize block normalization kernel
Georgios Pinitas725b1732019-05-20 19:40:47 +0100203 _block_norm_kernel[i].configure(&_hog_space[idx_orient_bin], &_hog_norm_space[i], multi_hog->model(idx_multi_hog)->info());
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100204 }
205
Georgios Pinitas658039b2017-09-15 16:30:50 +0100206 // Allocate intermediate tensors
207 for(size_t i = 0; i < _num_orient_bin_kernel; ++i)
208 {
Georgios Pinitas725b1732019-05-20 19:40:47 +0100209 _hog_space[i].allocator()->allocate();
Georgios Pinitas658039b2017-09-15 16:30:50 +0100210 }
211
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100212 // Configure HOG detector kernel
213 for(size_t i = 0; i < _num_hog_detect_kernel; ++i)
214 {
215 const size_t idx_block_norm = input_hog_detect[i];
216
Georgios Pinitas725b1732019-05-20 19:40:47 +0100217 _hog_detect_kernel[i].configure(&_hog_norm_space[idx_block_norm], multi_hog->model(i), detection_windows, detection_window_strides->at(i), threshold, i);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100218 }
219
220 // Configure non maxima suppression kernel
Georgios Pinitas725b1732019-05-20 19:40:47 +0100221 _non_maxima_kernel.configure(_detection_windows, min_distance);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100222
223 // Allocate intermediate tensors
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100224 for(size_t i = 0; i < _num_block_norm_kernel; ++i)
225 {
Georgios Pinitas725b1732019-05-20 19:40:47 +0100226 _hog_norm_space[i].allocator()->allocate();
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100227 }
228}
229
230void NEHOGMultiDetection::run()
231{
232 ARM_COMPUTE_ERROR_ON_MSG(_detection_windows == nullptr, "Unconfigured function");
233
Georgios Pinitasda953f22019-04-02 17:27:03 +0100234 MemoryGroupResourceScope scope_mg(_memory_group);
Georgios Pinitas658039b2017-09-15 16:30:50 +0100235
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100236 // Reset detection window
237 _detection_windows->clear();
238
239 // Run gradient
240 _gradient_kernel.run();
241
242 // Run orientation binning kernel
Michalis Spyrou299fdd32019-05-01 13:03:59 +0100243 for(auto &kernel : _orient_bin_kernel)
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100244 {
Georgios Pinitas725b1732019-05-20 19:40:47 +0100245 NEScheduler::get().schedule(&kernel, Window::DimY);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100246 }
247
248 // Run block normalization kernel
Michalis Spyrou299fdd32019-05-01 13:03:59 +0100249 for(auto &kernel : _block_norm_kernel)
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100250 {
Georgios Pinitas725b1732019-05-20 19:40:47 +0100251 NEScheduler::get().schedule(&kernel, Window::DimY);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100252 }
253
254 // Run HOG detector kernel
Michalis Spyrou299fdd32019-05-01 13:03:59 +0100255 for(auto &kernel : _hog_detect_kernel)
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100256 {
Georgios Pinitas725b1732019-05-20 19:40:47 +0100257 kernel.run();
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100258 }
259
260 // Run non-maxima suppression kernel if enabled
261 if(_non_maxima_suppression)
262 {
Georgios Pinitas725b1732019-05-20 19:40:47 +0100263 NEScheduler::get().schedule(&_non_maxima_kernel, Window::DimY);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100264 }
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100265}