blob: 8436dce87b18ff6764615d2e4baa70b6f73742a8 [file] [log] [blame]
/*
 * Copyright (c) 2017 ARM Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
24#include "arm_compute/runtime/CL/functions/CLGaussianPyramid.h"
25
26#include "arm_compute/core/CL/ICLTensor.h"
27#include "arm_compute/core/CL/kernels/CLGaussianPyramidKernel.h"
28#include "arm_compute/core/CL/kernels/CLScaleKernel.h"
29#include "arm_compute/core/Error.h"
Anthony Barbier6ff3b192017-09-04 18:44:23 +010030#include "arm_compute/core/PixelValue.h"
31#include "arm_compute/core/TensorInfo.h"
32#include "arm_compute/core/Validate.h"
33#include "arm_compute/core/Window.h"
Moritz Pflanzerd0ae8b82017-06-29 14:51:57 +010034#include "support/ToolchainSupport.h"
Anthony Barbier6ff3b192017-09-04 18:44:23 +010035
36#include "arm_compute/runtime/CL/CLPyramid.h"
37#include "arm_compute/runtime/CL/CLScheduler.h"
38#include "arm_compute/runtime/CL/CLTensor.h"
39#include "arm_compute/runtime/CL/CLTensorAllocator.h"
40#include "arm_compute/runtime/CL/functions/CLGaussian5x5.h"
41
42#include <cstddef>
43
44using namespace arm_compute;
45
46CLGaussianPyramid::CLGaussianPyramid()
47 : _input(nullptr), _pyramid(nullptr), _tmp()
48{
49}
50
Moritz Pflanzerf4af76e2017-09-06 07:42:43 +010051CLGaussianPyramidHalf::CLGaussianPyramidHalf() // NOLINT
52 : _border_handler(),
53 _horizontal_reduction(),
54 _vertical_reduction()
Anthony Barbier6ff3b192017-09-04 18:44:23 +010055{
56}
57
58void CLGaussianPyramidHalf::configure(ICLTensor *input, CLPyramid *pyramid, BorderMode border_mode, uint8_t constant_border_value)
59{
60 ARM_COMPUTE_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(input, 1, DataType::U8);
61 ARM_COMPUTE_ERROR_ON(pyramid == nullptr);
62 ARM_COMPUTE_ERROR_ON(input->info()->num_dimensions() != pyramid->get_pyramid_level(0)->info()->num_dimensions());
63 ARM_COMPUTE_ERROR_ON(input->info()->dimension(0) != pyramid->info()->width());
64 ARM_COMPUTE_ERROR_ON(input->info()->dimension(1) != pyramid->info()->height());
65 ARM_COMPUTE_ERROR_ON(SCALE_PYRAMID_HALF != pyramid->info()->scale());
66
67 /* Get number of pyramid levels */
68 const size_t num_levels = pyramid->info()->num_levels();
69
70 _input = input;
71 _pyramid = pyramid;
72
73 if(num_levels > 1)
74 {
Moritz Pflanzerd0ae8b82017-06-29 14:51:57 +010075 _border_handler = arm_compute::support::cpp14::make_unique<CLFillBorderKernel[]>(num_levels - 1);
76 _horizontal_reduction = arm_compute::support::cpp14::make_unique<CLGaussianPyramidHorKernel[]>(num_levels - 1);
77 _vertical_reduction = arm_compute::support::cpp14::make_unique<CLGaussianPyramidVertKernel[]>(num_levels - 1);
Anthony Barbier6ff3b192017-09-04 18:44:23 +010078
79 // Apply half scale to the X dimension of the tensor shape
80 TensorShape tensor_shape = pyramid->info()->tensor_shape();
81 tensor_shape.set(0, (pyramid->info()->width() + 1) * SCALE_PYRAMID_HALF);
82
83 PyramidInfo pyramid_info(num_levels - 1, SCALE_PYRAMID_HALF, tensor_shape, Format::U16);
84
85 _tmp.init(pyramid_info);
86
87 for(size_t i = 0; i < num_levels - 1; ++i)
88 {
89 /* Configure horizontal kernel */
90 _horizontal_reduction[i].configure(_pyramid->get_pyramid_level(i), _tmp.get_pyramid_level(i), border_mode == BorderMode::UNDEFINED);
91
92 /* Configure vertical kernel */
93 _vertical_reduction[i].configure(_tmp.get_pyramid_level(i), _pyramid->get_pyramid_level(i + 1), border_mode == BorderMode::UNDEFINED);
94
95 /* Configure border */
96 _border_handler[i].configure(_pyramid->get_pyramid_level(i), _horizontal_reduction[i].border_size(), border_mode, PixelValue(constant_border_value));
97 }
98 _tmp.allocate();
99 }
100}
101
102void CLGaussianPyramidHalf::run()
103{
104 ARM_COMPUTE_ERROR_ON_MSG(_pyramid == nullptr, "Unconfigured function");
105
106 /* Get number of pyramid levels */
107 const size_t num_levels = _pyramid->info()->num_levels();
108
109 /* The first level of the pyramid has the input image */
110 _pyramid->get_pyramid_level(0)->map(CLScheduler::get().queue(), true /* blocking */);
111 _input->map(CLScheduler::get().queue(), true /* blocking */);
112 _pyramid->get_pyramid_level(0)->copy_from(*_input);
113 _input->unmap(CLScheduler::get().queue());
114 _pyramid->get_pyramid_level(0)->unmap(CLScheduler::get().queue());
115
116 for(unsigned int i = 0; i < num_levels - 1; ++i)
117 {
118 CLScheduler::get().enqueue(_border_handler[i], false);
119 CLScheduler::get().enqueue(_horizontal_reduction[i], false);
120 CLScheduler::get().enqueue(_vertical_reduction[i], false);
121 }
122}
123
Moritz Pflanzerf4af76e2017-09-06 07:42:43 +0100124CLGaussianPyramidOrb::CLGaussianPyramidOrb() // NOLINT
125 : _gauss5x5(),
126 _scale_nearest()
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100127{
128}
129
130void CLGaussianPyramidOrb::configure(ICLTensor *input, CLPyramid *pyramid, BorderMode border_mode, uint8_t constant_border_value)
131{
132 ARM_COMPUTE_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(input, 1, DataType::U8);
133 ARM_COMPUTE_ERROR_ON(nullptr == pyramid);
134 ARM_COMPUTE_ERROR_ON(input->info()->num_dimensions() != pyramid->get_pyramid_level(0)->info()->num_dimensions());
135 ARM_COMPUTE_ERROR_ON(input->info()->dimension(0) != pyramid->info()->width());
136 ARM_COMPUTE_ERROR_ON(input->info()->dimension(1) != pyramid->info()->height());
137 ARM_COMPUTE_ERROR_ON(SCALE_PYRAMID_ORB != pyramid->info()->scale());
138
139 /* Get number of pyramid levels */
140 const size_t num_levels = pyramid->info()->num_levels();
141
142 _input = input;
143 _pyramid = pyramid;
144
145 if(num_levels > 1)
146 {
Moritz Pflanzerd0ae8b82017-06-29 14:51:57 +0100147 _gauss5x5 = arm_compute::support::cpp14::make_unique<CLGaussian5x5[]>(num_levels - 1);
148 _scale_nearest = arm_compute::support::cpp14::make_unique<CLScaleKernel[]>(num_levels - 1);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100149
150 PyramidInfo pyramid_info(num_levels - 1, SCALE_PYRAMID_ORB, pyramid->info()->tensor_shape(), Format::U8);
151
152 _tmp.init(pyramid_info);
153
154 for(size_t i = 0; i < num_levels - 1; ++i)
155 {
156 /* Configure gaussian 5x5 */
157 _gauss5x5[i].configure(_pyramid->get_pyramid_level(i), _tmp.get_pyramid_level(i), border_mode, constant_border_value);
158
159 /* Configure scale image kernel */
160 _scale_nearest[i].configure(_tmp.get_pyramid_level(i), _pyramid->get_pyramid_level(i + 1), InterpolationPolicy::NEAREST_NEIGHBOR, border_mode == BorderMode::UNDEFINED);
161 }
162
163 _tmp.allocate();
164 }
165}
166
167void CLGaussianPyramidOrb::run()
168{
169 ARM_COMPUTE_ERROR_ON_MSG(_pyramid == nullptr, "Unconfigured function");
170
171 /* Get number of pyramid levels */
172 const size_t num_levels = _pyramid->info()->num_levels();
173
174 /* The first level of the pyramid has the input image */
175 _pyramid->get_pyramid_level(0)->map(CLScheduler::get().queue(), true /* blocking */);
176 _input->map(CLScheduler::get().queue(), true /* blocking */);
177 _pyramid->get_pyramid_level(0)->copy_from(*_input);
178 _input->unmap(CLScheduler::get().queue());
179 _pyramid->get_pyramid_level(0)->unmap(CLScheduler::get().queue());
180
181 for(unsigned int i = 0; i < num_levels - 1; ++i)
182 {
183 _gauss5x5[i].run();
184 CLScheduler::get().enqueue(_scale_nearest[i]);
185 }
186}