blob: d00b1b50994757282c6f2dc6eef07acfcef17c75 [file] [log] [blame]
Anthony Barbier6ff3b192017-09-04 18:44:23 +01001/*
2 * Copyright (c) 2017 ARM Limited.
3 *
4 * SPDX-License-Identifier: MIT
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to
8 * deal in the Software without restriction, including without limitation the
9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10 * sell copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 */
24#include "arm_compute/runtime/CL/functions/CLOpticalFlow.h"
25
26#include "arm_compute/core/CL/ICLTensor.h"
27#include "arm_compute/core/CL/kernels/CLLKTrackerKernel.h"
28#include "arm_compute/core/Error.h"
Anthony Barbier6ff3b192017-09-04 18:44:23 +010029#include "arm_compute/core/TensorInfo.h"
30#include "arm_compute/core/Window.h"
31#include "arm_compute/runtime/CL/CLPyramid.h"
32#include "arm_compute/runtime/CL/CLScheduler.h"
33#include "arm_compute/runtime/CL/CLTensor.h"
34#include "arm_compute/runtime/CL/CLTensorAllocator.h"
35#include "arm_compute/runtime/CL/functions/CLScharr3x3.h"
Moritz Pflanzerd0ae8b82017-06-29 14:51:57 +010036#include "support/ToolchainSupport.h"
Anthony Barbier6ff3b192017-09-04 18:44:23 +010037
38using namespace arm_compute;
39
Georgios Pinitas8a94e7c2017-09-15 19:06:47 +010040CLOpticalFlow::CLOpticalFlow(std::shared_ptr<IMemoryManager> memory_manager) // NOLINT
41 : _memory_group(std::move(memory_manager)),
42 _tracker_init_kernel(),
Moritz Pflanzerf4af76e2017-09-06 07:42:43 +010043 _tracker_stage0_kernel(),
44 _tracker_stage1_kernel(),
45 _tracker_finalize_kernel(),
46 _func_scharr(),
47 _scharr_gx(),
48 _scharr_gy(),
49 _old_points(nullptr),
50 _new_points_estimates(nullptr),
51 _new_points(nullptr),
52 _old_points_internal(),
53 _new_points_internal(),
54 _coefficient_table(),
55 _old_values(),
56 _num_levels(0)
Anthony Barbier6ff3b192017-09-04 18:44:23 +010057{
58}
59
60void CLOpticalFlow::configure(const CLPyramid *old_pyramid, const CLPyramid *new_pyramid,
61 const ICLKeyPointArray *old_points, const ICLKeyPointArray *new_points_estimates, ICLKeyPointArray *new_points,
62 Termination termination, float epsilon, size_t num_iterations, size_t window_dimension, bool use_initial_estimate,
63 BorderMode border_mode, uint8_t constant_border_value)
64{
65 ARM_COMPUTE_ERROR_ON(nullptr == old_pyramid);
66 ARM_COMPUTE_ERROR_ON(nullptr == new_pyramid);
67 ARM_COMPUTE_ERROR_ON(nullptr == old_points);
68 ARM_COMPUTE_ERROR_ON(nullptr == new_points_estimates);
69 ARM_COMPUTE_ERROR_ON(nullptr == new_points);
70 ARM_COMPUTE_ERROR_ON(old_pyramid->info()->num_levels() != new_pyramid->info()->num_levels());
71 ARM_COMPUTE_ERROR_ON(0 == old_pyramid->info()->num_levels());
72 ARM_COMPUTE_ERROR_ON(old_pyramid->info()->width() != new_pyramid->info()->width());
73 ARM_COMPUTE_ERROR_ON(old_pyramid->info()->height() != new_pyramid->info()->height());
74 ARM_COMPUTE_ERROR_ON(use_initial_estimate && old_points->num_values() != new_points_estimates->num_values());
75
76 // Set member variables
77 _old_points = old_points;
78 _new_points_estimates = new_points_estimates;
79 _new_points = new_points;
80 _num_levels = old_pyramid->info()->num_levels();
81
82 const float pyr_scale = old_pyramid->info()->scale();
83 const int list_length = old_points->num_values();
84 const int old_values_list_length = list_length * window_dimension * window_dimension;
85
86 // Create kernels and tensors
Moritz Pflanzerd0ae8b82017-06-29 14:51:57 +010087 _tracker_init_kernel = arm_compute::support::cpp14::make_unique<CLLKTrackerInitKernel[]>(_num_levels);
88 _tracker_stage0_kernel = arm_compute::support::cpp14::make_unique<CLLKTrackerStage0Kernel[]>(_num_levels);
89 _tracker_stage1_kernel = arm_compute::support::cpp14::make_unique<CLLKTrackerStage1Kernel[]>(_num_levels);
90 _func_scharr = arm_compute::support::cpp14::make_unique<CLScharr3x3[]>(_num_levels);
91 _scharr_gx = arm_compute::support::cpp14::make_unique<CLTensor[]>(_num_levels);
92 _scharr_gy = arm_compute::support::cpp14::make_unique<CLTensor[]>(_num_levels);
Anthony Barbier6ff3b192017-09-04 18:44:23 +010093
94 // Create internal keypoint arrays
Moritz Pflanzerd0ae8b82017-06-29 14:51:57 +010095 _old_points_internal = arm_compute::support::cpp14::make_unique<CLLKInternalKeypointArray>(list_length);
Anthony Barbier6ff3b192017-09-04 18:44:23 +010096 _old_points_internal->resize(list_length);
Moritz Pflanzerd0ae8b82017-06-29 14:51:57 +010097 _new_points_internal = arm_compute::support::cpp14::make_unique<CLLKInternalKeypointArray>(list_length);
Anthony Barbier6ff3b192017-09-04 18:44:23 +010098 _new_points_internal->resize(list_length);
Moritz Pflanzerd0ae8b82017-06-29 14:51:57 +010099 _coefficient_table = arm_compute::support::cpp14::make_unique<CLCoefficientTableArray>(list_length);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100100 _coefficient_table->resize(list_length);
Moritz Pflanzerd0ae8b82017-06-29 14:51:57 +0100101 _old_values = arm_compute::support::cpp14::make_unique<CLOldValueArray>(old_values_list_length);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100102 _old_values->resize(old_values_list_length);
103 _new_points->resize(list_length);
104
105 for(size_t i = 0; i < _num_levels; ++i)
106 {
107 // Get images from the ith level of old and right pyramid
108 ICLImage *old_ith_input = old_pyramid->get_pyramid_level(i);
109 ICLImage *new_ith_input = new_pyramid->get_pyramid_level(i);
110
111 // Get width and height of images
112 const unsigned int width_ith = old_ith_input->info()->dimension(0);
113 const unsigned int height_ith = new_ith_input->info()->dimension(1);
114
115 // Initialize Scharr tensors
116 TensorInfo tensor_info(TensorShape(width_ith, height_ith), 1, DataType::S16);
117 _scharr_gx[i].allocator()->init(tensor_info);
118 _scharr_gy[i].allocator()->init(tensor_info);
119
Georgios Pinitas8a94e7c2017-09-15 19:06:47 +0100120 // Manage intermediate buffers
121 _memory_group.manage(_scharr_gx.get() + i);
122 _memory_group.manage(_scharr_gy.get() + i);
123
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100124 // Init Scharr kernel
125 _func_scharr[i].configure(old_ith_input, &_scharr_gx[i], &_scharr_gy[i], border_mode, constant_border_value);
126
127 // Init Lucas-Kanade init kernel
128 _tracker_init_kernel[i].configure(old_points, new_points_estimates, _old_points_internal.get(), _new_points_internal.get(), use_initial_estimate, i, _num_levels, pyr_scale);
129
130 // Init Lucas-Kanade stage0 kernel
131 _tracker_stage0_kernel[i].configure(old_ith_input, &_scharr_gx[i], &_scharr_gy[i],
132 _old_points_internal.get(), _new_points_internal.get(), _coefficient_table.get(), _old_values.get(),
133 window_dimension, i);
134
135 // Init Lucas-Kanade stage1 kernel
136 _tracker_stage1_kernel[i].configure(new_ith_input, _new_points_internal.get(), _coefficient_table.get(), _old_values.get(),
137 termination, epsilon, num_iterations, window_dimension, i);
138
139 // Allocate intermediate buffers
140 _scharr_gx[i].allocator()->allocate();
141 _scharr_gy[i].allocator()->allocate();
142 }
143
144 // Finalize Lucas-Kanade
145 _tracker_finalize_kernel.configure(_new_points_internal.get(), new_points);
146}
147
148void CLOpticalFlow::run()
149{
150 ARM_COMPUTE_ERROR_ON_MSG(_num_levels == 0, "Unconfigured function");
151
Georgios Pinitas8a94e7c2017-09-15 19:06:47 +0100152 _memory_group.acquire();
153
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100154 for(unsigned int level = _num_levels; level > 0; --level)
155 {
156 // Run Scharr kernel
157 _func_scharr[level - 1].run();
158
159 // Run Lucas-Kanade init kernel
160 CLScheduler::get().enqueue(_tracker_init_kernel[level - 1]);
161
162 // Run Lucas-Kanade stage0 kernel
163 CLScheduler::get().enqueue(_tracker_stage0_kernel[level - 1]);
164
165 // Run Lucas-Kanade stage1 kernel
166 CLScheduler::get().enqueue(_tracker_stage1_kernel[level - 1]);
167 }
168
169 CLScheduler::get().enqueue(_tracker_finalize_kernel, true);
Georgios Pinitas8a94e7c2017-09-15 19:06:47 +0100170
171 _memory_group.release();
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100172}