blob: c3ecfb430f70df14d2b9c31e0b7a8cdbb71da30a [file] [log] [blame]
/*
 * Copyright (c) 2017-2021 Arm Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
Giorgio Arena04a8f8c2017-11-23 11:45:24 +000024#include "arm_compute/runtime/NEON/functions/NEL2NormalizeLayer.h"
Georgios Pinitasd9769582017-08-03 10:19:40 +010025
26#include "arm_compute/core/Helpers.h"
27#include "arm_compute/runtime/NEON/NEScheduler.h"
ramelg01cbbb0382021-09-17 17:36:57 +010028#include "src/common/utils/Log.h"
Michalis Spyrouebcebf12020-10-21 00:04:14 +010029#include "src/core/NEON/kernels/NEL2NormalizeLayerKernel.h"
30#include "src/core/NEON/kernels/NEReductionOperationKernel.h"
Georgios Pinitasd9769582017-08-03 10:19:40 +010031
Michalis Spyrou2897e612018-11-20 18:38:29 +000032namespace arm_compute
33{
namespace
{
// Bound handed to wrap_around() together with the caller-supplied axis in
// configure() and validate(); the wrapped value is what the reduction receives.
constexpr int max_input_tensor_dim{ 3 };
} // namespace
Michalis Spyrouebcebf12020-10-21 00:04:14 +010038NEL2NormalizeLayer::~NEL2NormalizeLayer() = default;
Manuel Bottini4b5c5882019-05-14 10:38:30 +010039
Giorgio Arena04a8f8c2017-11-23 11:45:24 +000040NEL2NormalizeLayer::NEL2NormalizeLayer(std::shared_ptr<IMemoryManager> memory_manager)
Georgios Pinitas658039b2017-09-15 16:30:50 +010041 : _memory_group(std::move(memory_manager)), _reduce_func(), _normalize_kernel(), _sumsq()
Georgios Pinitasd9769582017-08-03 10:19:40 +010042{
43}
44
Manuel Bottini4b5c5882019-05-14 10:38:30 +010045void NEL2NormalizeLayer::configure(ITensor *input, ITensor *output, int axis, float epsilon)
Georgios Pinitasd9769582017-08-03 10:19:40 +010046{
ramelg01cbbb0382021-09-17 17:36:57 +010047 ARM_COMPUTE_LOG_PARAMS(input, output, axis, epsilon);
48
Georgios Pinitas658039b2017-09-15 16:30:50 +010049 // Manage intermediate buffers
50 _memory_group.manage(&_sumsq);
51
Georgios Pinitasd9769582017-08-03 10:19:40 +010052 // Configure Kernels
Manuel Bottini4b5c5882019-05-14 10:38:30 +010053 const uint32_t actual_axis = wrap_around(axis, max_input_tensor_dim);
54 _reduce_func.configure(input, &_sumsq, actual_axis, ReductionOperation::SUM_SQUARE);
Georgios Pinitas40f51a62020-11-21 03:04:18 +000055 _normalize_kernel = std::make_unique<NEL2NormalizeLayerKernel>();
Michalis Spyrouebcebf12020-10-21 00:04:14 +010056 _normalize_kernel->configure(input, &_sumsq, output, axis, epsilon);
Georgios Pinitasd9769582017-08-03 10:19:40 +010057
58 // Allocate intermediate tensors
59 _sumsq.allocator()->allocate();
60}
61
Manuel Bottini4b5c5882019-05-14 10:38:30 +010062Status NEL2NormalizeLayer::validate(const ITensorInfo *input, const ITensorInfo *output, int axis, float epsilon)
John Richardson73d4aef2018-05-08 14:34:33 +010063{
64 TensorShape shape(input->tensor_shape());
65
66 // Create intermediate tensor info
67 TensorInfo sum_sq;
68 sum_sq.set_data_type(input->data_type());
69 sum_sq.set_tensor_shape(shape);
70
Manuel Bottini4b5c5882019-05-14 10:38:30 +010071 const uint32_t actual_axis = wrap_around(axis, max_input_tensor_dim);
72 ARM_COMPUTE_RETURN_ON_ERROR(NEReductionOperation::validate(input, &sum_sq, actual_axis, ReductionOperation::SUM_SQUARE));
John Richardson73d4aef2018-05-08 14:34:33 +010073
Michalis Spyrou2897e612018-11-20 18:38:29 +000074 // Reduce shape on axis
Manuel Bottini4b5c5882019-05-14 10:38:30 +010075 shape.set(actual_axis, 1);
John Richardson73d4aef2018-05-08 14:34:33 +010076 sum_sq.set_tensor_shape(shape);
77
78 ARM_COMPUTE_RETURN_ON_ERROR(NEL2NormalizeLayerKernel::validate(input, &sum_sq, output, axis, epsilon));
79
80 return Status{};
81}
82
Giorgio Arena04a8f8c2017-11-23 11:45:24 +000083void NEL2NormalizeLayer::run()
Georgios Pinitasd9769582017-08-03 10:19:40 +010084{
Georgios Pinitasda953f22019-04-02 17:27:03 +010085 MemoryGroupResourceScope scope_mg(_memory_group);
Georgios Pinitas658039b2017-09-15 16:30:50 +010086
Georgios Pinitasd9769582017-08-03 10:19:40 +010087 _reduce_func.run();
Michalis Spyrouebcebf12020-10-21 00:04:14 +010088 NEScheduler::get().schedule(_normalize_kernel.get(), Window::DimY);
Georgios Pinitasd9769582017-08-03 10:19:40 +010089}
Michalis Spyrou2897e612018-11-20 18:38:29 +000090} // namespace arm_compute