blob: 8d77abcfc741929f207a0f3fa6f7e1eae60fbbc6 [file] [log] [blame]
Pablo Tello89519332017-11-17 11:52:36 +00001/*
ramelg01a1f78512022-06-29 16:28:10 +01002 * Copyright (c) 2017-2022 Arm Limited.
Pablo Tello89519332017-11-17 11:52:36 +00003 *
4 * SPDX-License-Identifier: MIT
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to
8 * deal in the Software without restriction, including without limitation the
9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10 * sell copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 */
Georgios Pinitas9fb11592018-04-26 20:34:58 +010024#include "arm_compute/runtime/NEON/functions/NEWinogradConvolutionLayer.h"
Pablo Tello89519332017-11-17 11:52:36 +000025
Isabella Gottardi6acc6ad2018-02-02 17:19:18 +000026#include "arm_compute/core/Error.h"
Michalis Spyrou96f977e2021-07-01 12:20:56 +010027#include "arm_compute/core/ITensorPack.h"
Pablo Tello89519332017-11-17 11:52:36 +000028#include "arm_compute/core/Utils.h"
Vidhya Sudhan Loganathan3ca97862018-04-23 08:20:04 +010029#include "arm_compute/core/utils/misc/ShapeCalculator.h"
Felix Thomasmathibalanafd38f02023-09-27 17:46:17 +010030#include "arm_compute/core/Validate.h"
31
Sang-Hoon Park68dd25f2020-10-19 16:00:11 +010032#include "src/core/CPP/Validate.h"
Michalis Spyrou96f977e2021-07-01 12:20:56 +010033#include "src/core/helpers/MemoryHelpers.h"
Felix Thomasmathibalanafd38f02023-09-27 17:46:17 +010034#include "src/core/NEON/kernels/convolution/common/utils.hpp"
Georgios Pinitas7891a732021-08-20 21:39:25 +010035#include "src/cpu/kernels/CpuWinogradConv2dKernel.h"
36#include "src/cpu/operators/CpuWinogradConv2d.h"
Pablo Tello89519332017-11-17 11:52:36 +000037
Pablo Tello89519332017-11-17 11:52:36 +000038namespace arm_compute
39{
Michalis Spyrou96f977e2021-07-01 12:20:56 +010040using namespace arm_compute::experimental;
41
42struct NEWinogradConvolutionLayer::Impl
Isabella Gottardi6acc6ad2018-02-02 17:19:18 +000043{
Michalis Spyrou96f977e2021-07-01 12:20:56 +010044 MemoryGroup memory_group{};
Felix Thomasmathibalanafd38f02023-09-27 17:46:17 +010045 std::unique_ptr<cpu::CpuWinogradConv2d> op{nullptr};
Michalis Spyrou96f977e2021-07-01 12:20:56 +010046 ITensorPack run_pack{};
47 ITensorPack prep_pack{};
48 WorkspaceData<Tensor> workspace{};
49 experimental::MemoryRequirements aux_mem_req{};
Felix Thomasmathibalanafd38f02023-09-27 17:46:17 +010050 const ITensor *original_weights{nullptr};
51 bool is_prepared{false};
52 bool is_activationlayer_enabled{false};
Michalis Spyrou96f977e2021-07-01 12:20:56 +010053 DataLayout data_layout{};
54};
Isabella Gottardi6acc6ad2018-02-02 17:19:18 +000055
Michalis Spyroua4f378d2019-04-26 14:54:54 +010056NEWinogradConvolutionLayer::NEWinogradConvolutionLayer(const std::shared_ptr<IMemoryManager> &memory_manager)
Michalis Spyrou96f977e2021-07-01 12:20:56 +010057 : _impl(std::make_unique<Impl>())
Pablo Tello89519332017-11-17 11:52:36 +000058{
Michalis Spyrou96f977e2021-07-01 12:20:56 +010059 _impl->memory_group = MemoryGroup(std::move(memory_manager));
Pablo Tello8f43d742019-03-27 09:28:32 +000060}
Pablo Tello89519332017-11-17 11:52:36 +000061
Michalis Spyrou96f977e2021-07-01 12:20:56 +010062NEWinogradConvolutionLayer::~NEWinogradConvolutionLayer() = default;
63
Felix Thomasmathibalanafd38f02023-09-27 17:46:17 +010064void NEWinogradConvolutionLayer::configure(const ITensor *input,
65 const ITensor *weights,
66 const ITensor *biases,
67 ITensor *output,
68 const PadStrideInfo &conv_info,
69 const ActivationLayerInfo &act_info,
70 bool enable_fast_math)
Pablo Tello89519332017-11-17 11:52:36 +000071{
Michalis Spyrou96f977e2021-07-01 12:20:56 +010072 _impl->original_weights = weights;
73 _impl->op = std::make_unique<cpu::CpuWinogradConv2d>();
Felix Thomasmathibalanafd38f02023-09-27 17:46:17 +010074 _impl->op->configure(input->info(), weights->info(), biases != nullptr ? biases->info() : nullptr, output->info(),
75 conv_info, act_info, enable_fast_math);
Pablo Tello89519332017-11-17 11:52:36 +000076
Michalis Spyrou96f977e2021-07-01 12:20:56 +010077 _impl->aux_mem_req = _impl->op->workspace();
Felix Thomasmathibalanafd38f02023-09-27 17:46:17 +010078 _impl->run_pack = {{ACL_SRC_0, input}, {ACL_SRC_1, weights}, {ACL_SRC_2, biases}, {ACL_DST, output}};
79 _impl->prep_pack = {{ACL_SRC_1, weights}, {ACL_SRC_2, biases}};
80 _impl->workspace =
81 manage_workspace<Tensor>(_impl->aux_mem_req, _impl->memory_group, _impl->run_pack, _impl->prep_pack);
Pablo Tello89519332017-11-17 11:52:36 +000082}
83
Georgios Pinitas9fb11592018-04-26 20:34:58 +010084void NEWinogradConvolutionLayer::run()
Pablo Tello89519332017-11-17 11:52:36 +000085{
Georgios Pinitas72219332018-06-05 14:56:06 +010086 prepare();
87
Michalis Spyrou96f977e2021-07-01 12:20:56 +010088 MemoryGroupResourceScope scope_mg(_impl->memory_group);
89 _impl->op->run(_impl->run_pack);
Pablo Tello89519332017-11-17 11:52:36 +000090}
Isabella Gottardi6acc6ad2018-02-02 17:19:18 +000091
Felix Thomasmathibalanafd38f02023-09-27 17:46:17 +010092Status NEWinogradConvolutionLayer::validate(const ITensorInfo *input,
93 const ITensorInfo *weights,
94 const ITensorInfo *biases,
95 const ITensorInfo *output,
96 const PadStrideInfo &conv_info,
97 const ActivationLayerInfo &act_info,
98 bool enable_fast_math)
Isabella Gottardi6acc6ad2018-02-02 17:19:18 +000099{
Michalis Spyrou96f977e2021-07-01 12:20:56 +0100100 return cpu::CpuWinogradConv2d::validate(input, weights, biases, output, conv_info, act_info, enable_fast_math);
Isabella Gottardi6acc6ad2018-02-02 17:19:18 +0000101}
102
Georgios Pinitas72219332018-06-05 14:56:06 +0100103void NEWinogradConvolutionLayer::prepare()
104{
Felix Thomasmathibalanafd38f02023-09-27 17:46:17 +0100105 if (!_impl->is_prepared)
Georgios Pinitas72219332018-06-05 14:56:06 +0100106 {
Michalis Spyrou96f977e2021-07-01 12:20:56 +0100107 _impl->op->prepare(_impl->prep_pack);
108 _impl->original_weights->mark_as_unused();
Georgios Pinitas72219332018-06-05 14:56:06 +0100109
Michalis Spyrou96f977e2021-07-01 12:20:56 +0100110 // Release temporary tensors that are only used in prepare stage
Michele Di Giorgiod9cdf142021-07-02 15:17:08 +0100111 release_temporaries<Tensor>(_impl->aux_mem_req, _impl->workspace);
Georgios Pinitasddd79f52021-01-15 09:42:26 +0000112
Michalis Spyrou96f977e2021-07-01 12:20:56 +0100113 _impl->is_prepared = true;
Georgios Pinitas72219332018-06-05 14:56:06 +0100114 }
115}
Pablo Tello89519332017-11-17 11:52:36 +0000116} // namespace arm_compute