blob: 1e12e133570374d019acbaf2e8d817b09b04d061 [file] [log] [blame]
//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//
5
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +01006#include "NeonConvolution2dWorkload.hpp"
7
Aron Virginas-Tarc9cc8042018-11-01 16:15:57 +00008#include <aclCommon/ArmComputeTensorUtils.hpp>
Mike Kelly07810fc2020-11-12 10:58:48 +00009#include <aclCommon/ArmComputeUtils.hpp>
Jan Eilersbb446e52020-04-02 13:56:54 +010010#include <armnn/utility/PolymorphicDowncast.hpp>
James Conroy1f58f032021-04-27 17:13:27 +010011#include <backendsCommon/TensorHandle.hpp>
Matthew Benthamd80a7122019-01-08 17:52:37 +000012#include <neon/workloads/NeonWorkloadUtils.hpp>
13
14#include <arm_compute/runtime/NEON/functions/NEConvolutionLayer.h>
telsoa014fcda012018-03-09 14:13:49 +000015
David Beck711fa312018-09-24 10:46:38 +010016#include <armnn/Types.hpp>
Aron Virginas-Tarc9cc8042018-11-01 16:15:57 +000017#include <Half.hpp>
telsoa01c577f2c2018-08-31 09:22:23 +010018
telsoa014fcda012018-03-09 14:13:49 +000019namespace armnn
20{
21
surmeh013537c2c2018-05-18 16:31:43 +010022using namespace armcomputetensorutils;
23
24arm_compute::Status NeonConvolution2dWorkloadValidate(const TensorInfo& input,
Sadik Armagan045f6be2020-09-10 13:37:32 +010025 const TensorInfo& output,
26 const Convolution2dDescriptor& descriptor,
27 const TensorInfo& weights,
28 const Optional<TensorInfo>& biases,
Mike Kelly07810fc2020-11-12 10:58:48 +000029 bool isFastMathEnabled,
30 const ActivationDescriptor* activationDescriptor)
surmeh013537c2c2018-05-18 16:31:43 +010031{
Francis Murtagh351d13d2018-09-24 15:01:18 +010032 const arm_compute::TensorInfo aclInputInfo = BuildArmComputeTensorInfo(input, descriptor.m_DataLayout);
33 const arm_compute::TensorInfo aclOutputInfo = BuildArmComputeTensorInfo(output, descriptor.m_DataLayout);
34 const arm_compute::TensorInfo aclWeightsInfo = BuildArmComputeTensorInfo(weights, descriptor.m_DataLayout);
arovir01a6824102018-08-28 17:40:45 +010035
Jan Eilers59c66702019-07-11 10:22:36 +010036 const arm_compute::Size2D aclDilationInfo = BuildArmComputeSize2D(descriptor.m_DilationX,
37 descriptor.m_DilationY);
38
surmeh013537c2c2018-05-18 16:31:43 +010039 arm_compute::TensorInfo aclBiasesInfo;
40 arm_compute::TensorInfo *optionalAclBiasesInfo = nullptr;
41
42 if (descriptor.m_BiasEnabled)
43 {
Narumol Prangnawaratac2770a2020-04-01 16:51:23 +010044 ARMNN_ASSERT(biases.has_value());
arovir01a6824102018-08-28 17:40:45 +010045
David Beck5eec11d2018-10-04 15:43:17 +010046 aclBiasesInfo = BuildArmComputeTensorInfo(biases.value(), descriptor.m_DataLayout);
surmeh013537c2c2018-05-18 16:31:43 +010047 optionalAclBiasesInfo = &aclBiasesInfo;
48 }
49
50 arm_compute::PadStrideInfo layerInfo = BuildArmComputePadStrideInfo(descriptor);
51
Mike Kelly07810fc2020-11-12 10:58:48 +000052 const arm_compute::ActivationLayerInfo activationInfo = ConvertActivationDescriptorToAclActivationLayerInfo(
53 activationDescriptor);
54
surmeh013537c2c2018-05-18 16:31:43 +010055 return arm_compute::NEConvolutionLayer::validate(&aclInputInfo,
56 &aclWeightsInfo,
57 optionalAclBiasesInfo,
58 &aclOutputInfo,
Jan Eilers59c66702019-07-11 10:22:36 +010059 layerInfo,
60 arm_compute::WeightsInfo(),
Sadik Armagan045f6be2020-09-10 13:37:32 +010061 aclDilationInfo,
Mike Kelly07810fc2020-11-12 10:58:48 +000062 activationInfo,
Sadik Armagan045f6be2020-09-10 13:37:32 +010063 isFastMathEnabled);
surmeh013537c2c2018-05-18 16:31:43 +010064}
65
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +010066NeonConvolution2dWorkload::NeonConvolution2dWorkload(
Sadik Armagan04a72972020-09-14 15:44:18 +010067 const Convolution2dQueueDescriptor& descriptor,
68 const WorkloadInfo& info,
69 std::shared_ptr<arm_compute::MemoryManagerOnDemand>& memoryManager,
70 const bool isFastMathEnabled)
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +010071 : BaseWorkload<Convolution2dQueueDescriptor>(descriptor, info)
telsoa014fcda012018-03-09 14:13:49 +000072{
Teresa Charlin30dfc542020-11-12 22:22:31 +000073 using arm_compute::NEConvolutionLayer;
telsoa014fcda012018-03-09 14:13:49 +000074
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +010075 m_Data.ValidateInputsOutputs("NeonConvolution2dWorkload", 1, 1);
telsoa014fcda012018-03-09 14:13:49 +000076
Jan Eilersbb446e52020-04-02 13:56:54 +010077 arm_compute::ITensor& input = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
78 arm_compute::ITensor& output = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();
telsoa014fcda012018-03-09 14:13:49 +000079
Francis Murtaghd59116e2018-10-04 16:03:07 +010080 arm_compute::DataLayout aclDataLayout = ConvertDataLayout(m_Data.m_Parameters.m_DataLayout);
81 input.info()->set_data_layout(aclDataLayout);
82 output.info()->set_data_layout(aclDataLayout);
83
telsoa01c577f2c2018-08-31 09:22:23 +010084 m_KernelTensor = std::make_unique<arm_compute::Tensor>();
Francis Murtaghd59116e2018-10-04 16:03:07 +010085 BuildArmComputeTensor(*m_KernelTensor, m_Data.m_Weight->GetTensorInfo(), m_Data.m_Parameters.m_DataLayout);
telsoa014fcda012018-03-09 14:13:49 +000086
telsoa014fcda012018-03-09 14:13:49 +000087 if (m_Data.m_Parameters.m_BiasEnabled)
88 {
telsoa01c577f2c2018-08-31 09:22:23 +010089 m_BiasTensor = std::make_unique<arm_compute::Tensor>();
Francis Murtaghd59116e2018-10-04 16:03:07 +010090 BuildArmComputeTensor(*m_BiasTensor, m_Data.m_Bias->GetTensorInfo(), m_Data.m_Parameters.m_DataLayout);
telsoa014fcda012018-03-09 14:13:49 +000091 }
92
Aron Virginas-Tar6f3785d2019-07-22 15:30:22 +010093 arm_compute::PadStrideInfo padStrideInfo = BuildArmComputePadStrideInfo(m_Data.m_Parameters);
telsoa014fcda012018-03-09 14:13:49 +000094
Jan Eilers59c66702019-07-11 10:22:36 +010095 const arm_compute::Size2D aclDilationInfo = BuildArmComputeSize2D(m_Data.m_Parameters.m_DilationX,
96 m_Data.m_Parameters.m_DilationY);
97
Mike Kelly07810fc2020-11-12 10:58:48 +000098 const arm_compute::ActivationLayerInfo activationInfo = ConvertAdditionalInfoToAclActivationLayerInfo(descriptor);
99
narpra01fca75c32018-11-16 12:38:41 +0000100 auto convolutionLayer = std::make_unique<arm_compute::NEConvolutionLayer>(memoryManager);
101 convolutionLayer->configure(&input,
102 m_KernelTensor.get(),
103 m_BiasTensor.get(),
104 &output,
Jan Eilers59c66702019-07-11 10:22:36 +0100105 padStrideInfo,
106 arm_compute::WeightsInfo(),
Sadik Armagan04a72972020-09-14 15:44:18 +0100107 aclDilationInfo,
Mike Kelly07810fc2020-11-12 10:58:48 +0000108 activationInfo,
Sadik Armagan04a72972020-09-14 15:44:18 +0100109 isFastMathEnabled);
110
111 m_ConvolutionMethod =
112 convolutionLayer->get_convolution_method(input.info(),
113 m_KernelTensor->info(),
114 output.info(),
115 padStrideInfo,
116 arm_compute::WeightsInfo(),
117 aclDilationInfo,
Mike Kelly07810fc2020-11-12 10:58:48 +0000118 activationInfo,
Sadik Armagan04a72972020-09-14 15:44:18 +0100119 isFastMathEnabled);
Jan Eilers59c66702019-07-11 10:22:36 +0100120
Keith Davis554fa092021-07-20 11:25:22 +0100121 // Add details for profiling output
122 std::string workloadName = "NeonConvolution2dWorkload_Execute_Guid" + std::to_string(this->GetGuid());
123
124 WorkloadInfo detailsInfo;
125
126 detailsInfo.m_InputTensorInfos = info.m_InputTensorInfos;
127 detailsInfo.m_OutputTensorInfos = info.m_OutputTensorInfos;
128 detailsInfo.m_WeightsTensorInfo = armnn::Optional<armnn::TensorInfo>(descriptor.m_Weight->GetTensorInfo());
129 detailsInfo.m_ConvolutionMethod = armnn::Optional<std::string>(GetConvolutionMethodString());
130 if (descriptor.m_Parameters.m_BiasEnabled)
131 {
132 detailsInfo.m_BiasTensorInfo = armnn::Optional<armnn::TensorInfo>(descriptor.m_Bias->GetTensorInfo());
133 }
134
135 // Report Profiling Details
136 ARMNN_REPORT_PROFILING_WORKLOAD_DESC(workloadName, descriptor.m_Parameters, detailsInfo);
137
narpra01fca75c32018-11-16 12:38:41 +0000138 m_ConvolutionLayer.reset(convolutionLayer.release());
telsoa014fcda012018-03-09 14:13:49 +0000139
Narumol Prangnawaratac2770a2020-04-01 16:51:23 +0100140 ARMNN_ASSERT(m_ConvolutionLayer);
telsoa014fcda012018-03-09 14:13:49 +0000141
Nattapat Chaimanowong177d8d22018-10-16 13:21:27 +0100142 InitializeArmComputeTensorData(*m_KernelTensor, m_Data.m_Weight);
telsoa014fcda012018-03-09 14:13:49 +0000143
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +0100144 if (m_Data.m_Parameters.m_BiasEnabled)
145 {
146 InitializeArmComputeTensorData(*m_BiasTensor, m_Data.m_Bias);
147 }
148
149 m_ConvolutionLayer->prepare();
150 FreeUnusedTensors();
telsoa014fcda012018-03-09 14:13:49 +0000151}
152
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +0100153void NeonConvolution2dWorkload::Execute() const
154{
155 ARMNN_SCOPED_PROFILING_EVENT_NEON("NeonConvolution2dWorkload_Execute");
156 m_ConvolutionLayer->run();
157}
158
Sadik Armagan04a72972020-09-14 15:44:18 +0100159arm_compute::ConvolutionMethod NeonConvolution2dWorkload::GetConvolutionMethod() const
160{
161 return m_ConvolutionMethod;
162}
163
Keith Davis554fa092021-07-20 11:25:22 +0100164std::string NeonConvolution2dWorkload::GetConvolutionMethodString()
165{
166 switch ( m_ConvolutionMethod )
167 {
168 case arm_compute::ConvolutionMethod::FFT:
169 return "FFT";
170 case arm_compute::ConvolutionMethod::DIRECT:
171 return "Direct";
172 case arm_compute::ConvolutionMethod::GEMM:
173 return "GEMM";
174 case arm_compute::ConvolutionMethod::WINOGRAD:
175 return "Winograd";
176 default:
177 return "Unknown";
178 }
179}
180
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +0100181void NeonConvolution2dWorkload::FreeUnusedTensors()
telsoa01c577f2c2018-08-31 09:22:23 +0100182{
183 FreeTensorIfUnused(m_KernelTensor);
184 FreeTensorIfUnused(m_BiasTensor);
185}
186
telsoa014fcda012018-03-09 14:13:49 +0000187} //namespace armnn