blob: 65844476e42d2be636341f55eb50e22b7196a0e8 [file] [log] [blame]
//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//
Aron Virginas-Tar56055192018-11-12 18:10:43 +00005
David Beck79141b92018-10-23 16:09:36 +01006#include "NeonBackendId.hpp"
Aron Virginas-Tar56055192018-11-12 18:10:43 +00007#include "NeonTensorHandle.hpp"
8#include "NeonWorkloadFactory.hpp"
9
David Beck0dbe0ee2018-09-24 15:59:27 +010010#include <Layer.hpp>
telsoa014fcda012018-03-09 14:13:49 +000011
Aron Virginas-Tar56055192018-11-12 18:10:43 +000012#include <armnn/Utils.hpp>
telsoa01c577f2c2018-08-31 09:22:23 +010013
Aron Virginas-Tar56055192018-11-12 18:10:43 +000014#include <backendsCommon/CpuTensorHandle.hpp>
Aron Virginas-Tarc9cc8042018-11-01 16:15:57 +000015#include <backendsCommon/MakeWorkloadHelper.hpp>
Aron Virginas-Tar56055192018-11-12 18:10:43 +000016#include <backendsCommon/MemCopyWorkload.hpp>
telsoa014fcda012018-03-09 14:13:49 +000017
Aron Virginas-Tar56055192018-11-12 18:10:43 +000018#include <neon/workloads/NeonWorkloadUtils.hpp>
19#include <neon/workloads/NeonWorkloads.hpp>
20
21#include <boost/core/ignore_unused.hpp>
telsoa014fcda012018-03-09 14:13:49 +000022#include <boost/polymorphic_cast.hpp>
23
24namespace armnn
25{
26
David Beck79141b92018-10-23 16:09:36 +010027namespace
28{
29static const BackendId s_Id{NeonBackendId()};
30}
31
David Beck29c75de2018-10-23 13:35:58 +010032bool NeonWorkloadFactory::IsLayerSupported(const Layer& layer,
33 Optional<DataType> dataType,
telsoa01c577f2c2018-08-31 09:22:23 +010034 std::string& outReasonIfUnsupported)
telsoa014fcda012018-03-09 14:13:49 +000035{
David Beck79141b92018-10-23 16:09:36 +010036 return IWorkloadFactory::IsLayerSupported(s_Id, layer, dataType, outReasonIfUnsupported);
37}
38
39const BackendId& NeonWorkloadFactory::GetBackendId() const
40{
41 return s_Id;
telsoa014fcda012018-03-09 14:13:49 +000042}
43
Aron Virginas-Tar56055192018-11-12 18:10:43 +000044NeonWorkloadFactory::NeonWorkloadFactory(const std::shared_ptr<NeonMemoryManager>& memoryManager)
45 : m_MemoryManager(memoryManager)
surmeh013537c2c2018-05-18 16:31:43 +010046{
47}
48
telsoa014fcda012018-03-09 14:13:49 +000049std::unique_ptr<ITensorHandle> NeonWorkloadFactory::CreateSubTensorHandle(ITensorHandle& parent,
50 TensorShape const& subTensorShape,
51 unsigned int const* subTensorOrigin) const
52{
telsoa014fcda012018-03-09 14:13:49 +000053 const arm_compute::TensorShape shape = armcomputetensorutils::BuildArmComputeTensorShape(subTensorShape);
54
55 arm_compute::Coordinates coords;
56 coords.set_num_dimensions(subTensorShape.GetNumDimensions());
57 for (unsigned int i = 0; i < subTensorShape.GetNumDimensions(); i++)
58 {
telsoa01c577f2c2018-08-31 09:22:23 +010059 // Arm compute indexes tensor coords in reverse order.
telsoa014fcda012018-03-09 14:13:49 +000060 unsigned int revertedIndex = subTensorShape.GetNumDimensions() - i - 1;
61 coords.set(i, boost::numeric_cast<int>(subTensorOrigin[revertedIndex]));
62 }
63
telsoa01c577f2c2018-08-31 09:22:23 +010064 return std::make_unique<NeonSubTensorHandle>(
65 boost::polymorphic_downcast<INeonTensorHandle*>(&parent), shape, coords);
telsoa014fcda012018-03-09 14:13:49 +000066}
67
68std::unique_ptr<ITensorHandle> NeonWorkloadFactory::CreateTensorHandle(const TensorInfo& tensorInfo) const
69{
telsoa01c577f2c2018-08-31 09:22:23 +010070 auto tensorHandle = std::make_unique<NeonTensorHandle>(tensorInfo);
Aron Virginas-Tar56055192018-11-12 18:10:43 +000071 tensorHandle->SetMemoryGroup(m_MemoryManager->GetInterLayerMemoryGroup());
telsoa01c577f2c2018-08-31 09:22:23 +010072
73 return tensorHandle;
telsoa014fcda012018-03-09 14:13:49 +000074}
75
Francis Murtagh351d13d2018-09-24 15:01:18 +010076std::unique_ptr<ITensorHandle> NeonWorkloadFactory::CreateTensorHandle(const TensorInfo& tensorInfo,
77 DataLayout dataLayout) const
78{
79 auto tensorHandle = std::make_unique<NeonTensorHandle>(tensorInfo, dataLayout);
Aron Virginas-Tar56055192018-11-12 18:10:43 +000080 tensorHandle->SetMemoryGroup(m_MemoryManager->GetInterLayerMemoryGroup());
Francis Murtagh351d13d2018-09-24 15:01:18 +010081
82 return tensorHandle;
83}
84
telsoa014fcda012018-03-09 14:13:49 +000085std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateInput(const InputQueueDescriptor& descriptor,
86 const WorkloadInfo& info) const
87{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +010088 return MakeWorkloadHelper<CopyMemGenericWorkload, CopyMemGenericWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +000089}
90
91std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateOutput(const OutputQueueDescriptor& descriptor,
92 const WorkloadInfo& info) const
93{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +010094 return MakeWorkloadHelper<CopyMemGenericWorkload, CopyMemGenericWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +000095}
96
97std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateActivation(const ActivationQueueDescriptor& descriptor,
98 const WorkloadInfo& info) const
99{
Nattapat Chaimanowongd4b70592018-10-12 11:21:49 +0100100 return std::make_unique<NeonActivationWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000101}
102
103std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateSoftmax(const SoftmaxQueueDescriptor& descriptor,
104 const WorkloadInfo& info) const
105{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100106 return MakeWorkloadHelper<NeonSoftmaxFloatWorkload, NeonSoftmaxUint8Workload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000107 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000108}
109
110std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateSplitter(const SplitterQueueDescriptor& descriptor,
111 const WorkloadInfo& info) const
112{
Nattapat Chaimanowong14766d72018-10-12 15:09:53 +0100113 return std::make_unique<NeonSplitterWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000114}
115
116std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateMerger(const MergerQueueDescriptor& descriptor,
117 const WorkloadInfo& info) const
118{
Nattapat Chaimanowongf3eb46d2018-10-12 13:54:09 +0100119 return std::make_unique<NeonMergerWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000120}
121
122std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateFullyConnected(
123 const FullyConnectedQueueDescriptor& descriptor, const WorkloadInfo& info) const
124{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100125 return MakeWorkloadHelper<NeonFullyConnectedWorkload, NeonFullyConnectedWorkload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000126 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000127}
128
129std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreatePermute(const PermuteQueueDescriptor& descriptor,
130 const WorkloadInfo& info) const
131{
Nattapat Chaimanowong1d320062018-10-12 14:14:44 +0100132 return std::make_unique<NeonPermuteWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000133}
134
135std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreatePooling2d(const Pooling2dQueueDescriptor& descriptor,
136 const WorkloadInfo& info) const
137{
Nattapat Chaimanowong5d2e7002018-10-12 16:03:56 +0100138 return std::make_unique<NeonPooling2dWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000139}
140
141std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateConvolution2d(
142 const Convolution2dQueueDescriptor& descriptor, const WorkloadInfo& info) const
143{
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +0100144 return std::make_unique<NeonConvolution2dWorkload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000145 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000146}
147
148std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateDepthwiseConvolution2d(
149 const DepthwiseConvolution2dQueueDescriptor& descriptor, const WorkloadInfo& info) const
150{
Nattapat Chaimanowong77140882018-10-17 11:12:19 +0100151 return std::make_unique<NeonDepthwiseConvolutionWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000152}
153
154std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateNormalization(
155 const NormalizationQueueDescriptor& descriptor, const WorkloadInfo& info) const
156{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100157 return MakeWorkloadHelper<NeonNormalizationFloatWorkload, NullWorkload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000158 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000159}
160
161std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateAddition(const AdditionQueueDescriptor& descriptor,
162 const WorkloadInfo& info) const
163{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100164 return MakeWorkloadHelper<NeonAdditionFloatWorkload, NullWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000165}
166
167std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateMultiplication(
168 const MultiplicationQueueDescriptor& descriptor, const WorkloadInfo& info) const
169{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100170 return MakeWorkloadHelper<NeonMultiplicationFloatWorkload, NullWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000171}
172
Francis Murtaghe7a86a42018-08-29 12:42:10 +0100173std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateDivision(
174 const DivisionQueueDescriptor& descriptor, const WorkloadInfo& info) const
175{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100176 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
Francis Murtaghe7a86a42018-08-29 12:42:10 +0100177}
178
David Beckc2044fe2018-09-05 15:00:38 +0100179std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateSubtraction(
180 const SubtractionQueueDescriptor& descriptor, const WorkloadInfo& info) const
181{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100182 return MakeWorkloadHelper<NeonSubtractionFloatWorkload, NullWorkload>(descriptor, info);
David Beckc2044fe2018-09-05 15:00:38 +0100183}
184
telsoa014fcda012018-03-09 14:13:49 +0000185std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateBatchNormalization(
186 const BatchNormalizationQueueDescriptor& descriptor, const WorkloadInfo& info) const
187{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100188 return MakeWorkloadHelper<NeonBatchNormalizationFloatWorkload, NullWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000189}
190
191std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateMemCopy(const MemCopyQueueDescriptor& descriptor,
192 const WorkloadInfo& info) const
193{
194 if (descriptor.m_Inputs.empty() || !descriptor.m_Inputs[0])
195 {
196 throw InvalidArgumentException("NeonWorkloadFactory: Invalid null input for MemCopy workload");
197 }
198
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100199 return MakeWorkloadHelper<CopyMemGenericWorkload, CopyMemGenericWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000200}
201
202std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateResizeBilinear(
203 const ResizeBilinearQueueDescriptor& descriptor,
204 const WorkloadInfo& info) const
205{
206 return nullptr;
207}
208
209std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateFakeQuantization(
210 const FakeQuantizationQueueDescriptor& descriptor,
211 const WorkloadInfo& info) const
212{
213 return nullptr;
214}
215
216std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateL2Normalization(const L2NormalizationQueueDescriptor& descriptor,
217 const WorkloadInfo& info) const
218{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100219 return MakeWorkloadHelper<NeonL2NormalizationFloatWorkload, NullWorkload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000220 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000221}
222
223std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateConstant(const ConstantQueueDescriptor& descriptor,
224 const WorkloadInfo& info) const
225{
Nattapat Chaimanowong233b3d62018-10-12 12:02:18 +0100226 return std::make_unique<NeonConstantWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000227}
228
229std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateReshape(const ReshapeQueueDescriptor& descriptor,
230 const WorkloadInfo& info) const
231{
Nattapat Chaimanowongcce11fc2018-10-12 16:30:56 +0100232 return std::make_unique<NeonReshapeWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000233}
234
Nattapat Chaimanowong207ef9a2018-11-02 10:57:25 +0000235std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateSpaceToBatchNd(const SpaceToBatchNdQueueDescriptor& descriptor,
236 const WorkloadInfo& info) const
237{
238 return nullptr;
239}
240
telsoa014fcda012018-03-09 14:13:49 +0000241std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateFloor(const FloorQueueDescriptor& descriptor,
242 const WorkloadInfo& info) const
243{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100244 return MakeWorkloadHelper<NeonFloorFloatWorkload, NullWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000245}
246
telsoa01c577f2c2018-08-31 09:22:23 +0100247std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateLstm(const LstmQueueDescriptor& descriptor,
248 const WorkloadInfo& info) const
249{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100250 return MakeWorkloadHelper<NeonLstmFloatWorkload, NullWorkload>(descriptor, info);
telsoa01c577f2c2018-08-31 09:22:23 +0100251}
252
253std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateConvertFp16ToFp32(
254 const ConvertFp16ToFp32QueueDescriptor& descriptor,
255 const WorkloadInfo& info) const
256{
257 return std::make_unique<NeonConvertFp16ToFp32Workload>(descriptor, info);
258}
259
260std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateConvertFp32ToFp16(
261 const ConvertFp32ToFp16QueueDescriptor& descriptor,
262 const WorkloadInfo& info) const
263{
264 return std::make_unique<NeonConvertFp32ToFp16Workload>(descriptor, info);
265}
266
narpra01a6bf9122018-09-10 09:50:09 +0100267std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateMean(const MeanQueueDescriptor& descriptor,
268 const WorkloadInfo& info) const
269{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100270 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
narpra01a6bf9122018-09-10 09:50:09 +0100271}
272
jimfly012c9322a2018-09-19 10:59:49 +0100273std::unique_ptr<IWorkload> NeonWorkloadFactory::CreatePad(const PadQueueDescriptor& descriptor,
274 const WorkloadInfo& info) const
275{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100276 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
jimfly012c9322a2018-09-19 10:59:49 +0100277}
278
Éanna Ó Catháin4e1e1362018-11-12 11:36:34 +0000279std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateBatchToSpaceNd(const BatchToSpaceNdQueueDescriptor& descriptor,
280 const WorkloadInfo& info) const
281{
282 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
283}
284
telsoa01c577f2c2018-08-31 09:22:23 +0100285void NeonWorkloadFactory::Release()
286{
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000287 m_MemoryManager->Release();
telsoa01c577f2c2018-08-31 09:22:23 +0100288}
289
290void NeonWorkloadFactory::Acquire()
291{
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000292 m_MemoryManager->Acquire();
telsoa01c577f2c2018-08-31 09:22:23 +0100293}
294
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000295} // namespace armnn