blob: 5c7eeccb26a549ef182b21eea7b7688f544dc069 [file] [log] [blame]
//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//
Aron Virginas-Tar56055192018-11-12 18:10:43 +00005
David Beck79141b92018-10-23 16:09:36 +01006#include "NeonBackendId.hpp"
Aron Virginas-Tar56055192018-11-12 18:10:43 +00007#include "NeonTensorHandle.hpp"
8#include "NeonWorkloadFactory.hpp"
9
David Beck0dbe0ee2018-09-24 15:59:27 +010010#include <Layer.hpp>
telsoa014fcda012018-03-09 14:13:49 +000011
Aron Virginas-Tar56055192018-11-12 18:10:43 +000012#include <armnn/Utils.hpp>
telsoa01c577f2c2018-08-31 09:22:23 +010013
Aron Virginas-Tar56055192018-11-12 18:10:43 +000014#include <backendsCommon/CpuTensorHandle.hpp>
Aron Virginas-Tarc9cc8042018-11-01 16:15:57 +000015#include <backendsCommon/MakeWorkloadHelper.hpp>
Aron Virginas-Tar56055192018-11-12 18:10:43 +000016#include <backendsCommon/MemCopyWorkload.hpp>
telsoa014fcda012018-03-09 14:13:49 +000017
Aron Virginas-Tar56055192018-11-12 18:10:43 +000018#include <neon/workloads/NeonWorkloadUtils.hpp>
19#include <neon/workloads/NeonWorkloads.hpp>
20
21#include <boost/core/ignore_unused.hpp>
telsoa014fcda012018-03-09 14:13:49 +000022#include <boost/polymorphic_cast.hpp>
23
24namespace armnn
25{
26
David Beck79141b92018-10-23 16:09:36 +010027namespace
28{
29static const BackendId s_Id{NeonBackendId()};
30}
31
David Beck29c75de2018-10-23 13:35:58 +010032bool NeonWorkloadFactory::IsLayerSupported(const Layer& layer,
33 Optional<DataType> dataType,
telsoa01c577f2c2018-08-31 09:22:23 +010034 std::string& outReasonIfUnsupported)
telsoa014fcda012018-03-09 14:13:49 +000035{
David Beck79141b92018-10-23 16:09:36 +010036 return IWorkloadFactory::IsLayerSupported(s_Id, layer, dataType, outReasonIfUnsupported);
37}
38
39const BackendId& NeonWorkloadFactory::GetBackendId() const
40{
41 return s_Id;
telsoa014fcda012018-03-09 14:13:49 +000042}
43
Aron Virginas-Tar56055192018-11-12 18:10:43 +000044NeonWorkloadFactory::NeonWorkloadFactory(const std::shared_ptr<NeonMemoryManager>& memoryManager)
45 : m_MemoryManager(memoryManager)
surmeh013537c2c2018-05-18 16:31:43 +010046{
47}
48
telsoa014fcda012018-03-09 14:13:49 +000049std::unique_ptr<ITensorHandle> NeonWorkloadFactory::CreateSubTensorHandle(ITensorHandle& parent,
50 TensorShape const& subTensorShape,
51 unsigned int const* subTensorOrigin) const
52{
telsoa014fcda012018-03-09 14:13:49 +000053 const arm_compute::TensorShape shape = armcomputetensorutils::BuildArmComputeTensorShape(subTensorShape);
54
55 arm_compute::Coordinates coords;
56 coords.set_num_dimensions(subTensorShape.GetNumDimensions());
57 for (unsigned int i = 0; i < subTensorShape.GetNumDimensions(); i++)
58 {
telsoa01c577f2c2018-08-31 09:22:23 +010059 // Arm compute indexes tensor coords in reverse order.
telsoa014fcda012018-03-09 14:13:49 +000060 unsigned int revertedIndex = subTensorShape.GetNumDimensions() - i - 1;
61 coords.set(i, boost::numeric_cast<int>(subTensorOrigin[revertedIndex]));
62 }
63
telsoa01c577f2c2018-08-31 09:22:23 +010064 return std::make_unique<NeonSubTensorHandle>(
65 boost::polymorphic_downcast<INeonTensorHandle*>(&parent), shape, coords);
telsoa014fcda012018-03-09 14:13:49 +000066}
67
68std::unique_ptr<ITensorHandle> NeonWorkloadFactory::CreateTensorHandle(const TensorInfo& tensorInfo) const
69{
telsoa01c577f2c2018-08-31 09:22:23 +010070 auto tensorHandle = std::make_unique<NeonTensorHandle>(tensorInfo);
Aron Virginas-Tar56055192018-11-12 18:10:43 +000071 tensorHandle->SetMemoryGroup(m_MemoryManager->GetInterLayerMemoryGroup());
telsoa01c577f2c2018-08-31 09:22:23 +010072
73 return tensorHandle;
telsoa014fcda012018-03-09 14:13:49 +000074}
75
Francis Murtagh351d13d2018-09-24 15:01:18 +010076std::unique_ptr<ITensorHandle> NeonWorkloadFactory::CreateTensorHandle(const TensorInfo& tensorInfo,
77 DataLayout dataLayout) const
78{
79 auto tensorHandle = std::make_unique<NeonTensorHandle>(tensorInfo, dataLayout);
Aron Virginas-Tar56055192018-11-12 18:10:43 +000080 tensorHandle->SetMemoryGroup(m_MemoryManager->GetInterLayerMemoryGroup());
Francis Murtagh351d13d2018-09-24 15:01:18 +010081
82 return tensorHandle;
83}
84
telsoa014fcda012018-03-09 14:13:49 +000085std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateInput(const InputQueueDescriptor& descriptor,
86 const WorkloadInfo& info) const
87{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +010088 return MakeWorkloadHelper<CopyMemGenericWorkload, CopyMemGenericWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +000089}
90
91std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateOutput(const OutputQueueDescriptor& descriptor,
92 const WorkloadInfo& info) const
93{
kevmay012b4d88e2019-01-24 14:05:09 +000094 return MakeWorkloadHelper<CopyMemGenericWorkload, CopyMemGenericWorkload,
95 CopyMemGenericWorkload, NullWorkload, CopyMemGenericWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +000096}
97
98std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateActivation(const ActivationQueueDescriptor& descriptor,
99 const WorkloadInfo& info) const
100{
Nattapat Chaimanowongd4b70592018-10-12 11:21:49 +0100101 return std::make_unique<NeonActivationWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000102}
103
104std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateSoftmax(const SoftmaxQueueDescriptor& descriptor,
105 const WorkloadInfo& info) const
106{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100107 return MakeWorkloadHelper<NeonSoftmaxFloatWorkload, NeonSoftmaxUint8Workload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000108 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000109}
110
111std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateSplitter(const SplitterQueueDescriptor& descriptor,
112 const WorkloadInfo& info) const
113{
Nattapat Chaimanowong14766d72018-10-12 15:09:53 +0100114 return std::make_unique<NeonSplitterWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000115}
116
117std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateMerger(const MergerQueueDescriptor& descriptor,
118 const WorkloadInfo& info) const
119{
Nattapat Chaimanowongf3eb46d2018-10-12 13:54:09 +0100120 return std::make_unique<NeonMergerWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000121}
122
123std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateFullyConnected(
124 const FullyConnectedQueueDescriptor& descriptor, const WorkloadInfo& info) const
125{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100126 return MakeWorkloadHelper<NeonFullyConnectedWorkload, NeonFullyConnectedWorkload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000127 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000128}
129
130std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreatePermute(const PermuteQueueDescriptor& descriptor,
131 const WorkloadInfo& info) const
132{
Nattapat Chaimanowong1d320062018-10-12 14:14:44 +0100133 return std::make_unique<NeonPermuteWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000134}
135
136std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreatePooling2d(const Pooling2dQueueDescriptor& descriptor,
137 const WorkloadInfo& info) const
138{
Nattapat Chaimanowong5d2e7002018-10-12 16:03:56 +0100139 return std::make_unique<NeonPooling2dWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000140}
141
142std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateConvolution2d(
143 const Convolution2dQueueDescriptor& descriptor, const WorkloadInfo& info) const
144{
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +0100145 return std::make_unique<NeonConvolution2dWorkload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000146 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000147}
148
149std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateDepthwiseConvolution2d(
150 const DepthwiseConvolution2dQueueDescriptor& descriptor, const WorkloadInfo& info) const
151{
Nattapat Chaimanowong77140882018-10-17 11:12:19 +0100152 return std::make_unique<NeonDepthwiseConvolutionWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000153}
154
Narumol Prangnawarat94dd5d82019-01-23 18:06:26 +0000155std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateDetectionPostProcess(
156 const armnn::DetectionPostProcessQueueDescriptor& descriptor, const armnn::WorkloadInfo& info) const
157{
158 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
159}
160
telsoa014fcda012018-03-09 14:13:49 +0000161std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateNormalization(
162 const NormalizationQueueDescriptor& descriptor, const WorkloadInfo& info) const
163{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100164 return MakeWorkloadHelper<NeonNormalizationFloatWorkload, NullWorkload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000165 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000166}
167
168std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateAddition(const AdditionQueueDescriptor& descriptor,
169 const WorkloadInfo& info) const
170{
Matthew Bentham955258d2018-12-10 10:48:52 +0000171 return std::make_unique<NeonAdditionWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000172}
173
174std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateMultiplication(
175 const MultiplicationQueueDescriptor& descriptor, const WorkloadInfo& info) const
176{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100177 return MakeWorkloadHelper<NeonMultiplicationFloatWorkload, NullWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000178}
179
Francis Murtaghe7a86a42018-08-29 12:42:10 +0100180std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateDivision(
181 const DivisionQueueDescriptor& descriptor, const WorkloadInfo& info) const
182{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100183 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
Francis Murtaghe7a86a42018-08-29 12:42:10 +0100184}
185
David Beckc2044fe2018-09-05 15:00:38 +0100186std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateSubtraction(
187 const SubtractionQueueDescriptor& descriptor, const WorkloadInfo& info) const
188{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100189 return MakeWorkloadHelper<NeonSubtractionFloatWorkload, NullWorkload>(descriptor, info);
David Beckc2044fe2018-09-05 15:00:38 +0100190}
191
telsoa014fcda012018-03-09 14:13:49 +0000192std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateBatchNormalization(
193 const BatchNormalizationQueueDescriptor& descriptor, const WorkloadInfo& info) const
194{
Matthew Benthamc48ac8c2018-12-12 16:15:59 +0000195 return std::make_unique<NeonBatchNormalizationWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000196}
197
198std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateMemCopy(const MemCopyQueueDescriptor& descriptor,
199 const WorkloadInfo& info) const
200{
201 if (descriptor.m_Inputs.empty() || !descriptor.m_Inputs[0])
202 {
203 throw InvalidArgumentException("NeonWorkloadFactory: Invalid null input for MemCopy workload");
204 }
205
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100206 return MakeWorkloadHelper<CopyMemGenericWorkload, CopyMemGenericWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000207}
208
209std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateResizeBilinear(
210 const ResizeBilinearQueueDescriptor& descriptor,
211 const WorkloadInfo& info) const
212{
Sadik Armaganc625f002018-12-17 11:32:16 +0000213 return std::make_unique<NeonResizeBilinearWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000214}
215
216std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateFakeQuantization(
217 const FakeQuantizationQueueDescriptor& descriptor,
218 const WorkloadInfo& info) const
219{
220 return nullptr;
221}
222
223std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateL2Normalization(const L2NormalizationQueueDescriptor& descriptor,
224 const WorkloadInfo& info) const
225{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100226 return MakeWorkloadHelper<NeonL2NormalizationFloatWorkload, NullWorkload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000227 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000228}
229
230std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateConstant(const ConstantQueueDescriptor& descriptor,
231 const WorkloadInfo& info) const
232{
Nattapat Chaimanowong233b3d62018-10-12 12:02:18 +0100233 return std::make_unique<NeonConstantWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000234}
235
236std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateReshape(const ReshapeQueueDescriptor& descriptor,
237 const WorkloadInfo& info) const
238{
Nattapat Chaimanowongcce11fc2018-10-12 16:30:56 +0100239 return std::make_unique<NeonReshapeWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000240}
241
Nattapat Chaimanowong207ef9a2018-11-02 10:57:25 +0000242std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateSpaceToBatchNd(const SpaceToBatchNdQueueDescriptor& descriptor,
243 const WorkloadInfo& info) const
244{
245 return nullptr;
246}
247
telsoa014fcda012018-03-09 14:13:49 +0000248std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateFloor(const FloorQueueDescriptor& descriptor,
249 const WorkloadInfo& info) const
250{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100251 return MakeWorkloadHelper<NeonFloorFloatWorkload, NullWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000252}
253
telsoa01c577f2c2018-08-31 09:22:23 +0100254std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateLstm(const LstmQueueDescriptor& descriptor,
255 const WorkloadInfo& info) const
256{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100257 return MakeWorkloadHelper<NeonLstmFloatWorkload, NullWorkload>(descriptor, info);
telsoa01c577f2c2018-08-31 09:22:23 +0100258}
259
260std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateConvertFp16ToFp32(
261 const ConvertFp16ToFp32QueueDescriptor& descriptor,
262 const WorkloadInfo& info) const
263{
264 return std::make_unique<NeonConvertFp16ToFp32Workload>(descriptor, info);
265}
266
267std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateConvertFp32ToFp16(
268 const ConvertFp32ToFp16QueueDescriptor& descriptor,
269 const WorkloadInfo& info) const
270{
271 return std::make_unique<NeonConvertFp32ToFp16Workload>(descriptor, info);
272}
273
Nattapat Chaimanowong5a4304a2018-11-28 10:44:37 +0000274std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateMaximum(const MaximumQueueDescriptor& descriptor,
275 const WorkloadInfo& info) const
276{
Nattapat Chaimanowong4e6597a2018-12-20 14:14:06 +0000277 return std::make_unique<NeonMaximumWorkload>(descriptor, info);
Nattapat Chaimanowong5a4304a2018-11-28 10:44:37 +0000278}
279
narpra01a6bf9122018-09-10 09:50:09 +0100280std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateMean(const MeanQueueDescriptor& descriptor,
281 const WorkloadInfo& info) const
282{
Matthew Benthamfd899962018-12-31 15:49:42 +0000283 return std::make_unique<NeonMeanWorkload>(descriptor, info);
narpra01a6bf9122018-09-10 09:50:09 +0100284}
285
jimfly012c9322a2018-09-19 10:59:49 +0100286std::unique_ptr<IWorkload> NeonWorkloadFactory::CreatePad(const PadQueueDescriptor& descriptor,
287 const WorkloadInfo& info) const
288{
Éanna Ó Catháin12055742019-01-25 10:01:40 +0000289 return std::make_unique<NeonPadWorkload>(descriptor, info);
jimfly012c9322a2018-09-19 10:59:49 +0100290}
291
FrancisMurtagh20995952018-12-17 12:11:36 +0000292std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateEqual(const EqualQueueDescriptor& descriptor,
293 const WorkloadInfo& info) const
294{
295 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
296}
297
Éanna Ó Catháin4e1e1362018-11-12 11:36:34 +0000298std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateBatchToSpaceNd(const BatchToSpaceNdQueueDescriptor& descriptor,
299 const WorkloadInfo& info) const
300{
301 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
302}
303
Conor Kennedy430b5d82018-11-14 15:28:28 +0000304std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateStridedSlice(const StridedSliceQueueDescriptor& descriptor,
305 const WorkloadInfo& info) const
306{
307 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
308}
309
kevmay0190539692018-11-29 08:40:19 +0000310std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateMinimum(const MinimumQueueDescriptor& descriptor,
311 const WorkloadInfo& info) const
312{
Conor Kennedy54b21692019-01-09 07:57:38 +0000313 return std::make_unique<NeonMinimumWorkload>(descriptor, info);
kevmay0190539692018-11-29 08:40:19 +0000314}
315
Matteo Martincigh59a950c2018-12-13 12:48:25 +0000316std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateGreater(const GreaterQueueDescriptor& descriptor,
317 const WorkloadInfo& info) const
318{
319 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
320}
321
Nattapat Chaimanowonga9a1cf12018-12-03 16:06:49 +0000322std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateDebug(const DebugQueueDescriptor& descriptor,
323 const WorkloadInfo& info) const
324{
325 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
326}
327
Mohamed Nour Abouelseouda1d3c6a2018-12-27 12:39:16 +0000328std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateRsqrt(const RsqrtQueueDescriptor &descriptor,
329 const WorkloadInfo &info) const
330{
331 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
332}
333
Matteo Martincigh49124022019-01-11 13:25:59 +0000334std::unique_ptr<IWorkload> NeonWorkloadFactory::CreatePreCompiled(const PreCompiledQueueDescriptor& descriptor,
335 const WorkloadInfo& info) const
336{
337 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
338}
339
narpra01b89b05f2019-01-16 09:53:09 +0000340std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateGather(const armnn::GatherQueueDescriptor& descriptor,
341 const armnn::WorkloadInfo& info) const
342{
343 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
344}
345
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000346} // namespace armnn