blob: 8db5f9ad84a9d7e6ff79eadcea24eb3698f0df9c [file] [log] [blame]
//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//
Aron Virginas-Tar56055192018-11-12 18:10:43 +00005
David Beck79141b92018-10-23 16:09:36 +01006#include "NeonBackendId.hpp"
Aron Virginas-Tar56055192018-11-12 18:10:43 +00007#include "NeonTensorHandle.hpp"
8#include "NeonWorkloadFactory.hpp"
9
David Beck0dbe0ee2018-09-24 15:59:27 +010010#include <Layer.hpp>
telsoa014fcda012018-03-09 14:13:49 +000011
Aron Virginas-Tar56055192018-11-12 18:10:43 +000012#include <armnn/Utils.hpp>
telsoa01c577f2c2018-08-31 09:22:23 +010013
Aron Virginas-Tar56055192018-11-12 18:10:43 +000014#include <backendsCommon/CpuTensorHandle.hpp>
Aron Virginas-Tarc9cc8042018-11-01 16:15:57 +000015#include <backendsCommon/MakeWorkloadHelper.hpp>
Aron Virginas-Tar56055192018-11-12 18:10:43 +000016#include <backendsCommon/MemCopyWorkload.hpp>
telsoa014fcda012018-03-09 14:13:49 +000017
Aron Virginas-Tar56055192018-11-12 18:10:43 +000018#include <neon/workloads/NeonWorkloadUtils.hpp>
19#include <neon/workloads/NeonWorkloads.hpp>
20
21#include <boost/core/ignore_unused.hpp>
telsoa014fcda012018-03-09 14:13:49 +000022#include <boost/polymorphic_cast.hpp>
23
24namespace armnn
25{
26
David Beck79141b92018-10-23 16:09:36 +010027namespace
28{
29static const BackendId s_Id{NeonBackendId()};
30}
31
David Beck29c75de2018-10-23 13:35:58 +010032bool NeonWorkloadFactory::IsLayerSupported(const Layer& layer,
33 Optional<DataType> dataType,
telsoa01c577f2c2018-08-31 09:22:23 +010034 std::string& outReasonIfUnsupported)
telsoa014fcda012018-03-09 14:13:49 +000035{
David Beck79141b92018-10-23 16:09:36 +010036 return IWorkloadFactory::IsLayerSupported(s_Id, layer, dataType, outReasonIfUnsupported);
37}
38
39const BackendId& NeonWorkloadFactory::GetBackendId() const
40{
41 return s_Id;
telsoa014fcda012018-03-09 14:13:49 +000042}
43
Aron Virginas-Tar56055192018-11-12 18:10:43 +000044NeonWorkloadFactory::NeonWorkloadFactory(const std::shared_ptr<NeonMemoryManager>& memoryManager)
45 : m_MemoryManager(memoryManager)
surmeh013537c2c2018-05-18 16:31:43 +010046{
47}
48
telsoa014fcda012018-03-09 14:13:49 +000049std::unique_ptr<ITensorHandle> NeonWorkloadFactory::CreateSubTensorHandle(ITensorHandle& parent,
50 TensorShape const& subTensorShape,
51 unsigned int const* subTensorOrigin) const
52{
telsoa014fcda012018-03-09 14:13:49 +000053 const arm_compute::TensorShape shape = armcomputetensorutils::BuildArmComputeTensorShape(subTensorShape);
54
55 arm_compute::Coordinates coords;
56 coords.set_num_dimensions(subTensorShape.GetNumDimensions());
57 for (unsigned int i = 0; i < subTensorShape.GetNumDimensions(); i++)
58 {
telsoa01c577f2c2018-08-31 09:22:23 +010059 // Arm compute indexes tensor coords in reverse order.
telsoa014fcda012018-03-09 14:13:49 +000060 unsigned int revertedIndex = subTensorShape.GetNumDimensions() - i - 1;
61 coords.set(i, boost::numeric_cast<int>(subTensorOrigin[revertedIndex]));
62 }
63
Derek Lamberti0790dce2019-04-15 18:37:35 +010064 const arm_compute::TensorShape parentShape = armcomputetensorutils::BuildArmComputeTensorShape(parent.GetShape());
65 if (!::arm_compute::error_on_invalid_subtensor(__func__, __FILE__, __LINE__, parentShape, coords, shape))
66 {
67 return nullptr;
68 }
69
telsoa01c577f2c2018-08-31 09:22:23 +010070 return std::make_unique<NeonSubTensorHandle>(
71 boost::polymorphic_downcast<INeonTensorHandle*>(&parent), shape, coords);
telsoa014fcda012018-03-09 14:13:49 +000072}
73
74std::unique_ptr<ITensorHandle> NeonWorkloadFactory::CreateTensorHandle(const TensorInfo& tensorInfo) const
75{
telsoa01c577f2c2018-08-31 09:22:23 +010076 auto tensorHandle = std::make_unique<NeonTensorHandle>(tensorInfo);
Aron Virginas-Tar56055192018-11-12 18:10:43 +000077 tensorHandle->SetMemoryGroup(m_MemoryManager->GetInterLayerMemoryGroup());
telsoa01c577f2c2018-08-31 09:22:23 +010078
79 return tensorHandle;
telsoa014fcda012018-03-09 14:13:49 +000080}
81
Francis Murtagh351d13d2018-09-24 15:01:18 +010082std::unique_ptr<ITensorHandle> NeonWorkloadFactory::CreateTensorHandle(const TensorInfo& tensorInfo,
83 DataLayout dataLayout) const
84{
85 auto tensorHandle = std::make_unique<NeonTensorHandle>(tensorInfo, dataLayout);
Aron Virginas-Tar56055192018-11-12 18:10:43 +000086 tensorHandle->SetMemoryGroup(m_MemoryManager->GetInterLayerMemoryGroup());
Francis Murtagh351d13d2018-09-24 15:01:18 +010087
88 return tensorHandle;
89}
90
telsoa014fcda012018-03-09 14:13:49 +000091std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateInput(const InputQueueDescriptor& descriptor,
92 const WorkloadInfo& info) const
93{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +010094 return MakeWorkloadHelper<CopyMemGenericWorkload, CopyMemGenericWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +000095}
96
97std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateOutput(const OutputQueueDescriptor& descriptor,
98 const WorkloadInfo& info) const
99{
kevmay012b4d88e2019-01-24 14:05:09 +0000100 return MakeWorkloadHelper<CopyMemGenericWorkload, CopyMemGenericWorkload,
101 CopyMemGenericWorkload, NullWorkload, CopyMemGenericWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000102}
103
104std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateActivation(const ActivationQueueDescriptor& descriptor,
105 const WorkloadInfo& info) const
106{
Nattapat Chaimanowongd4b70592018-10-12 11:21:49 +0100107 return std::make_unique<NeonActivationWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000108}
109
110std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateSoftmax(const SoftmaxQueueDescriptor& descriptor,
111 const WorkloadInfo& info) const
112{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100113 return MakeWorkloadHelper<NeonSoftmaxFloatWorkload, NeonSoftmaxUint8Workload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000114 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000115}
116
117std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateSplitter(const SplitterQueueDescriptor& descriptor,
118 const WorkloadInfo& info) const
119{
Nattapat Chaimanowong14766d72018-10-12 15:09:53 +0100120 return std::make_unique<NeonSplitterWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000121}
122
123std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateMerger(const MergerQueueDescriptor& descriptor,
124 const WorkloadInfo& info) const
125{
Nattapat Chaimanowongf3eb46d2018-10-12 13:54:09 +0100126 return std::make_unique<NeonMergerWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000127}
128
129std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateFullyConnected(
130 const FullyConnectedQueueDescriptor& descriptor, const WorkloadInfo& info) const
131{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100132 return MakeWorkloadHelper<NeonFullyConnectedWorkload, NeonFullyConnectedWorkload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000133 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000134}
135
136std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreatePermute(const PermuteQueueDescriptor& descriptor,
137 const WorkloadInfo& info) const
138{
Nattapat Chaimanowong1d320062018-10-12 14:14:44 +0100139 return std::make_unique<NeonPermuteWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000140}
141
142std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreatePooling2d(const Pooling2dQueueDescriptor& descriptor,
143 const WorkloadInfo& info) const
144{
Nattapat Chaimanowong5d2e7002018-10-12 16:03:56 +0100145 return std::make_unique<NeonPooling2dWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000146}
147
148std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateConvolution2d(
149 const Convolution2dQueueDescriptor& descriptor, const WorkloadInfo& info) const
150{
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +0100151 return std::make_unique<NeonConvolution2dWorkload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000152 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000153}
154
155std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateDepthwiseConvolution2d(
156 const DepthwiseConvolution2dQueueDescriptor& descriptor, const WorkloadInfo& info) const
157{
Nattapat Chaimanowong77140882018-10-17 11:12:19 +0100158 return std::make_unique<NeonDepthwiseConvolutionWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000159}
160
Narumol Prangnawarat94dd5d82019-01-23 18:06:26 +0000161std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateDetectionPostProcess(
162 const armnn::DetectionPostProcessQueueDescriptor& descriptor, const armnn::WorkloadInfo& info) const
163{
164 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
165}
166
telsoa014fcda012018-03-09 14:13:49 +0000167std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateNormalization(
168 const NormalizationQueueDescriptor& descriptor, const WorkloadInfo& info) const
169{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100170 return MakeWorkloadHelper<NeonNormalizationFloatWorkload, NullWorkload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000171 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000172}
173
174std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateAddition(const AdditionQueueDescriptor& descriptor,
175 const WorkloadInfo& info) const
176{
Matthew Bentham955258d2018-12-10 10:48:52 +0000177 return std::make_unique<NeonAdditionWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000178}
179
180std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateMultiplication(
181 const MultiplicationQueueDescriptor& descriptor, const WorkloadInfo& info) const
182{
Conor Kennedyb99480b2019-03-08 08:24:41 +0000183 return std::make_unique<NeonMultiplicationWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000184}
185
Francis Murtaghe7a86a42018-08-29 12:42:10 +0100186std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateDivision(
187 const DivisionQueueDescriptor& descriptor, const WorkloadInfo& info) const
188{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100189 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
Francis Murtaghe7a86a42018-08-29 12:42:10 +0100190}
191
David Beckc2044fe2018-09-05 15:00:38 +0100192std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateSubtraction(
193 const SubtractionQueueDescriptor& descriptor, const WorkloadInfo& info) const
194{
Conor Kennedyb99480b2019-03-08 08:24:41 +0000195 return std::make_unique<NeonSubtractionWorkload>(descriptor, info);
David Beckc2044fe2018-09-05 15:00:38 +0100196}
197
telsoa014fcda012018-03-09 14:13:49 +0000198std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateBatchNormalization(
199 const BatchNormalizationQueueDescriptor& descriptor, const WorkloadInfo& info) const
200{
Matthew Benthamc48ac8c2018-12-12 16:15:59 +0000201 return std::make_unique<NeonBatchNormalizationWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000202}
203
204std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateMemCopy(const MemCopyQueueDescriptor& descriptor,
205 const WorkloadInfo& info) const
206{
207 if (descriptor.m_Inputs.empty() || !descriptor.m_Inputs[0])
208 {
209 throw InvalidArgumentException("NeonWorkloadFactory: Invalid null input for MemCopy workload");
210 }
211
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100212 return MakeWorkloadHelper<CopyMemGenericWorkload, CopyMemGenericWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000213}
214
215std::unique_ptr<armnn::IWorkload> NeonWorkloadFactory::CreateResizeBilinear(
216 const ResizeBilinearQueueDescriptor& descriptor,
217 const WorkloadInfo& info) const
218{
Sadik Armaganc625f002018-12-17 11:32:16 +0000219 return std::make_unique<NeonResizeBilinearWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000220}
221
222std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateFakeQuantization(
223 const FakeQuantizationQueueDescriptor& descriptor,
224 const WorkloadInfo& info) const
225{
226 return nullptr;
227}
228
229std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateL2Normalization(const L2NormalizationQueueDescriptor& descriptor,
230 const WorkloadInfo& info) const
231{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100232 return MakeWorkloadHelper<NeonL2NormalizationFloatWorkload, NullWorkload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000233 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000234}
235
236std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateConstant(const ConstantQueueDescriptor& descriptor,
237 const WorkloadInfo& info) const
238{
Nattapat Chaimanowong233b3d62018-10-12 12:02:18 +0100239 return std::make_unique<NeonConstantWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000240}
241
242std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateReshape(const ReshapeQueueDescriptor& descriptor,
243 const WorkloadInfo& info) const
244{
Nattapat Chaimanowongcce11fc2018-10-12 16:30:56 +0100245 return std::make_unique<NeonReshapeWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000246}
247
Nattapat Chaimanowong207ef9a2018-11-02 10:57:25 +0000248std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateSpaceToBatchNd(const SpaceToBatchNdQueueDescriptor& descriptor,
249 const WorkloadInfo& info) const
250{
251 return nullptr;
252}
253
telsoa014fcda012018-03-09 14:13:49 +0000254std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateFloor(const FloorQueueDescriptor& descriptor,
255 const WorkloadInfo& info) const
256{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100257 return MakeWorkloadHelper<NeonFloorFloatWorkload, NullWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000258}
259
telsoa01c577f2c2018-08-31 09:22:23 +0100260std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateLstm(const LstmQueueDescriptor& descriptor,
261 const WorkloadInfo& info) const
262{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100263 return MakeWorkloadHelper<NeonLstmFloatWorkload, NullWorkload>(descriptor, info);
telsoa01c577f2c2018-08-31 09:22:23 +0100264}
265
266std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateConvertFp16ToFp32(
267 const ConvertFp16ToFp32QueueDescriptor& descriptor,
268 const WorkloadInfo& info) const
269{
270 return std::make_unique<NeonConvertFp16ToFp32Workload>(descriptor, info);
271}
272
273std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateConvertFp32ToFp16(
274 const ConvertFp32ToFp16QueueDescriptor& descriptor,
275 const WorkloadInfo& info) const
276{
277 return std::make_unique<NeonConvertFp32ToFp16Workload>(descriptor, info);
278}
279
Nattapat Chaimanowong5a4304a2018-11-28 10:44:37 +0000280std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateMaximum(const MaximumQueueDescriptor& descriptor,
281 const WorkloadInfo& info) const
282{
Nattapat Chaimanowong4e6597a2018-12-20 14:14:06 +0000283 return std::make_unique<NeonMaximumWorkload>(descriptor, info);
Nattapat Chaimanowong5a4304a2018-11-28 10:44:37 +0000284}
285
narpra01a6bf9122018-09-10 09:50:09 +0100286std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateMean(const MeanQueueDescriptor& descriptor,
287 const WorkloadInfo& info) const
288{
Matthew Benthamfd899962018-12-31 15:49:42 +0000289 return std::make_unique<NeonMeanWorkload>(descriptor, info);
narpra01a6bf9122018-09-10 09:50:09 +0100290}
291
jimfly012c9322a2018-09-19 10:59:49 +0100292std::unique_ptr<IWorkload> NeonWorkloadFactory::CreatePad(const PadQueueDescriptor& descriptor,
293 const WorkloadInfo& info) const
294{
Éanna Ó Catháin12055742019-01-25 10:01:40 +0000295 return std::make_unique<NeonPadWorkload>(descriptor, info);
jimfly012c9322a2018-09-19 10:59:49 +0100296}
297
FrancisMurtagh20995952018-12-17 12:11:36 +0000298std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateEqual(const EqualQueueDescriptor& descriptor,
299 const WorkloadInfo& info) const
300{
301 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
302}
303
Éanna Ó Catháin4e1e1362018-11-12 11:36:34 +0000304std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateBatchToSpaceNd(const BatchToSpaceNdQueueDescriptor& descriptor,
305 const WorkloadInfo& info) const
306{
307 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
308}
309
Conor Kennedy430b5d82018-11-14 15:28:28 +0000310std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateStridedSlice(const StridedSliceQueueDescriptor& descriptor,
311 const WorkloadInfo& info) const
312{
313 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
314}
315
kevmay0190539692018-11-29 08:40:19 +0000316std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateMinimum(const MinimumQueueDescriptor& descriptor,
317 const WorkloadInfo& info) const
318{
Conor Kennedy54b21692019-01-09 07:57:38 +0000319 return std::make_unique<NeonMinimumWorkload>(descriptor, info);
kevmay0190539692018-11-29 08:40:19 +0000320}
321
Matteo Martincigh59a950c2018-12-13 12:48:25 +0000322std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateGreater(const GreaterQueueDescriptor& descriptor,
323 const WorkloadInfo& info) const
324{
kevmay01eed85922019-01-28 08:37:25 +0000325 return MakeWorkloadHelper<NeonGreaterFloat32Workload, NeonGreaterUint8Workload>(descriptor, info);
Matteo Martincigh59a950c2018-12-13 12:48:25 +0000326}
327
Nattapat Chaimanowonga9a1cf12018-12-03 16:06:49 +0000328std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateDebug(const DebugQueueDescriptor& descriptor,
329 const WorkloadInfo& info) const
330{
331 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
332}
333
Mohamed Nour Abouelseouda1d3c6a2018-12-27 12:39:16 +0000334std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateRsqrt(const RsqrtQueueDescriptor &descriptor,
335 const WorkloadInfo &info) const
336{
337 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
338}
339
Matteo Martincigh49124022019-01-11 13:25:59 +0000340std::unique_ptr<IWorkload> NeonWorkloadFactory::CreatePreCompiled(const PreCompiledQueueDescriptor& descriptor,
341 const WorkloadInfo& info) const
342{
343 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
344}
345
narpra01b89b05f2019-01-16 09:53:09 +0000346std::unique_ptr<IWorkload> NeonWorkloadFactory::CreateGather(const armnn::GatherQueueDescriptor& descriptor,
347 const armnn::WorkloadInfo& info) const
348{
349 return MakeWorkloadHelper<NullWorkload, NullWorkload>(descriptor, info);
350}
351
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000352} // namespace armnn