blob: 16ca2e6e4131c430fafadd7013daed0d1d7c9377 [file] [log] [blame]
//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//
5#include "ClWorkloadFactory.hpp"
David Beck79141b92018-10-23 16:09:36 +01006#include "ClBackendId.hpp"
telsoa014fcda012018-03-09 14:13:49 +00007
Aron Virginas-Tar5caf9072018-11-14 18:35:18 +00008#include <Layer.hpp>
9
David Beck0dbe0ee2018-09-24 15:59:27 +010010#include <armnn/Exceptions.hpp>
11#include <armnn/Utils.hpp>
telsoa014fcda012018-03-09 14:13:49 +000012
Aron Virginas-Tarc9cc8042018-11-01 16:15:57 +000013#include <backendsCommon/CpuTensorHandle.hpp>
Aron Virginas-Tar5caf9072018-11-14 18:35:18 +000014#include <backendsCommon/MakeWorkloadHelper.hpp>
Aron Virginas-Tarc9cc8042018-11-01 16:15:57 +000015#include <backendsCommon/MemCopyWorkload.hpp>
telsoa01c577f2c2018-08-31 09:22:23 +010016
Aron Virginas-Tarc9cc8042018-11-01 16:15:57 +000017#include <cl/ClTensorHandle.hpp>
18#include <cl/workloads/ClWorkloads.hpp>
19#include <cl/workloads/ClWorkloadUtils.hpp>
telsoa014fcda012018-03-09 14:13:49 +000020
Aron Virginas-Tar5caf9072018-11-14 18:35:18 +000021#include <arm_compute/core/CL/CLKernelLibrary.h>
22#include <arm_compute/runtime/CL/CLBufferAllocator.h>
23#include <arm_compute/runtime/CL/CLScheduler.h>
telsoa014fcda012018-03-09 14:13:49 +000024
25#include <boost/polymorphic_cast.hpp>
26#include <boost/format.hpp>
surmeh013537c2c2018-05-18 16:31:43 +010027#include <boost/log/trivial.hpp>
telsoa014fcda012018-03-09 14:13:49 +000028
29namespace armnn
30{
31
David Beck79141b92018-10-23 16:09:36 +010032namespace
33{
34static const BackendId s_Id{ClBackendId()};
35}
36
telsoa01c577f2c2018-08-31 09:22:23 +010037bool ClWorkloadFactory::IsLayerSupported(const Layer& layer,
David Beck29c75de2018-10-23 13:35:58 +010038 Optional<DataType> dataType,
telsoa01c577f2c2018-08-31 09:22:23 +010039 std::string& outReasonIfUnsupported)
telsoa014fcda012018-03-09 14:13:49 +000040{
David Beck79141b92018-10-23 16:09:36 +010041 return IWorkloadFactory::IsLayerSupported(s_Id, layer, dataType, outReasonIfUnsupported);
42}
43
44const BackendId& ClWorkloadFactory::GetBackendId() const
45{
46 return s_Id;
telsoa014fcda012018-03-09 14:13:49 +000047}
48
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +010049template <typename FloatWorkload, typename Uint8Workload, typename QueueDescriptorType, typename... Args>
50std::unique_ptr<IWorkload> ClWorkloadFactory::MakeWorkload(const QueueDescriptorType& descriptor,
51 const WorkloadInfo& info,
52 Args&&... args)
53{
54 try
55 {
56 return MakeWorkloadHelper<FloatWorkload, Uint8Workload>(descriptor, info, std::forward<Args>(args)...);
57 }
58 catch (const cl::Error& clError)
59 {
60 throw WrapClError(clError, CHECK_LOCATION());
61 }
62}
63
64template <typename Workload, typename QueueDescriptorType, typename... Args>
65std::unique_ptr<IWorkload> ClWorkloadFactory::MakeWorkload(const QueueDescriptorType& descriptor,
66 const WorkloadInfo& info,
67 Args&&... args)
68{
69 try
70 {
71 return std::make_unique<Workload>(descriptor, info, std::forward<Args>(args)...);
72 }
73 catch (const cl::Error& clError)
74 {
75 throw WrapClError(clError, CHECK_LOCATION());
76 }
77}
78
Aron Virginas-Tar56055192018-11-12 18:10:43 +000079ClWorkloadFactory::ClWorkloadFactory(const std::shared_ptr<ClMemoryManager>& memoryManager)
80 : m_MemoryManager(memoryManager)
telsoa014fcda012018-03-09 14:13:49 +000081{
telsoa014fcda012018-03-09 14:13:49 +000082}
83
84std::unique_ptr<ITensorHandle> ClWorkloadFactory::CreateTensorHandle(const TensorInfo& tensorInfo) const
85{
telsoa01c577f2c2018-08-31 09:22:23 +010086 std::unique_ptr<ClTensorHandle> tensorHandle = std::make_unique<ClTensorHandle>(tensorInfo);
Aron Virginas-Tar56055192018-11-12 18:10:43 +000087 tensorHandle->SetMemoryGroup(m_MemoryManager->GetInterLayerMemoryGroup());
telsoa01c577f2c2018-08-31 09:22:23 +010088
89 return tensorHandle;
telsoa014fcda012018-03-09 14:13:49 +000090}
91
Francis Murtagh351d13d2018-09-24 15:01:18 +010092std::unique_ptr<ITensorHandle> ClWorkloadFactory::CreateTensorHandle(const TensorInfo& tensorInfo,
93 DataLayout dataLayout) const
94{
95 std::unique_ptr<ClTensorHandle> tensorHandle = std::make_unique<ClTensorHandle>(tensorInfo, dataLayout);
Aron Virginas-Tar56055192018-11-12 18:10:43 +000096 tensorHandle->SetMemoryGroup(m_MemoryManager->GetInterLayerMemoryGroup());
Francis Murtagh351d13d2018-09-24 15:01:18 +010097
98 return tensorHandle;
99}
100
telsoa014fcda012018-03-09 14:13:49 +0000101std::unique_ptr<ITensorHandle> ClWorkloadFactory::CreateSubTensorHandle(ITensorHandle& parent,
102 TensorShape const& subTensorShape,
103 unsigned int const* subTensorOrigin) const
104{
telsoa014fcda012018-03-09 14:13:49 +0000105 arm_compute::Coordinates coords;
106 arm_compute::TensorShape shape = armcomputetensorutils::BuildArmComputeTensorShape(subTensorShape);
107
108 coords.set_num_dimensions(subTensorShape.GetNumDimensions());
109 for (unsigned int i = 0; i < subTensorShape.GetNumDimensions(); i++)
110 {
telsoa01c577f2c2018-08-31 09:22:23 +0100111 // Arm compute indexes tensor coords in reverse order.
telsoa014fcda012018-03-09 14:13:49 +0000112 unsigned int revertedIndex = subTensorShape.GetNumDimensions() - i - 1;
113 coords.set(i, boost::numeric_cast<int>(subTensorOrigin[revertedIndex]));
114 }
115
telsoa01c577f2c2018-08-31 09:22:23 +0100116 return std::make_unique<ClSubTensorHandle>(
117 boost::polymorphic_downcast<IClTensorHandle*>(&parent), shape, coords);
telsoa014fcda012018-03-09 14:13:49 +0000118}
119
120std::unique_ptr<IWorkload> ClWorkloadFactory::CreateInput(const InputQueueDescriptor& descriptor,
121 const WorkloadInfo& info) const
122{
telsoa01c577f2c2018-08-31 09:22:23 +0100123 return MakeWorkload<CopyMemGenericWorkload, CopyMemGenericWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000124}
125
126std::unique_ptr<IWorkload> ClWorkloadFactory::CreateOutput(const OutputQueueDescriptor& descriptor,
127 const WorkloadInfo& info) const
128{
telsoa01c577f2c2018-08-31 09:22:23 +0100129 return MakeWorkload<CopyMemGenericWorkload, CopyMemGenericWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000130}
131
132std::unique_ptr<IWorkload> ClWorkloadFactory::CreateActivation(const ActivationQueueDescriptor& descriptor,
133 const WorkloadInfo& info) const
134{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100135 return MakeWorkload<ClActivationWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000136}
137
138std::unique_ptr<IWorkload> ClWorkloadFactory::CreateSoftmax(const SoftmaxQueueDescriptor& descriptor,
139 const WorkloadInfo& info) const
140{
arovir019e53a352018-08-31 15:26:35 +0100141 return MakeWorkload<ClSoftmaxFloatWorkload, ClSoftmaxUint8Workload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000142 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000143}
144
145std::unique_ptr<IWorkload> ClWorkloadFactory::CreateSplitter(const SplitterQueueDescriptor& descriptor,
146 const WorkloadInfo& info) const
147{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100148 return MakeWorkload<ClSplitterWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000149}
150
151std::unique_ptr<armnn::IWorkload> ClWorkloadFactory::CreateMerger(const MergerQueueDescriptor& descriptor,
152 const WorkloadInfo& info) const
153{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100154 return MakeWorkload<ClMergerWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000155}
156
157std::unique_ptr<armnn::IWorkload> ClWorkloadFactory::CreateFullyConnected(
158 const FullyConnectedQueueDescriptor& descriptor, const WorkloadInfo& info) const
159{
Matthew Benthamab8cdc12018-09-17 11:17:41 +0100160 return MakeWorkload<ClFullyConnectedWorkload, ClFullyConnectedWorkload>(descriptor, info,
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000161 m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000162}
163
164std::unique_ptr<armnn::IWorkload> ClWorkloadFactory::CreatePermute(const PermuteQueueDescriptor& descriptor,
165 const WorkloadInfo& info) const
166{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100167 return MakeWorkload<ClPermuteWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000168}
169
170std::unique_ptr<armnn::IWorkload> ClWorkloadFactory::CreatePooling2d(const Pooling2dQueueDescriptor& descriptor,
171 const WorkloadInfo& info) const
172{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100173 return MakeWorkload<ClPooling2dWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000174}
175
176std::unique_ptr<armnn::IWorkload> ClWorkloadFactory::CreateConvolution2d(const Convolution2dQueueDescriptor& descriptor,
177 const WorkloadInfo& info) const
178{
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000179 return MakeWorkload<ClConvolution2dWorkload>(descriptor, info, m_MemoryManager->GetIntraLayerManager());
telsoa014fcda012018-03-09 14:13:49 +0000180}
181
182std::unique_ptr<IWorkload> ClWorkloadFactory::CreateDepthwiseConvolution2d(
183 const DepthwiseConvolution2dQueueDescriptor& descriptor, const WorkloadInfo& info) const
184{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100185 return MakeWorkload<ClDepthwiseConvolutionWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000186}
187
188std::unique_ptr<armnn::IWorkload> ClWorkloadFactory::CreateNormalization(const NormalizationQueueDescriptor& descriptor,
189 const WorkloadInfo& info) const
190{
arovir019e53a352018-08-31 15:26:35 +0100191 return MakeWorkload<ClNormalizationFloatWorkload, NullWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000192}
193
194std::unique_ptr<armnn::IWorkload> ClWorkloadFactory::CreateAddition(const AdditionQueueDescriptor& descriptor,
195 const WorkloadInfo& info) const
196{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100197 return MakeWorkload<ClAdditionWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000198}
199
200std::unique_ptr<armnn::IWorkload> ClWorkloadFactory::CreateMultiplication(
201 const MultiplicationQueueDescriptor& descriptor, const WorkloadInfo& info) const
202{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100203 return MakeWorkload<ClMultiplicationWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000204}
205
Francis Murtaghe7a86a42018-08-29 12:42:10 +0100206std::unique_ptr<armnn::IWorkload> ClWorkloadFactory::CreateDivision(
207 const DivisionQueueDescriptor& descriptor, const WorkloadInfo& info) const
208{
209 return MakeWorkload<ClDivisionFloatWorkload, NullWorkload>(descriptor, info);
210}
211
David Beckc2044fe2018-09-05 15:00:38 +0100212std::unique_ptr<armnn::IWorkload> ClWorkloadFactory::CreateSubtraction(const SubtractionQueueDescriptor& descriptor,
213 const WorkloadInfo& info) const
214{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100215 return MakeWorkload<ClSubtractionWorkload>(descriptor, info);
David Beckc2044fe2018-09-05 15:00:38 +0100216}
217
telsoa014fcda012018-03-09 14:13:49 +0000218std::unique_ptr<armnn::IWorkload> ClWorkloadFactory::CreateBatchNormalization(
219 const BatchNormalizationQueueDescriptor& descriptor, const WorkloadInfo& info) const
220{
arovir019e53a352018-08-31 15:26:35 +0100221 return MakeWorkload<ClBatchNormalizationFloatWorkload, NullWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000222}
223
224std::unique_ptr<armnn::IWorkload> ClWorkloadFactory::CreateMemCopy(const MemCopyQueueDescriptor& descriptor,
225 const WorkloadInfo& info) const
226{
227 if (descriptor.m_Inputs.empty() || !descriptor.m_Inputs[0])
228 {
229 throw InvalidArgumentException("ClWorkloadFactory: Invalid null input for MemCopy workload");
230 }
231
telsoa01c577f2c2018-08-31 09:22:23 +0100232 return MakeWorkload<CopyMemGenericWorkload, CopyMemGenericWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000233}
234
235std::unique_ptr<armnn::IWorkload> ClWorkloadFactory::CreateResizeBilinear(
236 const ResizeBilinearQueueDescriptor& descriptor,
237 const WorkloadInfo& info) const
238{
arovir019e53a352018-08-31 15:26:35 +0100239 return MakeWorkload<ClResizeBilinearFloatWorkload, NullWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000240}
241
242std::unique_ptr<IWorkload> ClWorkloadFactory::CreateFakeQuantization(
243 const FakeQuantizationQueueDescriptor& descriptor,
244 const WorkloadInfo& info) const
245{
246 return nullptr;
247}
248
249std::unique_ptr<IWorkload> ClWorkloadFactory::CreateL2Normalization(const L2NormalizationQueueDescriptor& descriptor,
250 const WorkloadInfo& info) const
251{
arovir019e53a352018-08-31 15:26:35 +0100252 return MakeWorkload<ClL2NormalizationFloatWorkload, NullWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000253}
254
255std::unique_ptr<IWorkload> ClWorkloadFactory::CreateConstant(const ConstantQueueDescriptor& descriptor,
256 const WorkloadInfo& info) const
257{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100258 return MakeWorkload<ClConstantWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000259}
260
261std::unique_ptr<IWorkload> ClWorkloadFactory::CreateReshape(const ReshapeQueueDescriptor& descriptor,
262 const WorkloadInfo& info) const
263{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100264 return MakeWorkload<ClReshapeWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000265}
266
Nattapat Chaimanowong207ef9a2018-11-02 10:57:25 +0000267std::unique_ptr<IWorkload> ClWorkloadFactory::CreateSpaceToBatchNd(const SpaceToBatchNdQueueDescriptor& descriptor,
268 const WorkloadInfo& info) const
269{
270 return nullptr;
271}
272
telsoa014fcda012018-03-09 14:13:49 +0000273std::unique_ptr<IWorkload> ClWorkloadFactory::CreateFloor(const FloorQueueDescriptor& descriptor,
274 const WorkloadInfo& info) const
275{
arovir019e53a352018-08-31 15:26:35 +0100276 return MakeWorkload<ClFloorFloatWorkload, NullWorkload>(descriptor, info);
telsoa014fcda012018-03-09 14:13:49 +0000277}
278
telsoa01c577f2c2018-08-31 09:22:23 +0100279std::unique_ptr<IWorkload> ClWorkloadFactory::CreateLstm(const LstmQueueDescriptor& descriptor,
280 const WorkloadInfo& info) const
281{
arovir019e53a352018-08-31 15:26:35 +0100282 return MakeWorkload<ClLstmFloatWorkload, NullWorkload>(descriptor, info);
telsoa01c577f2c2018-08-31 09:22:23 +0100283}
284
285std::unique_ptr<IWorkload> ClWorkloadFactory::CreateConvertFp16ToFp32(
286 const ConvertFp16ToFp32QueueDescriptor& descriptor,
287 const WorkloadInfo& info) const
288{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100289 return MakeWorkload<ClConvertFp16ToFp32Workload>(descriptor, info);
telsoa01c577f2c2018-08-31 09:22:23 +0100290}
291
292std::unique_ptr<IWorkload> ClWorkloadFactory::CreateConvertFp32ToFp16(
293 const ConvertFp32ToFp16QueueDescriptor& descriptor,
294 const WorkloadInfo& info) const
295{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100296 return MakeWorkload<ClConvertFp32ToFp16Workload>(descriptor, info);
telsoa01c577f2c2018-08-31 09:22:23 +0100297}
298
Nattapat Chaimanowong5a4304a2018-11-28 10:44:37 +0000299std::unique_ptr<IWorkload> ClWorkloadFactory::CreateMaximum(const MaximumQueueDescriptor& descriptor,
300 const WorkloadInfo& info) const
301{
302 return MakeWorkload<NullWorkload, NullWorkload>(descriptor, info);
303}
304
narpra01a6bf9122018-09-10 09:50:09 +0100305std::unique_ptr<IWorkload> ClWorkloadFactory::CreateMean(const MeanQueueDescriptor& descriptor,
306 const WorkloadInfo& info) const
307{
Matteo Martincigh28dcab62018-10-19 16:40:03 +0100308 return std::make_unique<ClMeanWorkload>(descriptor, info);
narpra01a6bf9122018-09-10 09:50:09 +0100309}
310
jimfly012c9322a2018-09-19 10:59:49 +0100311std::unique_ptr<IWorkload> ClWorkloadFactory::CreatePad(const PadQueueDescriptor& descriptor,
312 const WorkloadInfo& info) const
313{
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100314 return MakeWorkload<ClPadWorkload>(descriptor, info);
jimfly012c9322a2018-09-19 10:59:49 +0100315}
316
FrancisMurtagh20995952018-12-17 12:11:36 +0000317std::unique_ptr<IWorkload> ClWorkloadFactory::CreateEqual(const EqualQueueDescriptor& descriptor,
318 const WorkloadInfo& info) const
319{
320 return MakeWorkload<NullWorkload, NullWorkload>(descriptor, info);
321}
322
Éanna Ó Catháin4e1e1362018-11-12 11:36:34 +0000323std::unique_ptr<IWorkload> ClWorkloadFactory::CreateBatchToSpaceNd(const BatchToSpaceNdQueueDescriptor& descriptor,
324 const WorkloadInfo& info) const
325{
Mike Kelly831faed2018-11-28 11:52:08 +0000326 return MakeWorkload<ClBatchToSpaceNdWorkload>(descriptor, info);
Éanna Ó Catháin4e1e1362018-11-12 11:36:34 +0000327}
328
Conor Kennedy430b5d82018-11-14 15:28:28 +0000329std::unique_ptr<IWorkload> ClWorkloadFactory::CreateStridedSlice(const StridedSliceQueueDescriptor& descriptor,
330 const WorkloadInfo& info) const
331{
332 return MakeWorkload<NullWorkload, NullWorkload>(descriptor, info);
333}
334
kevmay0190539692018-11-29 08:40:19 +0000335std::unique_ptr<IWorkload> ClWorkloadFactory::CreateMinimum(const MinimumQueueDescriptor& descriptor,
336 const WorkloadInfo& info) const
337{
338 return MakeWorkload<NullWorkload, NullWorkload>(descriptor, info);
339}
340
Matteo Martincigh59a950c2018-12-13 12:48:25 +0000341std::unique_ptr<IWorkload> ClWorkloadFactory::CreateGreater(const GreaterQueueDescriptor& descriptor,
342 const WorkloadInfo& info) const
343{
344 return MakeWorkload<NullWorkload, NullWorkload>(descriptor, info);
345}
346
Nattapat Chaimanowonga9a1cf12018-12-03 16:06:49 +0000347std::unique_ptr<IWorkload> ClWorkloadFactory::CreateDebug(const DebugQueueDescriptor& descriptor,
348 const WorkloadInfo& info) const
349{
350 return MakeWorkload<NullWorkload, NullWorkload>(descriptor, info);
351}
352
telsoa014fcda012018-03-09 14:13:49 +0000353} // namespace armnn