blob: 134dad576e8460dccd855a80293b5c776ca7026d [file] [log] [blame]
Laurent Carlier749294b2020-06-01 09:03:17 +01001//
Teresa Charlin8398edc2020-07-20 14:23:02 +01002// Copyright © 2017 Arm Ltd and Contributors. All rights reserved.
David Beckecb56cd2018-09-05 12:52:57 +01003// SPDX-License-Identifier: MIT
telsoa014fcda012018-03-09 14:13:49 +00004//
5#include "ClWorkloadFactory.hpp"
David Beck79141b92018-10-23 16:09:36 +01006#include "ClBackendId.hpp"
Sadik Armagan04a72972020-09-14 15:44:18 +01007#include "ClBackendModelContext.hpp"
Matthew Sloyan80fbcd52021-01-07 13:28:47 +00008#include "ClContextDeserializer.hpp"
9#include "ClContextSerializer.hpp"
telsoa014fcda012018-03-09 14:13:49 +000010
Aron Virginas-Tar5caf9072018-11-14 18:35:18 +000011#include <Layer.hpp>
12
David Beck0dbe0ee2018-09-24 15:59:27 +010013#include <armnn/Exceptions.hpp>
14#include <armnn/Utils.hpp>
Jan Eilers8eb25602020-03-09 12:13:48 +000015#include <armnn/utility/IgnoreUnused.hpp>
Matthew Sloyan171214c2020-09-09 09:07:37 +010016#include <armnn/utility/NumericCast.hpp>
Jan Eilersbb446e52020-04-02 13:56:54 +010017#include <armnn/utility/PolymorphicDowncast.hpp>
telsoa014fcda012018-03-09 14:13:49 +000018
Aron Virginas-Tar5caf9072018-11-14 18:35:18 +000019#include <backendsCommon/MakeWorkloadHelper.hpp>
Aron Virginas-Tarc9cc8042018-11-01 16:15:57 +000020#include <backendsCommon/MemCopyWorkload.hpp>
Derek Lambertif674aa02019-08-01 15:56:25 +010021#include <backendsCommon/MemImportWorkload.hpp>
James Conroy1f58f032021-04-27 17:13:27 +010022#include <backendsCommon/TensorHandle.hpp>
telsoa01c577f2c2018-08-31 09:22:23 +010023
Aron Virginas-Tarc9cc8042018-11-01 16:15:57 +000024#include <cl/ClTensorHandle.hpp>
25#include <cl/workloads/ClWorkloads.hpp>
26#include <cl/workloads/ClWorkloadUtils.hpp>
telsoa014fcda012018-03-09 14:13:49 +000027
Aron Virginas-Tar5caf9072018-11-14 18:35:18 +000028#include <arm_compute/core/CL/CLKernelLibrary.h>
29#include <arm_compute/runtime/CL/CLBufferAllocator.h>
30#include <arm_compute/runtime/CL/CLScheduler.h>
telsoa014fcda012018-03-09 14:13:49 +000031
Rob Hughes9542f902021-07-14 09:48:54 +010032#include <armnnUtils/Filesystem.hpp>
Matthew Sloyan80fbcd52021-01-07 13:28:47 +000033#include <fstream>
Sadik Armagandea8fb62020-11-26 10:38:11 +000034
Sadik Armaganb7851f92021-10-06 16:37:02 +010035#include <sys/stat.h>
36
telsoa014fcda012018-03-09 14:13:49 +000037namespace armnn
38{
39
David Beck79141b92018-10-23 16:09:36 +010040namespace
41{
42static const BackendId s_Id{ClBackendId()};
43}
44
telsoa01c577f2c2018-08-31 09:22:23 +010045bool ClWorkloadFactory::IsLayerSupported(const Layer& layer,
David Beck29c75de2018-10-23 13:35:58 +010046 Optional<DataType> dataType,
telsoa01c577f2c2018-08-31 09:22:23 +010047 std::string& outReasonIfUnsupported)
telsoa014fcda012018-03-09 14:13:49 +000048{
David Beck79141b92018-10-23 16:09:36 +010049 return IWorkloadFactory::IsLayerSupported(s_Id, layer, dataType, outReasonIfUnsupported);
50}
51
Sadik Armagan04a72972020-09-14 15:44:18 +010052bool ClWorkloadFactory::IsLayerSupported(const IConnectableLayer& layer,
53 Optional<DataType> dataType,
54 std::string& outReasonIfUnsupported,
55 const ModelOptions& modelOptions)
56{
57 return IWorkloadFactory::IsLayerSupported(s_Id, layer, dataType, outReasonIfUnsupported, modelOptions);
58}
59
David Beck79141b92018-10-23 16:09:36 +010060const BackendId& ClWorkloadFactory::GetBackendId() const
61{
62 return s_Id;
telsoa014fcda012018-03-09 14:13:49 +000063}
64
Sadik Armagandea8fb62020-11-26 10:38:11 +000065void ClWorkloadFactory::AfterWorkloadsCreated()
66{
67 if(m_ModelContextPtr)
68 {
69 auto modelOptions = dynamic_cast<ClBackendModelContext*>(m_ModelContextPtr.get());
70 if (modelOptions->SaveCachedNetwork())
71 {
Sadik Armaganb7851f92021-10-06 16:37:02 +010072 ClContextSerializer serializer;
73 serializer.Serialize(m_CLCompileContext);
74 auto cachedFd = modelOptions->GetCachedFileDescriptor();
75 if (cachedFd != -1)
76 {
77 std::vector<uint8_t> compiledContextData;
78 std::stringstream stream;
79 bool serialized = serializer.SaveSerializedToStream(stream);
80 if (serialized)
81 {
82 std::string const serializedString{stream.str()};
83 std::copy(serializedString.begin(),
84 serializedString.end(),
85 std::back_inserter(compiledContextData));
86 write(cachedFd, compiledContextData.data(), compiledContextData.size());
87 }
88 }
89
Sadik Armagandea8fb62020-11-26 10:38:11 +000090 // Save map to a filepath provided in ModelOptions
91 auto filePath = modelOptions->GetCachedNetworkFilePath();
92 if (filePath != "" && fs::exists(filePath) && fs::is_regular_file(filePath))
93 {
Matthew Sloyan80fbcd52021-01-07 13:28:47 +000094 // Serialize ClContext to the file specified
Matthew Sloyan80fbcd52021-01-07 13:28:47 +000095 std::ofstream file(filePath, std::ios::out | std::ios::binary);
96 serializer.SaveSerializedToStream(file);
Sadik Armagandea8fb62020-11-26 10:38:11 +000097 }
98 }
99 }
100}
101
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +0100102template <typename FloatWorkload, typename Uint8Workload, typename QueueDescriptorType, typename... Args>
103std::unique_ptr<IWorkload> ClWorkloadFactory::MakeWorkload(const QueueDescriptorType& descriptor,
104 const WorkloadInfo& info,
105 Args&&... args)
106{
107 try
108 {
109 return MakeWorkloadHelper<FloatWorkload, Uint8Workload>(descriptor, info, std::forward<Args>(args)...);
110 }
111 catch (const cl::Error& clError)
112 {
113 throw WrapClError(clError, CHECK_LOCATION());
114 }
115}
116
117template <typename Workload, typename QueueDescriptorType, typename... Args>
118std::unique_ptr<IWorkload> ClWorkloadFactory::MakeWorkload(const QueueDescriptorType& descriptor,
119 const WorkloadInfo& info,
120 Args&&... args)
121{
122 try
123 {
124 return std::make_unique<Workload>(descriptor, info, std::forward<Args>(args)...);
125 }
126 catch (const cl::Error& clError)
127 {
128 throw WrapClError(clError, CHECK_LOCATION());
129 }
130}
131
Sadik Armagandea8fb62020-11-26 10:38:11 +0000132void ClWorkloadFactory::InitializeCLCompileContext()
133{
134 // Initialize our m_CLCompileContext using default device and context
Sadik Armagane9444752020-12-02 11:28:58 +0000135 auto context = arm_compute::CLKernelLibrary::get().context();
136 auto device = arm_compute::CLKernelLibrary::get().get_device();
Sadik Armagandea8fb62020-11-26 10:38:11 +0000137 m_CLCompileContext = arm_compute::CLCompileContext(context, device);
138
139 if (m_ModelContextPtr)
140 {
141 // Load saved programs if the user has set a filepath
142 auto modelOptions = dynamic_cast<ClBackendModelContext*>(m_ModelContextPtr.get());
143 auto filePath = modelOptions->GetCachedNetworkFilePath();
Sadik Armaganb7851f92021-10-06 16:37:02 +0100144 if (!(modelOptions->SaveCachedNetwork()))
Sadik Armagandea8fb62020-11-26 10:38:11 +0000145 {
Matthew Sloyan80fbcd52021-01-07 13:28:47 +0000146 ClContextDeserializer deserializer;
Sadik Armaganb7851f92021-10-06 16:37:02 +0100147 auto cachedFd = modelOptions->GetCachedFileDescriptor();
148 if (cachedFd != -1)
149 {
150 struct stat statBuffer;
151 if (fstat(cachedFd, &statBuffer) == 0)
152 {
153 long dataSize = static_cast<long>(statBuffer.st_size);
154 if( dataSize > 0)
155 {
156 auto offset = lseek(cachedFd, 0, SEEK_CUR);
157 if (offset == 0)
158 {
159 std::vector <uint8_t> compiledContextData(static_cast<unsigned int>(dataSize));
160 pread(cachedFd, compiledContextData.data(), compiledContextData.size(), 0);
161 deserializer.DeserializeFromBinary(m_CLCompileContext,
162 context,
163 device,
164 compiledContextData);
165 }
166 }
167
168 }
169 }
170
171 if (filePath != "" && fs::exists(filePath) && fs::is_regular_file(filePath))
172 {
173 // Deserialize binary file and load into m_CLCompileContext
174 deserializer.Deserialize(m_CLCompileContext, context, device, filePath);
175 }
Sadik Armagandea8fb62020-11-26 10:38:11 +0000176 }
177 }
178}
179
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000180ClWorkloadFactory::ClWorkloadFactory(const std::shared_ptr<ClMemoryManager>& memoryManager)
Sadik Armagan04a72972020-09-14 15:44:18 +0100181 : m_MemoryManager(memoryManager), m_ModelContextPtr(IBackendInternal::IBackendSpecificModelContextPtr{})
182{
Sadik Armagandea8fb62020-11-26 10:38:11 +0000183 InitializeCLCompileContext();
Sadik Armagan04a72972020-09-14 15:44:18 +0100184}
185
186ClWorkloadFactory::ClWorkloadFactory(const std::shared_ptr<ClMemoryManager>& memoryManager,
187 const IBackendInternal::IBackendSpecificModelContextPtr& modelContextPtr)
188 : m_MemoryManager(memoryManager), m_ModelContextPtr(modelContextPtr)
telsoa014fcda012018-03-09 14:13:49 +0000189{
Sadik Armagandea8fb62020-11-26 10:38:11 +0000190 InitializeCLCompileContext();
telsoa014fcda012018-03-09 14:13:49 +0000191}
192
David Monahan3fb7e102019-08-20 11:25:29 +0100193std::unique_ptr<ITensorHandle> ClWorkloadFactory::CreateTensorHandle(const TensorInfo& tensorInfo,
194 const bool IsMemoryManaged) const
telsoa014fcda012018-03-09 14:13:49 +0000195{
Jan Eilers8eb25602020-03-09 12:13:48 +0000196 IgnoreUnused(IsMemoryManaged);
telsoa01c577f2c2018-08-31 09:22:23 +0100197 std::unique_ptr<ClTensorHandle> tensorHandle = std::make_unique<ClTensorHandle>(tensorInfo);
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000198 tensorHandle->SetMemoryGroup(m_MemoryManager->GetInterLayerMemoryGroup());
telsoa01c577f2c2018-08-31 09:22:23 +0100199
200 return tensorHandle;
telsoa014fcda012018-03-09 14:13:49 +0000201}
202
Francis Murtagh351d13d2018-09-24 15:01:18 +0100203std::unique_ptr<ITensorHandle> ClWorkloadFactory::CreateTensorHandle(const TensorInfo& tensorInfo,
David Monahan3fb7e102019-08-20 11:25:29 +0100204 DataLayout dataLayout,
205 const bool IsMemoryManaged) const
Francis Murtagh351d13d2018-09-24 15:01:18 +0100206{
Jan Eilers8eb25602020-03-09 12:13:48 +0000207 IgnoreUnused(IsMemoryManaged);
Francis Murtagh351d13d2018-09-24 15:01:18 +0100208 std::unique_ptr<ClTensorHandle> tensorHandle = std::make_unique<ClTensorHandle>(tensorInfo, dataLayout);
Aron Virginas-Tar56055192018-11-12 18:10:43 +0000209 tensorHandle->SetMemoryGroup(m_MemoryManager->GetInterLayerMemoryGroup());
Francis Murtagh351d13d2018-09-24 15:01:18 +0100210
211 return tensorHandle;
212}
213
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100214std::unique_ptr<ITensorHandle> ClWorkloadFactory::CreateSubTensorHandle(ITensorHandle& parent,
215 TensorShape const& subTensorShape,
telsoa014fcda012018-03-09 14:13:49 +0000216 unsigned int const* subTensorOrigin) const
217{
telsoa014fcda012018-03-09 14:13:49 +0000218 arm_compute::Coordinates coords;
219 arm_compute::TensorShape shape = armcomputetensorutils::BuildArmComputeTensorShape(subTensorShape);
220
221 coords.set_num_dimensions(subTensorShape.GetNumDimensions());
222 for (unsigned int i = 0; i < subTensorShape.GetNumDimensions(); i++)
223 {
telsoa01c577f2c2018-08-31 09:22:23 +0100224 // Arm compute indexes tensor coords in reverse order.
telsoa014fcda012018-03-09 14:13:49 +0000225 unsigned int revertedIndex = subTensorShape.GetNumDimensions() - i - 1;
Matthew Sloyan171214c2020-09-09 09:07:37 +0100226 coords.set(i, armnn::numeric_cast<int>(subTensorOrigin[revertedIndex]));
telsoa014fcda012018-03-09 14:13:49 +0000227 }
228
Derek Lamberti0790dce2019-04-15 18:37:35 +0100229 const arm_compute::TensorShape parentShape = armcomputetensorutils::BuildArmComputeTensorShape(parent.GetShape());
230 if (!::arm_compute::error_on_invalid_subtensor(__func__, __FILE__, __LINE__, parentShape, coords, shape))
231 {
232 return nullptr;
233 }
234
telsoa01c577f2c2018-08-31 09:22:23 +0100235 return std::make_unique<ClSubTensorHandle>(
Jan Eilersbb446e52020-04-02 13:56:54 +0100236 PolymorphicDowncast<IClTensorHandle*>(&parent), shape, coords);
telsoa014fcda012018-03-09 14:13:49 +0000237}
238
telsoa014fcda012018-03-09 14:13:49 +0000239std::unique_ptr<IWorkload> ClWorkloadFactory::CreateActivation(const ActivationQueueDescriptor& descriptor,
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100240 const WorkloadInfo& info) const
telsoa014fcda012018-03-09 14:13:49 +0000241{
Sadik Armagane9444752020-12-02 11:28:58 +0000242 return MakeWorkload<ClActivationWorkload>(descriptor, info, m_CLCompileContext);
telsoa014fcda012018-03-09 14:13:49 +0000243}
244
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100245std::unique_ptr<IWorkload> ClWorkloadFactory::CreateAddition(const AdditionQueueDescriptor& descriptor,
246 const WorkloadInfo& info) const
telsoa014fcda012018-03-09 14:13:49 +0000247{
Sadik Armagane9444752020-12-02 11:28:58 +0000248 return MakeWorkload<ClAdditionWorkload>(descriptor, info, m_CLCompileContext);
telsoa014fcda012018-03-09 14:13:49 +0000249}
250
James Conroy2dc05722019-09-19 17:00:31 +0100251std::unique_ptr<IWorkload> ClWorkloadFactory::CreateArgMinMax(const ArgMinMaxQueueDescriptor& descriptor,
252 const WorkloadInfo& info) const
253{
Sadik Armagane9444752020-12-02 11:28:58 +0000254 return std::make_unique<ClArgMinMaxWorkload>(descriptor, info, m_CLCompileContext);
James Conroy2dc05722019-09-19 17:00:31 +0100255}
256
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100257std::unique_ptr<IWorkload> ClWorkloadFactory::CreateBatchNormalization(
258 const BatchNormalizationQueueDescriptor& descriptor,
259 const WorkloadInfo& info) const
telsoa014fcda012018-03-09 14:13:49 +0000260{
Sadik Armagane9444752020-12-02 11:28:58 +0000261 return MakeWorkload<ClBatchNormalizationFloatWorkload, NullWorkload>(descriptor, info, m_CLCompileContext);
telsoa014fcda012018-03-09 14:13:49 +0000262}
263
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100264std::unique_ptr<IWorkload> ClWorkloadFactory::CreateBatchToSpaceNd(const BatchToSpaceNdQueueDescriptor& descriptor,
telsoa014fcda012018-03-09 14:13:49 +0000265 const WorkloadInfo& info) const
266{
Sadik Armagane9444752020-12-02 11:28:58 +0000267 return MakeWorkload<ClBatchToSpaceNdWorkload>(descriptor, info, m_CLCompileContext);
telsoa014fcda012018-03-09 14:13:49 +0000268}
269
Sadik Armaganf40d6d42021-04-22 09:12:11 +0100270std::unique_ptr<IWorkload> ClWorkloadFactory::CreateCast(const CastQueueDescriptor& descriptor,
271 const WorkloadInfo& info) const
272{
273 return MakeWorkload<ClCastWorkload>(descriptor, info, m_CLCompileContext);
274}
275
Teresa Charlin1222dbd2021-09-02 13:58:52 +0100276std::unique_ptr<IWorkload> ClWorkloadFactory::CreateChannelShuffle(const ChannelShuffleQueueDescriptor& descriptor,
277 const WorkloadInfo& info) const
278{
279 return MakeWorkload<ClChannelShuffleWorkload>(descriptor, info, m_CLCompileContext);
280}
281
Aron Virginas-Tar77bfb5e2019-10-16 17:45:38 +0100282std::unique_ptr<IWorkload> ClWorkloadFactory::CreateComparison(const ComparisonQueueDescriptor& descriptor,
283 const WorkloadInfo& info) const
284{
Sadik Armagane9444752020-12-02 11:28:58 +0000285 return MakeWorkload<ClComparisonWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar77bfb5e2019-10-16 17:45:38 +0100286}
287
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100288std::unique_ptr<IWorkload> ClWorkloadFactory::CreateConcat(const ConcatQueueDescriptor& descriptor,
289 const WorkloadInfo& info) const
Jim Flynn4ed6c832019-05-20 11:02:46 +0100290{
Sadik Armagane9444752020-12-02 11:28:58 +0000291 return MakeWorkload<ClConcatWorkload>(descriptor, info, m_CLCompileContext);
Jim Flynn4ed6c832019-05-20 11:02:46 +0100292}
293
telsoa014fcda012018-03-09 14:13:49 +0000294std::unique_ptr<IWorkload> ClWorkloadFactory::CreateConstant(const ConstantQueueDescriptor& descriptor,
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100295 const WorkloadInfo& info) const
telsoa014fcda012018-03-09 14:13:49 +0000296{
Sadik Armagane9444752020-12-02 11:28:58 +0000297 return MakeWorkload<ClConstantWorkload>(descriptor, info, m_CLCompileContext);
telsoa014fcda012018-03-09 14:13:49 +0000298}
299
telsoa01c577f2c2018-08-31 09:22:23 +0100300std::unique_ptr<IWorkload> ClWorkloadFactory::CreateConvertFp16ToFp32(
301 const ConvertFp16ToFp32QueueDescriptor& descriptor,
302 const WorkloadInfo& info) const
303{
Sadik Armagane9444752020-12-02 11:28:58 +0000304 return MakeWorkload<ClConvertFp16ToFp32Workload>(descriptor, info, m_CLCompileContext);
telsoa01c577f2c2018-08-31 09:22:23 +0100305}
306
307std::unique_ptr<IWorkload> ClWorkloadFactory::CreateConvertFp32ToFp16(
308 const ConvertFp32ToFp16QueueDescriptor& descriptor,
309 const WorkloadInfo& info) const
310{
Sadik Armagane9444752020-12-02 11:28:58 +0000311 return MakeWorkload<ClConvertFp32ToFp16Workload>(descriptor, info, m_CLCompileContext);
telsoa01c577f2c2018-08-31 09:22:23 +0100312}
313
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100314std::unique_ptr<IWorkload> ClWorkloadFactory::CreateConvolution2d(const Convolution2dQueueDescriptor& descriptor,
315 const WorkloadInfo& info) const
316{
Sadik Armagan04a72972020-09-14 15:44:18 +0100317 bool isFastMathEnabled = false;
318 if (m_ModelContextPtr)
319 {
320 if (m_ModelContextPtr.get() != nullptr)
321 {
322 auto modelOptions = dynamic_cast<ClBackendModelContext*>(m_ModelContextPtr.get());
323 if (modelOptions)
324 {
325 isFastMathEnabled = modelOptions->IsFastMathEnabled();
326 }
327 }
328 }
329 return MakeWorkload<ClConvolution2dWorkload>(descriptor,
330 info,
331 m_MemoryManager->GetIntraLayerManager(),
Sadik Armagane9444752020-12-02 11:28:58 +0000332 m_CLCompileContext,
Sadik Armagan04a72972020-09-14 15:44:18 +0100333 isFastMathEnabled);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100334}
335
Teresa Charlin615ad6c2021-10-26 12:22:20 +0100336std::unique_ptr<IWorkload> ClWorkloadFactory::CreateConvolution3d(const Convolution3dQueueDescriptor& descriptor,
337 const WorkloadInfo& info) const
338{
339 bool isFastMathEnabled = false;
340 if (m_ModelContextPtr)
341 {
342 if (m_ModelContextPtr.get() != nullptr)
343 {
344 auto modelOptions = dynamic_cast<ClBackendModelContext*>(m_ModelContextPtr.get());
345 if (modelOptions)
346 {
347 isFastMathEnabled = modelOptions->IsFastMathEnabled();
348 }
349 }
350 }
351 return MakeWorkload<ClConvolution3dWorkload>(descriptor,
352 info,
353 m_MemoryManager->GetIntraLayerManager(),
354 m_CLCompileContext,
355 isFastMathEnabled);
356}
357
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100358std::unique_ptr<IWorkload> ClWorkloadFactory::CreateDebug(const DebugQueueDescriptor& descriptor,
359 const WorkloadInfo& info) const
360{
Sadik Armagane9444752020-12-02 11:28:58 +0000361 return MakeWorkload<NullWorkload, NullWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100362}
363
364std::unique_ptr<IWorkload> ClWorkloadFactory::CreateDepthToSpace(const DepthToSpaceQueueDescriptor& descriptor,
365 const WorkloadInfo& info) const
366{
Sadik Armagane9444752020-12-02 11:28:58 +0000367 return MakeWorkload<ClDepthToSpaceWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100368}
369
370std::unique_ptr<IWorkload> ClWorkloadFactory::CreateDepthwiseConvolution2d(
371 const DepthwiseConvolution2dQueueDescriptor& descriptor,
372 const WorkloadInfo& info) const
373{
Sadik Armagane9444752020-12-02 11:28:58 +0000374 return MakeWorkload<ClDepthwiseConvolutionWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100375}
376
377std::unique_ptr<IWorkload> ClWorkloadFactory::CreateDequantize(const DequantizeQueueDescriptor& descriptor,
378 const WorkloadInfo& info) const
379{
Sadik Armagane9444752020-12-02 11:28:58 +0000380 return MakeWorkload<ClDequantizeWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100381}
382
383std::unique_ptr<IWorkload> ClWorkloadFactory::CreateDetectionPostProcess(
384 const DetectionPostProcessQueueDescriptor& descriptor,
385 const WorkloadInfo& info) const
386{
Sadik Armagane9444752020-12-02 11:28:58 +0000387 return MakeWorkload<NullWorkload, NullWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100388}
389
390std::unique_ptr<IWorkload> ClWorkloadFactory::CreateDivision(const DivisionQueueDescriptor& descriptor,
391 const WorkloadInfo& info) const
392{
Teresa Charline11e63d2021-04-21 12:56:45 +0100393 return std::make_unique<ClDivisionWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100394}
395
josh minor4a3c6102020-01-06 16:40:46 -0600396std::unique_ptr<IWorkload> ClWorkloadFactory::CreateElementwiseUnary(const ElementwiseUnaryQueueDescriptor& descriptor,
397 const WorkloadInfo& info) const
398{
Sadik Armagan9fabf432020-05-27 13:40:58 +0100399 switch(descriptor.m_Parameters.m_Operation)
josh minor4a3c6102020-01-06 16:40:46 -0600400 {
Sadik Armagan9fabf432020-05-27 13:40:58 +0100401 case UnaryOperation::Abs:
James Conroyfe3ec942020-11-18 14:20:53 +0000402 {
403 AbsQueueDescriptor absQueueDescriptor;
404 absQueueDescriptor.m_Inputs = descriptor.m_Inputs;
405 absQueueDescriptor.m_Outputs = descriptor.m_Outputs;
josh minor4a3c6102020-01-06 16:40:46 -0600406
Sadik Armagane9444752020-12-02 11:28:58 +0000407 return std::make_unique<ClAbsWorkload>(absQueueDescriptor, info, m_CLCompileContext);
James Conroyfe3ec942020-11-18 14:20:53 +0000408 }
Sadik Armagan9fabf432020-05-27 13:40:58 +0100409 case UnaryOperation::Exp:
Sadik Armagane9444752020-12-02 11:28:58 +0000410 return std::make_unique<ClExpWorkload>(descriptor, info, m_CLCompileContext);
Teresa Charlin50de4fa2021-05-31 18:47:33 +0100411 case UnaryOperation::Log:
412 return std::make_unique<ClLogWorkload>(descriptor, info, m_CLCompileContext);
413 case UnaryOperation::LogicalNot:
414 return std::make_unique<ClLogicalNotWorkload>(descriptor, info, m_CLCompileContext);
Sadik Armagan9fabf432020-05-27 13:40:58 +0100415 case UnaryOperation::Neg:
Sadik Armagane9444752020-12-02 11:28:58 +0000416 return std::make_unique<ClNegWorkload>(descriptor, info, m_CLCompileContext);
Sadik Armagan9fabf432020-05-27 13:40:58 +0100417 case UnaryOperation::Rsqrt:
James Conroyfe3ec942020-11-18 14:20:53 +0000418 {
419 RsqrtQueueDescriptor rsqrtQueueDescriptor;
420 rsqrtQueueDescriptor.m_Inputs = descriptor.m_Inputs;
421 rsqrtQueueDescriptor.m_Outputs = descriptor.m_Outputs;
josh minor4a3c6102020-01-06 16:40:46 -0600422
Sadik Armagane9444752020-12-02 11:28:58 +0000423 return std::make_unique<ClRsqrtWorkload>(rsqrtQueueDescriptor, info, m_CLCompileContext);
James Conroyfe3ec942020-11-18 14:20:53 +0000424 }
Teresa Charlin50de4fa2021-05-31 18:47:33 +0100425 case UnaryOperation::Sin:
426 return std::make_unique<ClSinWorkload>(descriptor, info, m_CLCompileContext);
Sadik Armagan9fabf432020-05-27 13:40:58 +0100427 default:
428 return nullptr;
josh minor4a3c6102020-01-06 16:40:46 -0600429 }
josh minor4a3c6102020-01-06 16:40:46 -0600430}
431
Sadik Armagan66aecb02020-06-24 11:42:20 +0100432std::unique_ptr<IWorkload> ClWorkloadFactory::CreateFill(const FillQueueDescriptor& descriptor,
433 const WorkloadInfo& info) const
434{
Sadik Armagane9444752020-12-02 11:28:58 +0000435 return std::make_unique<ClFillWorkload>(descriptor, info, m_CLCompileContext);
Sadik Armagan66aecb02020-06-24 11:42:20 +0100436}
437
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100438std::unique_ptr<IWorkload> ClWorkloadFactory::CreateFloor(const FloorQueueDescriptor& descriptor,
439 const WorkloadInfo& info) const
440{
Sadik Armagane9444752020-12-02 11:28:58 +0000441 return MakeWorkload<ClFloorFloatWorkload, NullWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100442}
443
444std::unique_ptr<IWorkload> ClWorkloadFactory::CreateFullyConnected(const FullyConnectedQueueDescriptor& descriptor,
445 const WorkloadInfo& info) const
446{
Sadik Armagane9444752020-12-02 11:28:58 +0000447 return MakeWorkload<ClFullyConnectedWorkload>(descriptor,
448 info,
449 m_MemoryManager->GetIntraLayerManager(),
450 m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100451}
452
453std::unique_ptr<IWorkload> ClWorkloadFactory::CreateGather(const GatherQueueDescriptor& descriptor,
454 const WorkloadInfo& info) const
455{
Sadik Armagane9444752020-12-02 11:28:58 +0000456 return MakeWorkload<ClGatherWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100457}
458
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100459std::unique_ptr<IWorkload> ClWorkloadFactory::CreateInput(const InputQueueDescriptor& descriptor,
460 const WorkloadInfo& info) const
461{
462 return std::make_unique<CopyMemGenericWorkload>(descriptor, info);
463}
464
465std::unique_ptr<IWorkload> ClWorkloadFactory::CreateInstanceNormalization(
466 const InstanceNormalizationQueueDescriptor& descriptor,
467 const WorkloadInfo& info) const
468{
Sadik Armagane9444752020-12-02 11:28:58 +0000469 return MakeWorkload<ClInstanceNormalizationWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100470}
471
472std::unique_ptr<IWorkload> ClWorkloadFactory::CreateL2Normalization(const L2NormalizationQueueDescriptor& descriptor,
473 const WorkloadInfo& info) const
474{
Sadik Armagane9444752020-12-02 11:28:58 +0000475 return MakeWorkload<ClL2NormalizationFloatWorkload, NullWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100476}
477
James Conroyfe3ec942020-11-18 14:20:53 +0000478std::unique_ptr<IWorkload> ClWorkloadFactory::CreateLogicalBinary(const LogicalBinaryQueueDescriptor& descriptor,
479 const WorkloadInfo& info) const
480{
481 switch(descriptor.m_Parameters.m_Operation)
482 {
483 case LogicalBinaryOperation::LogicalAnd:
Sadik Armagane9444752020-12-02 11:28:58 +0000484 return std::make_unique<ClLogicalAndWorkload>(descriptor, info, m_CLCompileContext);
James Conroyfe3ec942020-11-18 14:20:53 +0000485 case LogicalBinaryOperation::LogicalOr:
Sadik Armagane9444752020-12-02 11:28:58 +0000486 return std::make_unique<ClLogicalOrWorkload>(descriptor, info, m_CLCompileContext);
James Conroyfe3ec942020-11-18 14:20:53 +0000487 default:
488 return nullptr;
489 }
490}
491
Teresa Charlin8398edc2020-07-20 14:23:02 +0100492std::unique_ptr<IWorkload> ClWorkloadFactory::CreateLogSoftmax(const LogSoftmaxQueueDescriptor& descriptor,
493 const WorkloadInfo& info) const
494{
Sadik Armagane9444752020-12-02 11:28:58 +0000495 return MakeWorkload<ClLogSoftmaxWorkload>(descriptor,
496 info,
497 m_MemoryManager->GetIntraLayerManager(),
498 m_CLCompileContext);
Teresa Charlin8398edc2020-07-20 14:23:02 +0100499}
500
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100501std::unique_ptr<IWorkload> ClWorkloadFactory::CreateLstm(const LstmQueueDescriptor& descriptor,
502 const WorkloadInfo& info) const
503{
Sadik Armagane9444752020-12-02 11:28:58 +0000504 return MakeWorkload<ClLstmFloatWorkload, NullWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100505}
506
Nattapat Chaimanowong5a4304a2018-11-28 10:44:37 +0000507std::unique_ptr<IWorkload> ClWorkloadFactory::CreateMaximum(const MaximumQueueDescriptor& descriptor,
508 const WorkloadInfo& info) const
509{
Sadik Armagane9444752020-12-02 11:28:58 +0000510 return MakeWorkload<ClMaximumWorkload>(descriptor, info, m_CLCompileContext);
Nattapat Chaimanowong5a4304a2018-11-28 10:44:37 +0000511}
512
narpra01a6bf9122018-09-10 09:50:09 +0100513std::unique_ptr<IWorkload> ClWorkloadFactory::CreateMean(const MeanQueueDescriptor& descriptor,
514 const WorkloadInfo& info) const
515{
Sadik Armagane9444752020-12-02 11:28:58 +0000516 return MakeWorkload<ClMeanWorkload>(descriptor, info, m_CLCompileContext);
narpra01a6bf9122018-09-10 09:50:09 +0100517}
518
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100519std::unique_ptr<IWorkload> ClWorkloadFactory::CreateMemCopy(const MemCopyQueueDescriptor& descriptor,
520 const WorkloadInfo& info) const
jimfly012c9322a2018-09-19 10:59:49 +0100521{
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100522 if (descriptor.m_Inputs.empty() || !descriptor.m_Inputs[0])
523 {
524 throw InvalidArgumentException("ClWorkloadFactory: Invalid null input for MemCopy workload");
525 }
526
527 return MakeWorkload<CopyMemGenericWorkload>(descriptor, info);
jimfly012c9322a2018-09-19 10:59:49 +0100528}
529
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100530std::unique_ptr<IWorkload> ClWorkloadFactory::CreateMemImport(const MemImportQueueDescriptor& descriptor,
531 const WorkloadInfo& info) const
FrancisMurtagh20995952018-12-17 12:11:36 +0000532{
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100533 if (descriptor.m_Inputs.empty() || !descriptor.m_Inputs[0])
534 {
535 throw InvalidArgumentException("ClWorkloadFactory: Invalid null input for MemImport workload");
536 }
537
538 return std::make_unique<ImportMemGenericWorkload>(descriptor, info);
FrancisMurtagh20995952018-12-17 12:11:36 +0000539}
540
kevmay0190539692018-11-29 08:40:19 +0000541std::unique_ptr<IWorkload> ClWorkloadFactory::CreateMinimum(const MinimumQueueDescriptor& descriptor,
542 const WorkloadInfo& info) const
543{
Sadik Armagane9444752020-12-02 11:28:58 +0000544 return MakeWorkload<ClMinimumWorkload>(descriptor, info, m_CLCompileContext);
kevmay0190539692018-11-29 08:40:19 +0000545}
546
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100547std::unique_ptr<IWorkload> ClWorkloadFactory::CreateMultiplication(const MultiplicationQueueDescriptor& descriptor,
548 const WorkloadInfo& info) const
549{
Sadik Armagane9444752020-12-02 11:28:58 +0000550 return MakeWorkload<ClMultiplicationWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100551}
552
553std::unique_ptr<IWorkload> ClWorkloadFactory::CreateNormalization(const NormalizationQueueDescriptor& descriptor,
554 const WorkloadInfo& info) const
555{
Sadik Armagane9444752020-12-02 11:28:58 +0000556 return MakeWorkload<ClNormalizationFloatWorkload, NullWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100557}
558
559std::unique_ptr<IWorkload> ClWorkloadFactory::CreateOutput(const OutputQueueDescriptor& descriptor,
560 const WorkloadInfo& info) const
561{
562 return std::make_unique<CopyMemGenericWorkload>(descriptor, info);
563}
564
565std::unique_ptr<IWorkload> ClWorkloadFactory::CreatePad(const PadQueueDescriptor& descriptor,
566 const WorkloadInfo& info) const
567{
Sadik Armagane9444752020-12-02 11:28:58 +0000568 return MakeWorkload<ClPadWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100569}
570
571std::unique_ptr<IWorkload> ClWorkloadFactory::CreatePermute(const PermuteQueueDescriptor& descriptor,
Matteo Martincigh59a950c2018-12-13 12:48:25 +0000572 const WorkloadInfo& info) const
573{
Sadik Armagane9444752020-12-02 11:28:58 +0000574 return MakeWorkload<ClPermuteWorkload>(descriptor, info, m_CLCompileContext);
Matteo Martincigh59a950c2018-12-13 12:48:25 +0000575}
576
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100577std::unique_ptr<IWorkload> ClWorkloadFactory::CreatePooling2d(const Pooling2dQueueDescriptor& descriptor,
578 const WorkloadInfo& info) const
Nattapat Chaimanowonga9a1cf12018-12-03 16:06:49 +0000579{
Sadik Armagane9444752020-12-02 11:28:58 +0000580 return MakeWorkload<ClPooling2dWorkload>(descriptor, info, m_CLCompileContext);
Mohamed Nour Abouelseouda1d3c6a2018-12-27 12:39:16 +0000581}
582
Matteo Martincigh49124022019-01-11 13:25:59 +0000583std::unique_ptr<IWorkload> ClWorkloadFactory::CreatePreCompiled(const PreCompiledQueueDescriptor& descriptor,
584 const WorkloadInfo& info) const
585{
Sadik Armagane9444752020-12-02 11:28:58 +0000586 return MakeWorkload<NullWorkload, NullWorkload>(descriptor, info, m_CLCompileContext);
Matteo Martincigh49124022019-01-11 13:25:59 +0000587}
588
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100589std::unique_ptr<IWorkload> ClWorkloadFactory::CreatePrelu(const PreluQueueDescriptor &descriptor,
590 const WorkloadInfo &info) const
narpra01b89b05f2019-01-16 09:53:09 +0000591{
Sadik Armagane9444752020-12-02 11:28:58 +0000592 return MakeWorkload<ClPreluWorkload>(descriptor, info, m_CLCompileContext);
narpra01b89b05f2019-01-16 09:53:09 +0000593}
594
Ryan OShea2323af42020-05-13 16:36:19 +0100595std::unique_ptr<IWorkload> ClWorkloadFactory::CreateQLstm(const QLstmQueueDescriptor& descriptor,
596 const WorkloadInfo& info) const
597{
Sadik Armagane9444752020-12-02 11:28:58 +0000598 return std::make_unique<ClQLstmWorkload>(descriptor, info, m_CLCompileContext);
Ryan OShea2323af42020-05-13 16:36:19 +0100599}
600
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100601std::unique_ptr<IWorkload> ClWorkloadFactory::CreateQuantize(const QuantizeQueueDescriptor& descriptor,
602 const WorkloadInfo& info) const
Aron Virginas-Tar7a3e2fe2019-06-27 18:54:47 +0100603{
Sadik Armagane9444752020-12-02 11:28:58 +0000604 return MakeWorkload<ClQuantizeWorkload>(descriptor, info, m_CLCompileContext);
James Conroyd2aa85e2019-07-01 17:12:40 +0100605}
606
Ferran Balaguer737d9ff2019-08-01 09:58:08 +0100607std::unique_ptr<IWorkload> ClWorkloadFactory::CreateQuantizedLstm(const QuantizedLstmQueueDescriptor& descriptor,
608 const WorkloadInfo& info) const
609{
Sadik Armagane9444752020-12-02 11:28:58 +0000610 return MakeWorkload<ClQuantizedLstmWorkload>(descriptor, info, m_CLCompileContext);
Ferran Balaguer737d9ff2019-08-01 09:58:08 +0100611}
612
David Monahanc11ba462020-12-03 11:09:46 +0000613std::unique_ptr<IWorkload> ClWorkloadFactory::CreateRank(const RankQueueDescriptor& descriptor,
614 const WorkloadInfo& info) const
615{
616 return std::make_unique<ClRankWorkload>(descriptor, info);
617}
618
Sadik Armagana2747482021-02-09 10:28:54 +0000619std::unique_ptr<IWorkload> ClWorkloadFactory::CreateReduce(const ReduceQueueDescriptor& descriptor,
620 const WorkloadInfo& info) const
621{
622 return std::make_unique<ClReduceWorkload>(descriptor, info);
623}
624
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100625std::unique_ptr<IWorkload> ClWorkloadFactory::CreateReshape(const ReshapeQueueDescriptor& descriptor,
626 const WorkloadInfo& info) const
627{
Sadik Armagane9444752020-12-02 11:28:58 +0000628 return MakeWorkload<ClReshapeWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100629}
630
631std::unique_ptr<IWorkload> ClWorkloadFactory::CreateResize(const ResizeQueueDescriptor& descriptor,
632 const WorkloadInfo& info) const
633{
Sadik Armagane9444752020-12-02 11:28:58 +0000634 return MakeWorkload<ClResizeWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100635}
636
Aron Virginas-Tar94c4fef2019-11-25 15:37:08 +0000637std::unique_ptr<IWorkload> ClWorkloadFactory::CreateSlice(const SliceQueueDescriptor& descriptor,
638 const WorkloadInfo& info) const
639{
Sadik Armagane9444752020-12-02 11:28:58 +0000640 return MakeWorkload<ClSliceWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar94c4fef2019-11-25 15:37:08 +0000641}
642
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100643std::unique_ptr<IWorkload> ClWorkloadFactory::CreateSoftmax(const SoftmaxQueueDescriptor& descriptor,
644 const WorkloadInfo& info) const
645{
Sadik Armagane9444752020-12-02 11:28:58 +0000646 return std::make_unique<ClSoftmaxWorkload>(descriptor,
647 info,
648 m_MemoryManager->GetIntraLayerManager(),
649 m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100650}
651
652std::unique_ptr<IWorkload> ClWorkloadFactory::CreateSpaceToBatchNd(const SpaceToBatchNdQueueDescriptor& descriptor,
653 const WorkloadInfo& info) const
654{
Sadik Armagane9444752020-12-02 11:28:58 +0000655 return MakeWorkload<ClSpaceToBatchNdWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100656}
657
658std::unique_ptr<IWorkload> ClWorkloadFactory::CreateSpaceToDepth(const SpaceToDepthQueueDescriptor& descriptor,
659 const WorkloadInfo& info) const
660{
Sadik Armagane9444752020-12-02 11:28:58 +0000661 return MakeWorkload<ClSpaceToDepthWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100662}
663
664std::unique_ptr<IWorkload> ClWorkloadFactory::CreateSplitter(const SplitterQueueDescriptor& descriptor,
665 const WorkloadInfo& info) const
666{
Sadik Armagane9444752020-12-02 11:28:58 +0000667 return MakeWorkload<ClSplitterWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100668}
669
Matthew Jacksond5166102019-07-31 14:06:28 +0100670std::unique_ptr<IWorkload> ClWorkloadFactory::CreateStack(const StackQueueDescriptor& descriptor,
671 const WorkloadInfo& info) const
672{
Sadik Armagane9444752020-12-02 11:28:58 +0000673 return MakeWorkload<ClStackWorkload>(descriptor, info, m_CLCompileContext);
Matthew Jacksond5166102019-07-31 14:06:28 +0100674}
675
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100676std::unique_ptr<IWorkload> ClWorkloadFactory::CreateStridedSlice(const StridedSliceQueueDescriptor& descriptor,
Aron Virginas-Tarb2801962019-09-30 11:24:53 +0100677 const WorkloadInfo& info) const
678{
Sadik Armagane9444752020-12-02 11:28:58 +0000679 return MakeWorkload<ClStridedSliceWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100680}
681
682std::unique_ptr<IWorkload> ClWorkloadFactory::CreateSubtraction(const SubtractionQueueDescriptor& descriptor,
683 const WorkloadInfo& info) const
684{
Sadik Armagane9444752020-12-02 11:28:58 +0000685 return MakeWorkload<ClSubtractionWorkload>(descriptor, info, m_CLCompileContext);
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100686}
687
Mike Kellyc9ea45a2020-02-28 18:11:58 +0000688std::unique_ptr<IWorkload> ClWorkloadFactory::CreateTranspose(const TransposeQueueDescriptor& descriptor,
689 const WorkloadInfo& info) const
690{
Sadik Armagane9444752020-12-02 11:28:58 +0000691 return MakeWorkload<ClTransposeWorkload>(descriptor, info, m_CLCompileContext);
Mike Kellyc9ea45a2020-02-28 18:11:58 +0000692}
693
Aron Virginas-Tar8168f402019-10-04 13:10:16 +0100694std::unique_ptr<IWorkload> ClWorkloadFactory::CreateTransposeConvolution2d(
695 const TransposeConvolution2dQueueDescriptor& descriptor,
696 const WorkloadInfo& info) const
697{
Sadik Armagane9444752020-12-02 11:28:58 +0000698 return MakeWorkload<ClTransposeConvolution2dWorkload>(descriptor,
699 info,
700 m_MemoryManager->GetIntraLayerManager(),
701 m_CLCompileContext);
Aron Virginas-Tarb2801962019-09-30 11:24:53 +0100702}
703
telsoa014fcda012018-03-09 14:13:49 +0000704} // namespace armnn