blob: 0db97be62c3284a1c6a129905df2d775a70457d9 [file] [log] [blame]
//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//
5
6#include "NeonLayerSupport.hpp"
David Beck3e9e1152018-10-17 14:17:50 +01007#include "NeonBackendId.hpp"
telsoa014fcda012018-03-09 14:13:49 +00008
telsoa014fcda012018-03-09 14:13:49 +00009#include <armnn/Descriptors.hpp>
telsoa014fcda012018-03-09 14:13:49 +000010#include <armnn/Tensor.hpp>
Aron Virginas-Tarfc824312018-10-15 15:00:13 +010011#include <armnn/Types.hpp>
Matteo Martincighc601aa62019-10-29 15:03:22 +000012#include <armnn/BackendRegistry.hpp>
telsoa014fcda012018-03-09 14:13:49 +000013
Matteo Martincighc601aa62019-10-29 15:03:22 +000014#include <InternalTypes.hpp>
15#include <LayerSupportCommon.hpp>
David Beck3e9e1152018-10-17 14:17:50 +010016
telsoa014fcda012018-03-09 14:13:49 +000017#include <boost/core/ignore_unused.hpp>
18
Matteo Martincighd95e9062019-01-31 15:35:59 +000019#if defined(ARMCOMPUTENEON_ENABLED)
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +010020#include <aclCommon/ArmComputeUtils.hpp>
Aron Virginas-Tar710f6642019-11-27 14:48:32 +000021#include <aclCommon/ArmComputeTensorUtils.hpp>
Aron Virginas-Tar914e4db2019-09-09 13:36:45 +010022#include "workloads/NeonAbsWorkload.hpp"
Matthew Bentham955258d2018-12-10 10:48:52 +000023#include "workloads/NeonAdditionWorkload.hpp"
Nattapat Chaimanowongd4b70592018-10-12 11:21:49 +010024#include "workloads/NeonActivationWorkload.hpp"
James Conroyd47a0642019-09-17 14:22:06 +010025#include "workloads/NeonArgMinMaxWorkload.hpp"
Matthew Benthamc48ac8c2018-12-12 16:15:59 +000026#include "workloads/NeonBatchNormalizationWorkload.hpp"
Mike Kelly56858022020-01-27 12:14:47 +000027#include "workloads/NeonBatchToSpaceNdWorkload.hpp"
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +010028#include "workloads/NeonConvolution2dWorkload.hpp"
Aron Virginas-Tar2f00b742019-09-30 13:28:08 +010029#include "workloads/NeonDepthToSpaceWorkload.hpp"
Nattapat Chaimanowong77140882018-10-17 11:12:19 +010030#include "workloads/NeonDepthwiseConvolutionWorkload.hpp"
Narumol Prangnawarat01961a72019-05-30 16:47:12 +010031#include "workloads/NeonDequantizeWorkload.hpp"
Derek Lamberti6a5e5e82019-12-05 14:41:20 +000032#include "workloads/NeonDetectionPostProcessWorkload.hpp"
kevmay01eed85922019-01-28 08:37:25 +000033#include "workloads/NeonGreaterWorkload.hpp"
Sadik Armagan0d4863d2019-10-09 14:26:32 +010034#include "workloads/NeonInstanceNormalizationWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010035#include "workloads/NeonL2NormalizationFloatWorkload.hpp"
Jan Eilersad5293a2019-07-08 09:57:55 +010036#include "workloads/NeonLstmFloatWorkload.hpp"
Nattapat Chaimanowong4e6597a2018-12-20 14:14:06 +000037#include "workloads/NeonMaximumWorkload.hpp"
Matthew Benthamfd899962018-12-31 15:49:42 +000038#include "workloads/NeonMeanWorkload.hpp"
Jim Flynn39d487d2019-05-17 15:44:36 +010039#include "workloads/NeonConcatWorkload.hpp"
Conor Kennedy54b21692019-01-09 07:57:38 +000040#include "workloads/NeonMinimumWorkload.hpp"
Conor Kennedyb99480b2019-03-08 08:24:41 +000041#include "workloads/NeonMultiplicationWorkload.hpp"
Pablo Telloe61f0712020-01-23 10:37:17 +000042#include "workloads/NeonDivisionWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010043#include "workloads/NeonNormalizationFloatWorkload.hpp"
44#include "workloads/NeonFullyConnectedWorkload.hpp"
Éanna Ó Catháin12055742019-01-25 10:01:40 +000045#include "workloads/NeonPadWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010046#include "workloads/NeonPermuteWorkload.hpp"
Nattapat Chaimanowong5d2e7002018-10-12 16:03:56 +010047#include "workloads/NeonPooling2dWorkload.hpp"
Nikhil Raj9b461482019-07-03 15:58:31 +010048#include "workloads/NeonPreluWorkload.hpp"
Sadik Armaganfabc2892019-05-31 09:05:11 +010049#include "workloads/NeonQuantizeWorkload.hpp"
Francis Murtagh4fc3c482019-08-02 13:20:54 +010050#include "workloads/NeonQuantizedLstmWorkload.hpp"
Kevin Maya023c402019-12-12 17:28:05 +000051#include "workloads/NeonReshapeWorkload.hpp"
Ellen Norris-Thompson37e68682019-07-15 14:23:30 +010052#include "workloads/NeonResizeWorkload.hpp"
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +010053#include "workloads/NeonRsqrtWorkload.hpp"
josh minor036f02d2019-11-15 14:53:22 -060054#include "workloads/NeonSliceWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010055#include "workloads/NeonSoftmaxBaseWorkload.hpp"
Mike Kelly0be3a882020-01-24 11:27:50 +000056#include "workloads/NeonSpaceToBatchNdWorkload.hpp"
Ellen Norris-Thompson29794572019-06-26 16:40:36 +010057#include "workloads/NeonSpaceToDepthWorkload.hpp"
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +010058#include "workloads/NeonSplitterWorkload.hpp"
Matthew Jackson87f65ea2019-08-01 10:01:34 +010059#include "workloads/NeonStackWorkload.hpp"
FinnWilliamsArm1fa19192019-08-02 17:26:31 +010060#include "workloads/NeonStridedSliceWorkload.hpp"
Conor Kennedyb99480b2019-03-08 08:24:41 +000061#include "workloads/NeonSubtractionWorkload.hpp"
Sadik Armagan581742d2019-08-12 14:11:37 +010062#include "workloads/NeonTransposeConvolution2dWorkload.hpp"
telsoa014fcda012018-03-09 14:13:49 +000063#endif
64
65using namespace boost;
66
67namespace armnn
68{
telsoa014fcda012018-03-09 14:13:49 +000069
Aron Virginas-Tarfc824312018-10-15 15:00:13 +010070namespace
arovir017ff76c52018-10-09 09:40:58 +010071{
telsoa014fcda012018-03-09 14:13:49 +000072
Derek Lamberti901ea112019-12-10 22:07:09 +000073template< typename ... Args>
74bool IsNeonBackendSupported(Optional<std::string&> reasonIfUnsupported, Args... args)
telsoa014fcda012018-03-09 14:13:49 +000075{
Derek Lambertibaa177f2019-12-10 22:00:43 +000076 boost::ignore_unused(reasonIfUnsupported, (args)...);
Matteo Martincighd95e9062019-01-31 15:35:59 +000077#if defined(ARMCOMPUTENEON_ENABLED)
telsoa014fcda012018-03-09 14:13:49 +000078 return true;
79#else
Derek Lamberti0790dce2019-04-15 18:37:35 +010080 SetValueChecked(reasonIfUnsupported, "The armnn library has been built without NEON support");
telsoa014fcda012018-03-09 14:13:49 +000081 return false;
82#endif
83}
84
telsoa01c577f2c2018-08-31 09:22:23 +010085template<typename FloatFunc, typename Uint8Func, typename ... Params>
arovir01085f0a42018-10-08 14:48:19 +010086bool IsSupportedForDataTypeNeon(Optional<std::string&> reasonIfUnsupported,
telsoa014fcda012018-03-09 14:13:49 +000087 DataType dataType,
telsoa01c577f2c2018-08-31 09:22:23 +010088 FloatFunc floatFuncPtr,
telsoa014fcda012018-03-09 14:13:49 +000089 Uint8Func uint8FuncPtr,
90 Params&&... params)
91{
92 return IsNeonBackendSupported(reasonIfUnsupported) &&
93 IsSupportedForDataTypeGeneric(reasonIfUnsupported,
94 dataType,
95 floatFuncPtr,
telsoa01c577f2c2018-08-31 09:22:23 +010096 floatFuncPtr,
telsoa014fcda012018-03-09 14:13:49 +000097 uint8FuncPtr,
narpra01db2b1602019-01-23 15:23:11 +000098 &FalseFunc<>,
kevmay012b4d88e2019-01-24 14:05:09 +000099 &FalseFunc<>,
telsoa014fcda012018-03-09 14:13:49 +0000100 std::forward<Params>(params)...);
101}
102
Matteo Martincighd95e9062019-01-31 15:35:59 +0000103#if defined(ARMCOMPUTENEON_ENABLED)
telsoa014fcda012018-03-09 14:13:49 +0000104template<class FuncType, class... Args>
arovir01085f0a42018-10-08 14:48:19 +0100105inline bool IsWorkloadSupported(FuncType& func, Optional<std::string&> reasonIfUnsupported, Args&&... args)
telsoa014fcda012018-03-09 14:13:49 +0000106{
107 arm_compute::Status aclStatus = func(std::forward<Args>(args)...);
108 const bool supported = (aclStatus.error_code() == arm_compute::ErrorCode::OK);
109 if (!supported && reasonIfUnsupported)
110 {
arovir01085f0a42018-10-08 14:48:19 +0100111 reasonIfUnsupported.value() = aclStatus.error_description();
telsoa014fcda012018-03-09 14:13:49 +0000112 }
113 return supported;
114}
115
116#define FORWARD_WORKLOAD_VALIDATE_FUNC(func, reasonIfUnsupported, ...) \
117 return IsWorkloadSupported(func, reasonIfUnsupported, __VA_ARGS__);
118#else
119#define FORWARD_WORKLOAD_VALIDATE_FUNC(func, reasonIfUnsupported, ...) \
Derek Lamberti901ea112019-12-10 22:07:09 +0000120 return IsNeonBackendSupported(reasonIfUnsupported, __VA_ARGS__);
telsoa014fcda012018-03-09 14:13:49 +0000121#endif
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100122} // anonymous namespace
123
Aron Virginas-Tar914e4db2019-09-09 13:36:45 +0100124bool NeonLayerSupport::IsAbsSupported(const TensorInfo& input,
125 const TensorInfo& output,
126 Optional<std::string&> reasonIfUnsupported) const
127{
josh minor4a3c6102020-01-06 16:40:46 -0600128 ElementwiseUnaryDescriptor descriptor(UnaryOperation::Abs);
129 return IsElementwiseUnarySupported(input, output, descriptor, reasonIfUnsupported);
Aron Virginas-Tar914e4db2019-09-09 13:36:45 +0100130}
131
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100132bool NeonLayerSupport::IsActivationSupported(const TensorInfo& input,
133 const TensorInfo& output,
134 const ActivationDescriptor& descriptor,
135 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000136{
137 ignore_unused(descriptor);
telsoa01c577f2c2018-08-31 09:22:23 +0100138 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonActivationWorkloadValidate,
139 reasonIfUnsupported,
140 input,
141 output,
142 descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000143}
144
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100145bool NeonLayerSupport::IsAdditionSupported(const TensorInfo& input0,
146 const TensorInfo& input1,
147 const TensorInfo& output,
148 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000149{
telsoa01c577f2c2018-08-31 09:22:23 +0100150 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonAdditionWorkloadValidate,
151 reasonIfUnsupported,
152 input0,
153 input1,
154 output);
telsoa014fcda012018-03-09 14:13:49 +0000155}
156
James Conroyd47a0642019-09-17 14:22:06 +0100157bool NeonLayerSupport::IsArgMinMaxSupported(const TensorInfo& input,
158 const TensorInfo& output,
159 const ArgMinMaxDescriptor& descriptor,
160 Optional<std::string&> reasonIfUnsupported) const
161{
162 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonArgMinMaxWorkloadValidate,
163 reasonIfUnsupported,
164 input,
165 output,
166 descriptor);
167}
168
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100169bool NeonLayerSupport::IsBatchNormalizationSupported(const TensorInfo& input,
170 const TensorInfo& output,
171 const TensorInfo& mean,
172 const TensorInfo& var,
173 const TensorInfo& beta,
174 const TensorInfo& gamma,
175 const BatchNormalizationDescriptor& descriptor,
176 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000177{
telsoa01c577f2c2018-08-31 09:22:23 +0100178 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonBatchNormalizationValidate,
179 reasonIfUnsupported,
180 input,
181 output,
182 mean,
183 var,
184 beta,
185 gamma,
186 descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000187}
188
Mike Kelly56858022020-01-27 12:14:47 +0000189bool NeonLayerSupport::IsBatchToSpaceNdSupported(const TensorInfo& input,
190 const TensorInfo& output,
191 const BatchToSpaceNdDescriptor& descriptor,
192 Optional<std::string&> reasonIfUnsupported) const
193{
194 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonBatchToSpaceNdWorkloadValidate,
195 reasonIfUnsupported,
196 input,
197 output,
198 descriptor);
199}
200
Aron Virginas-Tar77bfb5e2019-10-16 17:45:38 +0100201bool NeonLayerSupport::IsComparisonSupported(const TensorInfo& input0,
202 const TensorInfo& input1,
203 const TensorInfo& output,
204 const ComparisonDescriptor& descriptor,
205 Optional<std::string&> reasonIfUnsupported) const
206{
207 if (descriptor.m_Operation == ComparisonOperation::Greater)
208 {
209 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonGreaterWorkloadValidate,
210 reasonIfUnsupported,
211 input0,
212 input1,
213 output);
214 }
215
216 return false;
217}
218
Jim Flynn906f9462019-05-10 13:55:21 +0100219bool NeonLayerSupport::IsConcatSupported(const std::vector<const TensorInfo*> inputs,
220 const TensorInfo& output,
Jim Flynne242f2d2019-05-22 14:24:13 +0100221 const ConcatDescriptor& descriptor,
Jim Flynn906f9462019-05-10 13:55:21 +0100222 Optional<std::string&> reasonIfUnsupported) const
223{
Jim Flynne242f2d2019-05-22 14:24:13 +0100224 if (descriptor.GetNumDimensions() <= descriptor.GetConcatAxis())
225 {
226 SetValueChecked(reasonIfUnsupported, "Neon Concat: Concat axis > Number of dimensions.");
227 return false;
228 }
229
230 unsigned int concatInnerAxis = (descriptor.GetNumDimensions() - descriptor.GetConcatAxis()) - 1;
231 if(concatInnerAxis < 3) // Width, height, or channels
232 {
233 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonConcatWorkloadValidate,
234 reasonIfUnsupported,
235 inputs,
236 output,
237 descriptor);
238 }
239 else if (concatInnerAxis == 3)
240 {
241 for (auto& input : inputs)
242 {
243 if (input && !output.IsTypeSpaceMatch(*input)) // Cannot use sub-tensors if the types are not same space
244 {
245 SetValueChecked(reasonIfUnsupported, "Neon Concat: Types and quantization parameters must match.");
246 return false;
247 }
248 }
249 return true; // Sub-tensors support concat along batch
250 }
251 else // > 4 dimensions not supported.
252 {
253 SetValueChecked(reasonIfUnsupported, "Neon Concat: Maximum of 4 dimensions supported.");
254 return false;
255 }
Jim Flynn906f9462019-05-10 13:55:21 +0100256}
257
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100258bool NeonLayerSupport::IsConstantSupported(const TensorInfo& output,
259 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000260{
261 return IsSupportedForDataTypeNeon(reasonIfUnsupported,
262 output.GetDataType(),
263 &TrueFunc<>,
264 &TrueFunc<>);
265}
266
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100267bool NeonLayerSupport::IsConvertFp16ToFp32Supported(const TensorInfo& input,
268 const TensorInfo& output,
269 Optional<std::string&> reasonIfUnsupported) const
270{
271 ignore_unused(input);
272 ignore_unused(output);
273 ignore_unused(reasonIfUnsupported);
274 return true;
275}
276
277bool NeonLayerSupport::IsConvertFp32ToFp16Supported(const TensorInfo& input,
278 const TensorInfo& output,
279 Optional<std::string&> reasonIfUnsupported) const
280{
281 ignore_unused(input);
282 ignore_unused(output);
283 ignore_unused(reasonIfUnsupported);
284 return true;
285}
286
287bool NeonLayerSupport::IsConvolution2dSupported(const TensorInfo& input,
288 const TensorInfo& output,
289 const Convolution2dDescriptor& descriptor,
290 const TensorInfo& weights,
291 const Optional<TensorInfo>& biases,
292 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000293{
surmeh013537c2c2018-05-18 16:31:43 +0100294 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonConvolution2dWorkloadValidate,
295 reasonIfUnsupported,
296 input,
297 output,
298 descriptor,
299 weights,
300 biases);
telsoa014fcda012018-03-09 14:13:49 +0000301}
302
Aron Virginas-Tar2f00b742019-09-30 13:28:08 +0100303bool NeonLayerSupport::IsDepthToSpaceSupported(const TensorInfo& input,
304 const TensorInfo& output,
305 const DepthToSpaceDescriptor& descriptor,
306 Optional<std::string&> reasonIfUnsupported) const
307{
308 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDepthToSpaceWorkloadValidate,
309 reasonIfUnsupported,
310 input,
311 output,
312 descriptor);
313}
314
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100315bool NeonLayerSupport::IsDepthwiseConvolutionSupported(const TensorInfo& input,
316 const TensorInfo& output,
317 const DepthwiseConvolution2dDescriptor& descriptor,
318 const TensorInfo& weights,
319 const Optional<TensorInfo>& biases,
320 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000321{
telsoa01c577f2c2018-08-31 09:22:23 +0100322 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDepthwiseConvolutionWorkloadValidate,
323 reasonIfUnsupported,
324 input,
325 output,
326 descriptor,
327 weights,
328 biases);
telsoa014fcda012018-03-09 14:13:49 +0000329}
330
Narumol Prangnawarat01961a72019-05-30 16:47:12 +0100331bool NeonLayerSupport::IsDequantizeSupported(const TensorInfo& input,
332 const TensorInfo& output,
333 Optional<std::string&> reasonIfUnsupported) const
334{
335 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDequantizeWorkloadValidate,
336 reasonIfUnsupported,
337 input,
338 output);
339}
340
Derek Lamberti6a5e5e82019-12-05 14:41:20 +0000341bool NeonLayerSupport::IsDetectionPostProcessSupported(const TensorInfo& boxEncodings,
342 const TensorInfo& scores,
343 const TensorInfo& anchors,
344 const TensorInfo& detectionBoxes,
345 const TensorInfo& detectionClasses,
346 const TensorInfo& detectionScores,
347 const TensorInfo& numDetections,
348 const DetectionPostProcessDescriptor& descriptor,
349 Optional<std::string&> reasonIfUnsupported) const
350{
351 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDetectionPostProcessValidate,
352 reasonIfUnsupported,
353 boxEncodings,
354 scores,
355 anchors,
356 detectionBoxes,
357 detectionClasses,
358 detectionScores,
359 numDetections,
360 descriptor);
361}
362
363
Pablo Tellof0bd6832019-04-26 17:58:13 +0100364bool NeonLayerSupport::IsDilatedDepthwiseConvolutionSupported(const TensorInfo& input,
365 const TensorInfo& output,
366 const DepthwiseConvolution2dDescriptor& descriptor,
367 const TensorInfo& weights,
368 const Optional<TensorInfo>& biases,
369 Optional<std::string&> reasonIfUnsupported) const
370{
371 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDepthwiseConvolutionWorkloadValidate,
372 reasonIfUnsupported,
373 input,
374 output,
375 descriptor,
376 weights,
377 biases);
378}
379
josh minor4a3c6102020-01-06 16:40:46 -0600380bool NeonLayerSupport::IsElementwiseUnarySupported(const TensorInfo& input,
381 const TensorInfo& output,
382 const ElementwiseUnaryDescriptor& descriptor,
383 Optional<std::string&> reasonIfUnsupported) const
384{
385 if (descriptor.m_Operation == UnaryOperation::Abs)
386 {
387 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonAbsWorkloadValidate,
388 reasonIfUnsupported,
389 input,
390 output);
391 }
392 else if (descriptor.m_Operation == UnaryOperation::Rsqrt)
393 {
394 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonRsqrtWorkloadValidate,
395 reasonIfUnsupported,
396 input,
397 output);
398 }
399
400 return false;
401}
402
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100403bool NeonLayerSupport::IsFloorSupported(const TensorInfo& input,
404 const TensorInfo& output,
405 Optional<std::string&> reasonIfUnsupported) const
406{
407 ignore_unused(output);
408 return IsNeonBackendSupported(reasonIfUnsupported) &&
409 IsSupportedForDataTypeGeneric(reasonIfUnsupported,
410 input.GetDataType(),
411 &FalseFuncF16<>,
412 &TrueFunc<>,
narpra01db2b1602019-01-23 15:23:11 +0000413 &FalseFuncU8<>,
kevmay012b4d88e2019-01-24 14:05:09 +0000414 &FalseFuncI32<>,
415 &FalseFuncU8<>);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100416}
417
418bool NeonLayerSupport::IsFullyConnectedSupported(const TensorInfo& input,
419 const TensorInfo& output,
420 const TensorInfo& weights,
421 const TensorInfo& biases,
422 const FullyConnectedDescriptor& descriptor,
423 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000424{
telsoa01c577f2c2018-08-31 09:22:23 +0100425 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonFullyConnectedWorkloadValidate,
426 reasonIfUnsupported,
427 input,
428 output,
429 weights,
430 biases,
431 descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000432}
433
kevmay01eed85922019-01-28 08:37:25 +0000434bool NeonLayerSupport::IsGreaterSupported(const armnn::TensorInfo& input0,
435 const armnn::TensorInfo& input1,
436 const armnn::TensorInfo& output,
437 armnn::Optional<std::string&> reasonIfUnsupported) const
438{
Aron Virginas-Tar77bfb5e2019-10-16 17:45:38 +0100439 ComparisonDescriptor descriptor(ComparisonOperation::Greater);
440 return IsComparisonSupported(input0, input1, output, descriptor, reasonIfUnsupported);
kevmay01eed85922019-01-28 08:37:25 +0000441}
442
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100443bool NeonLayerSupport::IsInputSupported(const TensorInfo& input,
444 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000445{
Derek Lamberti901ea112019-12-10 22:07:09 +0000446 return IsNeonBackendSupported(reasonIfUnsupported, input);
telsoa014fcda012018-03-09 14:13:49 +0000447}
448
Sadik Armagan0d4863d2019-10-09 14:26:32 +0100449bool NeonLayerSupport::IsInstanceNormalizationSupported(const TensorInfo& input,
450 const TensorInfo& output,
451 const InstanceNormalizationDescriptor& descriptor,
452 Optional<std::string&> reasonIfUnsupported) const
453{
454 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonInstanceNormalizationWorkloadValidate,
455 reasonIfUnsupported,
456 input,
457 output,
458 descriptor);
459}
460
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100461bool NeonLayerSupport::IsL2NormalizationSupported(const TensorInfo& input,
462 const TensorInfo& output,
463 const L2NormalizationDescriptor& descriptor,
464 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000465{
Matteo Martincighbcd3c852018-09-28 14:14:12 +0100466 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonL2NormalizationWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000467}
468
Jan Eilersad5293a2019-07-08 09:57:55 +0100469bool NeonLayerSupport::IsLstmSupported(const TensorInfo& input,
470 const TensorInfo& outputStateIn,
471 const TensorInfo& cellStateIn,
472 const TensorInfo& scratchBuffer,
473 const TensorInfo& outputStateOut,
474 const TensorInfo& cellStateOut,
475 const TensorInfo& output,
476 const LstmDescriptor& descriptor,
477 const LstmInputParamsInfo& paramsInfo,
478 Optional<std::string&> reasonIfUnsupported) const
479{
480 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonLstmFloatWorkloadValidate,
481 reasonIfUnsupported,
482 input,
483 outputStateIn,
484 cellStateIn,
485 scratchBuffer,
486 outputStateOut,
487 cellStateOut,
488 output,
489 descriptor,
490 paramsInfo);
491}
492
Nattapat Chaimanowong4e6597a2018-12-20 14:14:06 +0000493bool NeonLayerSupport::IsMaximumSupported(const TensorInfo& input0,
494 const TensorInfo& input1,
495 const TensorInfo& output,
496 Optional<std::string&> reasonIfUnsupported) const
497{
498 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMaximumWorkloadValidate,
499 reasonIfUnsupported,
500 input0,
501 input1,
502 output);
503}
504
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100505bool NeonLayerSupport::IsMeanSupported(const TensorInfo& input,
506 const TensorInfo& output,
507 const MeanDescriptor& descriptor,
508 Optional<std::string&> reasonIfUnsupported) const
narpra0132b90462018-09-13 11:07:48 +0100509{
Matthew Benthamfd899962018-12-31 15:49:42 +0000510 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMeanWorkloadValidate,
511 reasonIfUnsupported,
512 input,
513 output,
514 descriptor);
narpra0132b90462018-09-13 11:07:48 +0100515}
516
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100517bool NeonLayerSupport::IsMergerSupported(const std::vector<const TensorInfo*> inputs,
Nikhil Raj8599a412018-11-19 14:51:07 +0000518 const TensorInfo& output,
Jim Flynne242f2d2019-05-22 14:24:13 +0100519 const MergerDescriptor& descriptor,
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100520 Optional<std::string&> reasonIfUnsupported) const
521{
Jim Flynne242f2d2019-05-22 14:24:13 +0100522 return IsConcatSupported(inputs, output, descriptor, reasonIfUnsupported);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100523}
524
Conor Kennedy54b21692019-01-09 07:57:38 +0000525bool NeonLayerSupport::IsMinimumSupported(const TensorInfo& input0,
526 const TensorInfo& input1,
527 const TensorInfo& output,
528 Optional<std::string&> reasonIfUnsupported) const
529{
530 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMinimumWorkloadValidate,
531 reasonIfUnsupported,
532 input0,
533 input1,
534 output);
535}
536
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100537bool NeonLayerSupport::IsMultiplicationSupported(const TensorInfo& input0,
538 const TensorInfo& input1,
539 const TensorInfo& output,
540 Optional<std::string&> reasonIfUnsupported) const
541{
542 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMultiplicationWorkloadValidate,
543 reasonIfUnsupported,
544 input0,
545 input1,
546 output);
547}
548
Pablo Telloe61f0712020-01-23 10:37:17 +0000549bool NeonLayerSupport::IsDivisionSupported(const TensorInfo& input0,
550 const TensorInfo& input1,
551 const TensorInfo& output,
552 Optional<std::string&> reasonIfUnsupported) const
553{
554 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDivisionWorkloadValidate,
555 reasonIfUnsupported,
556 input0,
557 input1,
558 output);
559}
560
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100561bool NeonLayerSupport::IsNormalizationSupported(const TensorInfo& input,
562 const TensorInfo& output,
563 const NormalizationDescriptor& descriptor,
564 Optional<std::string&> reasonIfUnsupported) const
565{
566 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonNormalizationWorkloadValidate,
567 reasonIfUnsupported,
568 input,
569 output,
570 descriptor);
571}
572
573bool NeonLayerSupport::IsOutputSupported(const TensorInfo& output,
574 Optional<std::string&> reasonIfUnsupported) const
575{
Derek Lamberti901ea112019-12-10 22:07:09 +0000576 return IsNeonBackendSupported(reasonIfUnsupported, output);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100577}
578
Éanna Ó Catháin12055742019-01-25 10:01:40 +0000579bool NeonLayerSupport::IsPadSupported(const TensorInfo& input,
580 const TensorInfo& output,
581 const PadDescriptor& descriptor,
582 Optional<std::string&> reasonIfUnsupported) const
583{
584 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPadWorkloadValidate,
585 reasonIfUnsupported,
586 input,
587 output,
588 descriptor);
589}
590
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100591bool NeonLayerSupport::IsPermuteSupported(const TensorInfo& input,
592 const TensorInfo& output,
593 const PermuteDescriptor& descriptor,
594 Optional<std::string&> reasonIfUnsupported) const
595{
596 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPermuteWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000597}
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100598
599bool NeonLayerSupport::IsPooling2dSupported(const TensorInfo& input,
600 const TensorInfo& output,
601 const Pooling2dDescriptor& descriptor,
602 Optional<std::string&> reasonIfUnsupported) const
603{
604 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPooling2dWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
605}
606
Nikhil Raj9b461482019-07-03 15:58:31 +0100607bool NeonLayerSupport::IsPreluSupported(const armnn::TensorInfo &input,
608 const armnn::TensorInfo &alpha,
609 const armnn::TensorInfo &output,
610 armnn::Optional<std::string &> reasonIfUnsupported) const
611{
612 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPreluWorkloadValidate, reasonIfUnsupported, input, alpha, output);
613}
614
Sadik Armaganfabc2892019-05-31 09:05:11 +0100615bool NeonLayerSupport::IsQuantizeSupported(const TensorInfo& input,
616 const TensorInfo& output,
617 Optional<std::string&> reasonIfUnsupported) const
618{
619 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonQuantizeWorkloadValidate,
620 reasonIfUnsupported,
621 input,
622 output);
623}
624
Francis Murtagh4fc3c482019-08-02 13:20:54 +0100625bool NeonLayerSupport::IsQuantizedLstmSupported(const TensorInfo& input,
626 const TensorInfo& cellStateIn,
627 const TensorInfo& outputStateIn,
628 const TensorInfo& cellStateOut,
629 const TensorInfo& outputStateOut,
630 const QuantizedLstmInputParamsInfo& paramsInfo,
631 Optional<std::string&> reasonIfUnsupported) const
632{
633 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonQuantizedLstmWorkloadValidate,
634 reasonIfUnsupported,
635 input,
636 cellStateIn,
637 outputStateIn,
638 cellStateOut,
639 outputStateOut,
640 paramsInfo);
641}
642
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100643bool NeonLayerSupport::IsReshapeSupported(const TensorInfo& input,
Kevin Maya023c402019-12-12 17:28:05 +0000644 const TensorInfo& output,
Matteo Martincigh992d6dc2019-01-10 17:34:20 +0000645 const ReshapeDescriptor& descriptor,
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100646 Optional<std::string&> reasonIfUnsupported) const
647{
Matteo Martincigh992d6dc2019-01-10 17:34:20 +0000648 ignore_unused(descriptor);
Kevin Maya023c402019-12-12 17:28:05 +0000649 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonReshapeWorkloadValidate,
650 reasonIfUnsupported,
651 input,
652 output);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100653}
654
Aron Virginas-Tar169d2f12019-07-01 19:01:44 +0100655bool NeonLayerSupport::IsResizeSupported(const TensorInfo& input,
656 const TensorInfo& output,
657 const ResizeDescriptor& descriptor,
658 Optional<std::string&> reasonIfUnsupported) const
659{
Ellen Norris-Thompson37e68682019-07-15 14:23:30 +0100660 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonResizeWorkloadValidate,
661 reasonIfUnsupported,
662 input,
663 output,
664 descriptor);
Aron Virginas-Tar169d2f12019-07-01 19:01:44 +0100665}
666
Sadik Armaganc625f002018-12-17 11:32:16 +0000667bool NeonLayerSupport::IsResizeBilinearSupported(const TensorInfo& input,
668 const TensorInfo& output,
669 Optional<std::string&> reasonIfUnsupported) const
670{
Ellen Norris-Thompson37e68682019-07-15 14:23:30 +0100671 ResizeDescriptor descriptor;
672 descriptor.m_Method = ResizeMethod::Bilinear;
673 descriptor.m_DataLayout = DataLayout::NCHW;
674
675 const TensorShape& outputShape = output.GetShape();
676 descriptor.m_TargetHeight = outputShape[2];
677 descriptor.m_TargetWidth = outputShape[3];
678
679 return IsResizeSupported(input, output, descriptor, reasonIfUnsupported);
Sadik Armaganc625f002018-12-17 11:32:16 +0000680}
681
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +0100682bool NeonLayerSupport::IsRsqrtSupported(const TensorInfo& input,
683 const TensorInfo& output,
684 Optional<std::string&> reasonIfUnsupported) const
685{
josh minor4a3c6102020-01-06 16:40:46 -0600686 ElementwiseUnaryDescriptor descriptor(UnaryOperation::Rsqrt);
687 return IsElementwiseUnarySupported(input, output, descriptor, reasonIfUnsupported);
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +0100688}
689
josh minor036f02d2019-11-15 14:53:22 -0600690bool NeonLayerSupport::IsSliceSupported(const TensorInfo& input,
691 const TensorInfo& output,
692 const SliceDescriptor& descriptor,
693 Optional<std::string&> reasonIfUnsupported) const
694{
695 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSliceWorkloadValidate,
696 reasonIfUnsupported,
697 input,
698 output,
699 descriptor);
700}
701
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100702bool NeonLayerSupport::IsSoftmaxSupported(const TensorInfo& input,
703 const TensorInfo& output,
704 const SoftmaxDescriptor& descriptor,
705 Optional<std::string&> reasonIfUnsupported) const
706{
707 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSoftmaxWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
708}
709
Mike Kelly0be3a882020-01-24 11:27:50 +0000710bool NeonLayerSupport::IsSpaceToBatchNdSupported(const TensorInfo& input,
711 const TensorInfo& output,
712 const SpaceToBatchNdDescriptor& descriptor,
713 Optional<std::string&> reasonIfUnsupported) const
714{
715 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSpaceToBatchNdWorkloadValidate,
716 reasonIfUnsupported,
717 input,
718 output,
719 descriptor);
720}
721
Ellen Norris-Thompson29794572019-06-26 16:40:36 +0100722bool NeonLayerSupport::IsSpaceToDepthSupported(const TensorInfo& input,
Mike Kelly0be3a882020-01-24 11:27:50 +0000723 const TensorInfo& output,
724 const SpaceToDepthDescriptor& descriptor,
725 Optional<std::string&> reasonIfUnsupported) const
Ellen Norris-Thompson29794572019-06-26 16:40:36 +0100726{
727 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSpaceToDepthWorkloadValidate,
728 reasonIfUnsupported,
729 input,
730 output,
731 descriptor);
732}
733
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100734bool NeonLayerSupport::IsSplitterSupported(const TensorInfo& input,
735 const ViewsDescriptor& descriptor,
736 Optional<std::string&> reasonIfUnsupported) const
737{
738 ignore_unused(descriptor);
739 return IsSupportedForDataTypeNeon(reasonIfUnsupported,
740 input.GetDataType(),
741 &TrueFunc<>,
742 &TrueFunc<>);
743}
744
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +0100745bool NeonLayerSupport::IsSplitterSupported(const TensorInfo& input,
746 const std::vector<std::reference_wrapper<TensorInfo>>& outputs,
747 const ViewsDescriptor& descriptor,
748 Optional<std::string&> reasonIfUnsupported) const
749{
750#if defined(ARMCOMPUTENEON_ENABLED)
751 // Split along the last dimension, cannot use sub-tensors
752 // as width and height of the sub-tensors do not match
753 // the width and height of the parent tensor
754 // in case of input with more than 2D.
755 std::set<unsigned int> splitAxis = ComputeSplitAxis(descriptor, input.GetShape());
756 if (descriptor.GetNumDimensions() > 2 && splitAxis.size() == 1 &&
757 *splitAxis.begin() == descriptor.GetNumDimensions() - 1 )
758 {
759 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSplitterWorkloadValidate,
760 reasonIfUnsupported,
761 input,
762 outputs,
763 *splitAxis.begin());
764 }
765#endif
Derek Lamberti901ea112019-12-10 22:07:09 +0000766 boost::ignore_unused(descriptor);
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +0100767 for (auto output : outputs)
768 {
769 if (!input.IsTypeSpaceMatch(output)) // Cannot use sub-tensors if the types are not same space
770 {
771 SetValueChecked(reasonIfUnsupported, "Neon Splitter: Types and quantization parameters must match.");
772 return false;
773 }
774 }
775 return true;
776}
777
Matthew Jackson87f65ea2019-08-01 10:01:34 +0100778bool NeonLayerSupport::IsStackSupported(const std::vector<const TensorInfo*>& inputs,
779 const TensorInfo& output,
780 const StackDescriptor& descriptor,
781 Optional<std::string&> reasonIfUnsupported) const
782{
783 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonStackWorkloadValidate,
784 reasonIfUnsupported,
785 inputs,
786 output,
787 descriptor);
788}
789
FinnWilliamsArm1fa19192019-08-02 17:26:31 +0100790bool NeonLayerSupport::IsStridedSliceSupported(const TensorInfo& input,
791 const TensorInfo& output,
792 const StridedSliceDescriptor& descriptor,
793 Optional<std::string&> reasonIfUnsupported) const
794{
795 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonStridedSliceWorkloadValidate,
796 reasonIfUnsupported,
797 input,
798 output,
799 descriptor);
800}
801
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100802bool NeonLayerSupport::IsSubtractionSupported(const TensorInfo& input0,
803 const TensorInfo& input1,
804 const TensorInfo& output,
805 Optional<std::string&> reasonIfUnsupported) const
806{
807 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSubtractionWorkloadValidate,
808 reasonIfUnsupported,
809 input0,
810 input1,
811 output);
812}
813
Sadik Armagan581742d2019-08-12 14:11:37 +0100814bool NeonLayerSupport::IsTransposeConvolution2dSupported(const TensorInfo& input,
815 const TensorInfo& output,
816 const TransposeConvolution2dDescriptor& descriptor,
817 const TensorInfo& weights,
818 const Optional<TensorInfo>& biases,
819 Optional<std::string&> reasonIfUnsupported) const
820{
821 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonTransposeConvolution2dWorkloadValidate,
822 reasonIfUnsupported,
823 input,
824 output,
825 descriptor,
826 weights,
827 biases);
828}
829
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100830} // namespace armnn