blob: 6ca69f48416e82ff5b3f3e060e5b82d6cec901fa [file] [log] [blame]
telsoa014fcda012018-03-09 14:13:49 +00001//
2// Copyright © 2017 Arm Ltd. All rights reserved.
David Beckecb56cd2018-09-05 12:52:57 +01003// SPDX-License-Identifier: MIT
telsoa014fcda012018-03-09 14:13:49 +00004//
5
6#include "NeonLayerSupport.hpp"
David Beck3e9e1152018-10-17 14:17:50 +01007#include "NeonBackendId.hpp"
telsoa014fcda012018-03-09 14:13:49 +00008
telsoa014fcda012018-03-09 14:13:49 +00009#include <armnn/Descriptors.hpp>
telsoa014fcda012018-03-09 14:13:49 +000010#include <armnn/Tensor.hpp>
Aron Virginas-Tarfc824312018-10-15 15:00:13 +010011#include <armnn/Types.hpp>
Matteo Martincighc601aa62019-10-29 15:03:22 +000012#include <armnn/BackendRegistry.hpp>
telsoa014fcda012018-03-09 14:13:49 +000013
Matteo Martincighc601aa62019-10-29 15:03:22 +000014#include <InternalTypes.hpp>
15#include <LayerSupportCommon.hpp>
David Beck3e9e1152018-10-17 14:17:50 +010016
telsoa014fcda012018-03-09 14:13:49 +000017#include <boost/core/ignore_unused.hpp>
18
Matteo Martincighd95e9062019-01-31 15:35:59 +000019#if defined(ARMCOMPUTENEON_ENABLED)
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +010020#include <aclCommon/ArmComputeUtils.hpp>
Aron Virginas-Tar710f6642019-11-27 14:48:32 +000021#include <aclCommon/ArmComputeTensorUtils.hpp>
Aron Virginas-Tar914e4db2019-09-09 13:36:45 +010022#include "workloads/NeonAbsWorkload.hpp"
Matthew Bentham955258d2018-12-10 10:48:52 +000023#include "workloads/NeonAdditionWorkload.hpp"
Nattapat Chaimanowongd4b70592018-10-12 11:21:49 +010024#include "workloads/NeonActivationWorkload.hpp"
James Conroyd47a0642019-09-17 14:22:06 +010025#include "workloads/NeonArgMinMaxWorkload.hpp"
Matthew Benthamc48ac8c2018-12-12 16:15:59 +000026#include "workloads/NeonBatchNormalizationWorkload.hpp"
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +010027#include "workloads/NeonConvolution2dWorkload.hpp"
Aron Virginas-Tar2f00b742019-09-30 13:28:08 +010028#include "workloads/NeonDepthToSpaceWorkload.hpp"
Nattapat Chaimanowong77140882018-10-17 11:12:19 +010029#include "workloads/NeonDepthwiseConvolutionWorkload.hpp"
Narumol Prangnawarat01961a72019-05-30 16:47:12 +010030#include "workloads/NeonDequantizeWorkload.hpp"
Derek Lamberti6a5e5e82019-12-05 14:41:20 +000031#include "workloads/NeonDetectionPostProcessWorkload.hpp"
kevmay01eed85922019-01-28 08:37:25 +000032#include "workloads/NeonGreaterWorkload.hpp"
Sadik Armagan0d4863d2019-10-09 14:26:32 +010033#include "workloads/NeonInstanceNormalizationWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010034#include "workloads/NeonL2NormalizationFloatWorkload.hpp"
Jan Eilersad5293a2019-07-08 09:57:55 +010035#include "workloads/NeonLstmFloatWorkload.hpp"
Nattapat Chaimanowong4e6597a2018-12-20 14:14:06 +000036#include "workloads/NeonMaximumWorkload.hpp"
Matthew Benthamfd899962018-12-31 15:49:42 +000037#include "workloads/NeonMeanWorkload.hpp"
Jim Flynn39d487d2019-05-17 15:44:36 +010038#include "workloads/NeonConcatWorkload.hpp"
Conor Kennedy54b21692019-01-09 07:57:38 +000039#include "workloads/NeonMinimumWorkload.hpp"
Conor Kennedyb99480b2019-03-08 08:24:41 +000040#include "workloads/NeonMultiplicationWorkload.hpp"
Pablo Telloe61f0712020-01-23 10:37:17 +000041#include "workloads/NeonDivisionWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010042#include "workloads/NeonNormalizationFloatWorkload.hpp"
43#include "workloads/NeonFullyConnectedWorkload.hpp"
Éanna Ó Catháin12055742019-01-25 10:01:40 +000044#include "workloads/NeonPadWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010045#include "workloads/NeonPermuteWorkload.hpp"
Nattapat Chaimanowong5d2e7002018-10-12 16:03:56 +010046#include "workloads/NeonPooling2dWorkload.hpp"
Nikhil Raj9b461482019-07-03 15:58:31 +010047#include "workloads/NeonPreluWorkload.hpp"
Sadik Armaganfabc2892019-05-31 09:05:11 +010048#include "workloads/NeonQuantizeWorkload.hpp"
Francis Murtagh4fc3c482019-08-02 13:20:54 +010049#include "workloads/NeonQuantizedLstmWorkload.hpp"
Ellen Norris-Thompson37e68682019-07-15 14:23:30 +010050#include "workloads/NeonResizeWorkload.hpp"
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +010051#include "workloads/NeonRsqrtWorkload.hpp"
josh minor036f02d2019-11-15 14:53:22 -060052#include "workloads/NeonSliceWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010053#include "workloads/NeonSoftmaxBaseWorkload.hpp"
Mike Kelly0be3a882020-01-24 11:27:50 +000054#include "workloads/NeonSpaceToBatchNdWorkload.hpp"
Ellen Norris-Thompson29794572019-06-26 16:40:36 +010055#include "workloads/NeonSpaceToDepthWorkload.hpp"
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +010056#include "workloads/NeonSplitterWorkload.hpp"
Matthew Jackson87f65ea2019-08-01 10:01:34 +010057#include "workloads/NeonStackWorkload.hpp"
FinnWilliamsArm1fa19192019-08-02 17:26:31 +010058#include "workloads/NeonStridedSliceWorkload.hpp"
Conor Kennedyb99480b2019-03-08 08:24:41 +000059#include "workloads/NeonSubtractionWorkload.hpp"
Sadik Armagan581742d2019-08-12 14:11:37 +010060#include "workloads/NeonTransposeConvolution2dWorkload.hpp"
telsoa014fcda012018-03-09 14:13:49 +000061#endif
62
63using namespace boost;
64
65namespace armnn
66{
telsoa014fcda012018-03-09 14:13:49 +000067
Aron Virginas-Tarfc824312018-10-15 15:00:13 +010068namespace
arovir017ff76c52018-10-09 09:40:58 +010069{
telsoa014fcda012018-03-09 14:13:49 +000070
Derek Lamberti901ea112019-12-10 22:07:09 +000071template< typename ... Args>
72bool IsNeonBackendSupported(Optional<std::string&> reasonIfUnsupported, Args... args)
telsoa014fcda012018-03-09 14:13:49 +000073{
Derek Lambertibaa177f2019-12-10 22:00:43 +000074 boost::ignore_unused(reasonIfUnsupported, (args)...);
Matteo Martincighd95e9062019-01-31 15:35:59 +000075#if defined(ARMCOMPUTENEON_ENABLED)
telsoa014fcda012018-03-09 14:13:49 +000076 return true;
77#else
Derek Lamberti0790dce2019-04-15 18:37:35 +010078 SetValueChecked(reasonIfUnsupported, "The armnn library has been built without NEON support");
telsoa014fcda012018-03-09 14:13:49 +000079 return false;
80#endif
81}
82
telsoa01c577f2c2018-08-31 09:22:23 +010083template<typename FloatFunc, typename Uint8Func, typename ... Params>
arovir01085f0a42018-10-08 14:48:19 +010084bool IsSupportedForDataTypeNeon(Optional<std::string&> reasonIfUnsupported,
telsoa014fcda012018-03-09 14:13:49 +000085 DataType dataType,
telsoa01c577f2c2018-08-31 09:22:23 +010086 FloatFunc floatFuncPtr,
telsoa014fcda012018-03-09 14:13:49 +000087 Uint8Func uint8FuncPtr,
88 Params&&... params)
89{
90 return IsNeonBackendSupported(reasonIfUnsupported) &&
91 IsSupportedForDataTypeGeneric(reasonIfUnsupported,
92 dataType,
93 floatFuncPtr,
telsoa01c577f2c2018-08-31 09:22:23 +010094 floatFuncPtr,
telsoa014fcda012018-03-09 14:13:49 +000095 uint8FuncPtr,
narpra01db2b1602019-01-23 15:23:11 +000096 &FalseFunc<>,
kevmay012b4d88e2019-01-24 14:05:09 +000097 &FalseFunc<>,
telsoa014fcda012018-03-09 14:13:49 +000098 std::forward<Params>(params)...);
99}
100
#if defined(ARMCOMPUTENEON_ENABLED)
// Invokes a validate function that returns an arm_compute::Status and converts the
// result into a bool. On failure the status' error description is copied into
// reasonIfUnsupported, provided the caller supplied one.
template<class FuncType, class... Args>
inline bool IsWorkloadSupported(FuncType& func, Optional<std::string&> reasonIfUnsupported, Args&&... args)
{
    arm_compute::Status validationStatus = func(std::forward<Args>(args)...);
    if (validationStatus.error_code() == arm_compute::ErrorCode::OK)
    {
        return true;
    }

    if (reasonIfUnsupported)
    {
        reasonIfUnsupported.value() = validationStatus.error_description();
    }
    return false;
}

// NEON build: return the outcome of the given validate function.
// Note that the macro expands to a complete return statement.
#define FORWARD_WORKLOAD_VALIDATE_FUNC(func, reasonIfUnsupported, ...) \
    return IsWorkloadSupported(func, reasonIfUnsupported, __VA_ARGS__);
#else
// Non-NEON build: the validate function is not referenced; return the result of
// IsNeonBackendSupported, which reports that NEON support is missing.
#define FORWARD_WORKLOAD_VALIDATE_FUNC(func, reasonIfUnsupported, ...) \
    return IsNeonBackendSupported(reasonIfUnsupported, __VA_ARGS__);
#endif
120
// Quantization-multiplier check used by the convolution-style layers below.
#if defined(ARMCOMPUTENEON_ENABLED)
// NEON build: ask armcomputetensorutils::IsQuantMultiplierSupported.
#define IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights) \
    armcomputetensorutils::IsQuantMultiplierSupported(input, output, weights)
#else
// Non-NEON build: the check always passes.
#define IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights) true
#endif
127
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100128} // anonymous namespace
129
Aron Virginas-Tar914e4db2019-09-09 13:36:45 +0100130bool NeonLayerSupport::IsAbsSupported(const TensorInfo& input,
131 const TensorInfo& output,
132 Optional<std::string&> reasonIfUnsupported) const
133{
josh minor4a3c6102020-01-06 16:40:46 -0600134 ElementwiseUnaryDescriptor descriptor(UnaryOperation::Abs);
135 return IsElementwiseUnarySupported(input, output, descriptor, reasonIfUnsupported);
Aron Virginas-Tar914e4db2019-09-09 13:36:45 +0100136}
137
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100138bool NeonLayerSupport::IsActivationSupported(const TensorInfo& input,
139 const TensorInfo& output,
140 const ActivationDescriptor& descriptor,
141 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000142{
143 ignore_unused(descriptor);
telsoa01c577f2c2018-08-31 09:22:23 +0100144 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonActivationWorkloadValidate,
145 reasonIfUnsupported,
146 input,
147 output,
148 descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000149}
150
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100151bool NeonLayerSupport::IsAdditionSupported(const TensorInfo& input0,
152 const TensorInfo& input1,
153 const TensorInfo& output,
154 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000155{
telsoa01c577f2c2018-08-31 09:22:23 +0100156 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonAdditionWorkloadValidate,
157 reasonIfUnsupported,
158 input0,
159 input1,
160 output);
telsoa014fcda012018-03-09 14:13:49 +0000161}
162
James Conroyd47a0642019-09-17 14:22:06 +0100163bool NeonLayerSupport::IsArgMinMaxSupported(const TensorInfo& input,
164 const TensorInfo& output,
165 const ArgMinMaxDescriptor& descriptor,
166 Optional<std::string&> reasonIfUnsupported) const
167{
168 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonArgMinMaxWorkloadValidate,
169 reasonIfUnsupported,
170 input,
171 output,
172 descriptor);
173}
174
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100175bool NeonLayerSupport::IsBatchNormalizationSupported(const TensorInfo& input,
176 const TensorInfo& output,
177 const TensorInfo& mean,
178 const TensorInfo& var,
179 const TensorInfo& beta,
180 const TensorInfo& gamma,
181 const BatchNormalizationDescriptor& descriptor,
182 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000183{
telsoa01c577f2c2018-08-31 09:22:23 +0100184 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonBatchNormalizationValidate,
185 reasonIfUnsupported,
186 input,
187 output,
188 mean,
189 var,
190 beta,
191 gamma,
192 descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000193}
194
Aron Virginas-Tar77bfb5e2019-10-16 17:45:38 +0100195bool NeonLayerSupport::IsComparisonSupported(const TensorInfo& input0,
196 const TensorInfo& input1,
197 const TensorInfo& output,
198 const ComparisonDescriptor& descriptor,
199 Optional<std::string&> reasonIfUnsupported) const
200{
201 if (descriptor.m_Operation == ComparisonOperation::Greater)
202 {
203 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonGreaterWorkloadValidate,
204 reasonIfUnsupported,
205 input0,
206 input1,
207 output);
208 }
209
210 return false;
211}
212
Jim Flynn906f9462019-05-10 13:55:21 +0100213bool NeonLayerSupport::IsConcatSupported(const std::vector<const TensorInfo*> inputs,
214 const TensorInfo& output,
Jim Flynne242f2d2019-05-22 14:24:13 +0100215 const ConcatDescriptor& descriptor,
Jim Flynn906f9462019-05-10 13:55:21 +0100216 Optional<std::string&> reasonIfUnsupported) const
217{
Jim Flynne242f2d2019-05-22 14:24:13 +0100218 if (descriptor.GetNumDimensions() <= descriptor.GetConcatAxis())
219 {
220 SetValueChecked(reasonIfUnsupported, "Neon Concat: Concat axis > Number of dimensions.");
221 return false;
222 }
223
224 unsigned int concatInnerAxis = (descriptor.GetNumDimensions() - descriptor.GetConcatAxis()) - 1;
225 if(concatInnerAxis < 3) // Width, height, or channels
226 {
227 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonConcatWorkloadValidate,
228 reasonIfUnsupported,
229 inputs,
230 output,
231 descriptor);
232 }
233 else if (concatInnerAxis == 3)
234 {
235 for (auto& input : inputs)
236 {
237 if (input && !output.IsTypeSpaceMatch(*input)) // Cannot use sub-tensors if the types are not same space
238 {
239 SetValueChecked(reasonIfUnsupported, "Neon Concat: Types and quantization parameters must match.");
240 return false;
241 }
242 }
243 return true; // Sub-tensors support concat along batch
244 }
245 else // > 4 dimensions not supported.
246 {
247 SetValueChecked(reasonIfUnsupported, "Neon Concat: Maximum of 4 dimensions supported.");
248 return false;
249 }
Jim Flynn906f9462019-05-10 13:55:21 +0100250}
251
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100252bool NeonLayerSupport::IsConstantSupported(const TensorInfo& output,
253 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000254{
255 return IsSupportedForDataTypeNeon(reasonIfUnsupported,
256 output.GetDataType(),
257 &TrueFunc<>,
258 &TrueFunc<>);
259}
260
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100261bool NeonLayerSupport::IsConvertFp16ToFp32Supported(const TensorInfo& input,
262 const TensorInfo& output,
263 Optional<std::string&> reasonIfUnsupported) const
264{
265 ignore_unused(input);
266 ignore_unused(output);
267 ignore_unused(reasonIfUnsupported);
268 return true;
269}
270
271bool NeonLayerSupport::IsConvertFp32ToFp16Supported(const TensorInfo& input,
272 const TensorInfo& output,
273 Optional<std::string&> reasonIfUnsupported) const
274{
275 ignore_unused(input);
276 ignore_unused(output);
277 ignore_unused(reasonIfUnsupported);
278 return true;
279}
280
281bool NeonLayerSupport::IsConvolution2dSupported(const TensorInfo& input,
282 const TensorInfo& output,
283 const Convolution2dDescriptor& descriptor,
284 const TensorInfo& weights,
285 const Optional<TensorInfo>& biases,
286 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000287{
Aron Virginas-Tar710f6642019-11-27 14:48:32 +0000288 if (!IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights))
James Conroyb86a3822019-11-19 15:28:58 +0000289 {
290 return false;
291 }
292
surmeh013537c2c2018-05-18 16:31:43 +0100293 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonConvolution2dWorkloadValidate,
294 reasonIfUnsupported,
295 input,
296 output,
297 descriptor,
298 weights,
299 biases);
telsoa014fcda012018-03-09 14:13:49 +0000300}
301
Aron Virginas-Tar2f00b742019-09-30 13:28:08 +0100302bool NeonLayerSupport::IsDepthToSpaceSupported(const TensorInfo& input,
303 const TensorInfo& output,
304 const DepthToSpaceDescriptor& descriptor,
305 Optional<std::string&> reasonIfUnsupported) const
306{
307 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDepthToSpaceWorkloadValidate,
308 reasonIfUnsupported,
309 input,
310 output,
311 descriptor);
312}
313
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100314bool NeonLayerSupport::IsDepthwiseConvolutionSupported(const TensorInfo& input,
315 const TensorInfo& output,
316 const DepthwiseConvolution2dDescriptor& descriptor,
317 const TensorInfo& weights,
318 const Optional<TensorInfo>& biases,
319 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000320{
Aron Virginas-Tar710f6642019-11-27 14:48:32 +0000321 if (!IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights))
James Conroyb86a3822019-11-19 15:28:58 +0000322 {
323 return false;
324 }
325
telsoa01c577f2c2018-08-31 09:22:23 +0100326 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDepthwiseConvolutionWorkloadValidate,
327 reasonIfUnsupported,
328 input,
329 output,
330 descriptor,
331 weights,
332 biases);
telsoa014fcda012018-03-09 14:13:49 +0000333}
334
Narumol Prangnawarat01961a72019-05-30 16:47:12 +0100335bool NeonLayerSupport::IsDequantizeSupported(const TensorInfo& input,
336 const TensorInfo& output,
337 Optional<std::string&> reasonIfUnsupported) const
338{
339 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDequantizeWorkloadValidate,
340 reasonIfUnsupported,
341 input,
342 output);
343}
344
Derek Lamberti6a5e5e82019-12-05 14:41:20 +0000345bool NeonLayerSupport::IsDetectionPostProcessSupported(const TensorInfo& boxEncodings,
346 const TensorInfo& scores,
347 const TensorInfo& anchors,
348 const TensorInfo& detectionBoxes,
349 const TensorInfo& detectionClasses,
350 const TensorInfo& detectionScores,
351 const TensorInfo& numDetections,
352 const DetectionPostProcessDescriptor& descriptor,
353 Optional<std::string&> reasonIfUnsupported) const
354{
355 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDetectionPostProcessValidate,
356 reasonIfUnsupported,
357 boxEncodings,
358 scores,
359 anchors,
360 detectionBoxes,
361 detectionClasses,
362 detectionScores,
363 numDetections,
364 descriptor);
365}
366
367
Pablo Tellof0bd6832019-04-26 17:58:13 +0100368bool NeonLayerSupport::IsDilatedDepthwiseConvolutionSupported(const TensorInfo& input,
369 const TensorInfo& output,
370 const DepthwiseConvolution2dDescriptor& descriptor,
371 const TensorInfo& weights,
372 const Optional<TensorInfo>& biases,
373 Optional<std::string&> reasonIfUnsupported) const
374{
Aron Virginas-Tar710f6642019-11-27 14:48:32 +0000375 if (!IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights))
James Conroyb86a3822019-11-19 15:28:58 +0000376 {
377 return false;
378 }
379
Pablo Tellof0bd6832019-04-26 17:58:13 +0100380 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDepthwiseConvolutionWorkloadValidate,
381 reasonIfUnsupported,
382 input,
383 output,
384 descriptor,
385 weights,
386 biases);
387}
388
josh minor4a3c6102020-01-06 16:40:46 -0600389bool NeonLayerSupport::IsElementwiseUnarySupported(const TensorInfo& input,
390 const TensorInfo& output,
391 const ElementwiseUnaryDescriptor& descriptor,
392 Optional<std::string&> reasonIfUnsupported) const
393{
394 if (descriptor.m_Operation == UnaryOperation::Abs)
395 {
396 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonAbsWorkloadValidate,
397 reasonIfUnsupported,
398 input,
399 output);
400 }
401 else if (descriptor.m_Operation == UnaryOperation::Rsqrt)
402 {
403 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonRsqrtWorkloadValidate,
404 reasonIfUnsupported,
405 input,
406 output);
407 }
408
409 return false;
410}
411
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100412bool NeonLayerSupport::IsFloorSupported(const TensorInfo& input,
413 const TensorInfo& output,
414 Optional<std::string&> reasonIfUnsupported) const
415{
416 ignore_unused(output);
417 return IsNeonBackendSupported(reasonIfUnsupported) &&
418 IsSupportedForDataTypeGeneric(reasonIfUnsupported,
419 input.GetDataType(),
420 &FalseFuncF16<>,
421 &TrueFunc<>,
narpra01db2b1602019-01-23 15:23:11 +0000422 &FalseFuncU8<>,
kevmay012b4d88e2019-01-24 14:05:09 +0000423 &FalseFuncI32<>,
424 &FalseFuncU8<>);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100425}
426
427bool NeonLayerSupport::IsFullyConnectedSupported(const TensorInfo& input,
428 const TensorInfo& output,
429 const TensorInfo& weights,
430 const TensorInfo& biases,
431 const FullyConnectedDescriptor& descriptor,
432 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000433{
telsoa01c577f2c2018-08-31 09:22:23 +0100434 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonFullyConnectedWorkloadValidate,
435 reasonIfUnsupported,
436 input,
437 output,
438 weights,
439 biases,
440 descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000441}
442
kevmay01eed85922019-01-28 08:37:25 +0000443bool NeonLayerSupport::IsGreaterSupported(const armnn::TensorInfo& input0,
444 const armnn::TensorInfo& input1,
445 const armnn::TensorInfo& output,
446 armnn::Optional<std::string&> reasonIfUnsupported) const
447{
Aron Virginas-Tar77bfb5e2019-10-16 17:45:38 +0100448 ComparisonDescriptor descriptor(ComparisonOperation::Greater);
449 return IsComparisonSupported(input0, input1, output, descriptor, reasonIfUnsupported);
kevmay01eed85922019-01-28 08:37:25 +0000450}
451
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100452bool NeonLayerSupport::IsInputSupported(const TensorInfo& input,
453 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000454{
Derek Lamberti901ea112019-12-10 22:07:09 +0000455 return IsNeonBackendSupported(reasonIfUnsupported, input);
telsoa014fcda012018-03-09 14:13:49 +0000456}
457
Sadik Armagan0d4863d2019-10-09 14:26:32 +0100458bool NeonLayerSupport::IsInstanceNormalizationSupported(const TensorInfo& input,
459 const TensorInfo& output,
460 const InstanceNormalizationDescriptor& descriptor,
461 Optional<std::string&> reasonIfUnsupported) const
462{
463 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonInstanceNormalizationWorkloadValidate,
464 reasonIfUnsupported,
465 input,
466 output,
467 descriptor);
468}
469
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100470bool NeonLayerSupport::IsL2NormalizationSupported(const TensorInfo& input,
471 const TensorInfo& output,
472 const L2NormalizationDescriptor& descriptor,
473 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000474{
Matteo Martincighbcd3c852018-09-28 14:14:12 +0100475 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonL2NormalizationWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000476}
477
Jan Eilersad5293a2019-07-08 09:57:55 +0100478bool NeonLayerSupport::IsLstmSupported(const TensorInfo& input,
479 const TensorInfo& outputStateIn,
480 const TensorInfo& cellStateIn,
481 const TensorInfo& scratchBuffer,
482 const TensorInfo& outputStateOut,
483 const TensorInfo& cellStateOut,
484 const TensorInfo& output,
485 const LstmDescriptor& descriptor,
486 const LstmInputParamsInfo& paramsInfo,
487 Optional<std::string&> reasonIfUnsupported) const
488{
489 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonLstmFloatWorkloadValidate,
490 reasonIfUnsupported,
491 input,
492 outputStateIn,
493 cellStateIn,
494 scratchBuffer,
495 outputStateOut,
496 cellStateOut,
497 output,
498 descriptor,
499 paramsInfo);
500}
501
Nattapat Chaimanowong4e6597a2018-12-20 14:14:06 +0000502bool NeonLayerSupport::IsMaximumSupported(const TensorInfo& input0,
503 const TensorInfo& input1,
504 const TensorInfo& output,
505 Optional<std::string&> reasonIfUnsupported) const
506{
507 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMaximumWorkloadValidate,
508 reasonIfUnsupported,
509 input0,
510 input1,
511 output);
512}
513
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100514bool NeonLayerSupport::IsMeanSupported(const TensorInfo& input,
515 const TensorInfo& output,
516 const MeanDescriptor& descriptor,
517 Optional<std::string&> reasonIfUnsupported) const
narpra0132b90462018-09-13 11:07:48 +0100518{
Matthew Benthamfd899962018-12-31 15:49:42 +0000519 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMeanWorkloadValidate,
520 reasonIfUnsupported,
521 input,
522 output,
523 descriptor);
narpra0132b90462018-09-13 11:07:48 +0100524}
525
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100526bool NeonLayerSupport::IsMergerSupported(const std::vector<const TensorInfo*> inputs,
Nikhil Raj8599a412018-11-19 14:51:07 +0000527 const TensorInfo& output,
Jim Flynne242f2d2019-05-22 14:24:13 +0100528 const MergerDescriptor& descriptor,
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100529 Optional<std::string&> reasonIfUnsupported) const
530{
Jim Flynne242f2d2019-05-22 14:24:13 +0100531 return IsConcatSupported(inputs, output, descriptor, reasonIfUnsupported);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100532}
533
Conor Kennedy54b21692019-01-09 07:57:38 +0000534bool NeonLayerSupport::IsMinimumSupported(const TensorInfo& input0,
535 const TensorInfo& input1,
536 const TensorInfo& output,
537 Optional<std::string&> reasonIfUnsupported) const
538{
539 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMinimumWorkloadValidate,
540 reasonIfUnsupported,
541 input0,
542 input1,
543 output);
544}
545
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100546bool NeonLayerSupport::IsMultiplicationSupported(const TensorInfo& input0,
547 const TensorInfo& input1,
548 const TensorInfo& output,
549 Optional<std::string&> reasonIfUnsupported) const
550{
551 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMultiplicationWorkloadValidate,
552 reasonIfUnsupported,
553 input0,
554 input1,
555 output);
556}
557
Pablo Telloe61f0712020-01-23 10:37:17 +0000558bool NeonLayerSupport::IsDivisionSupported(const TensorInfo& input0,
559 const TensorInfo& input1,
560 const TensorInfo& output,
561 Optional<std::string&> reasonIfUnsupported) const
562{
563 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDivisionWorkloadValidate,
564 reasonIfUnsupported,
565 input0,
566 input1,
567 output);
568}
569
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100570bool NeonLayerSupport::IsNormalizationSupported(const TensorInfo& input,
571 const TensorInfo& output,
572 const NormalizationDescriptor& descriptor,
573 Optional<std::string&> reasonIfUnsupported) const
574{
575 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonNormalizationWorkloadValidate,
576 reasonIfUnsupported,
577 input,
578 output,
579 descriptor);
580}
581
582bool NeonLayerSupport::IsOutputSupported(const TensorInfo& output,
583 Optional<std::string&> reasonIfUnsupported) const
584{
Derek Lamberti901ea112019-12-10 22:07:09 +0000585 return IsNeonBackendSupported(reasonIfUnsupported, output);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100586}
587
Éanna Ó Catháin12055742019-01-25 10:01:40 +0000588bool NeonLayerSupport::IsPadSupported(const TensorInfo& input,
589 const TensorInfo& output,
590 const PadDescriptor& descriptor,
591 Optional<std::string&> reasonIfUnsupported) const
592{
593 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPadWorkloadValidate,
594 reasonIfUnsupported,
595 input,
596 output,
597 descriptor);
598}
599
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100600bool NeonLayerSupport::IsPermuteSupported(const TensorInfo& input,
601 const TensorInfo& output,
602 const PermuteDescriptor& descriptor,
603 Optional<std::string&> reasonIfUnsupported) const
604{
605 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPermuteWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000606}
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100607
608bool NeonLayerSupport::IsPooling2dSupported(const TensorInfo& input,
609 const TensorInfo& output,
610 const Pooling2dDescriptor& descriptor,
611 Optional<std::string&> reasonIfUnsupported) const
612{
613 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPooling2dWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
614}
615
Nikhil Raj9b461482019-07-03 15:58:31 +0100616bool NeonLayerSupport::IsPreluSupported(const armnn::TensorInfo &input,
617 const armnn::TensorInfo &alpha,
618 const armnn::TensorInfo &output,
619 armnn::Optional<std::string &> reasonIfUnsupported) const
620{
621 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPreluWorkloadValidate, reasonIfUnsupported, input, alpha, output);
622}
623
Sadik Armaganfabc2892019-05-31 09:05:11 +0100624bool NeonLayerSupport::IsQuantizeSupported(const TensorInfo& input,
625 const TensorInfo& output,
626 Optional<std::string&> reasonIfUnsupported) const
627{
628 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonQuantizeWorkloadValidate,
629 reasonIfUnsupported,
630 input,
631 output);
632}
633
Francis Murtagh4fc3c482019-08-02 13:20:54 +0100634bool NeonLayerSupport::IsQuantizedLstmSupported(const TensorInfo& input,
635 const TensorInfo& cellStateIn,
636 const TensorInfo& outputStateIn,
637 const TensorInfo& cellStateOut,
638 const TensorInfo& outputStateOut,
639 const QuantizedLstmInputParamsInfo& paramsInfo,
640 Optional<std::string&> reasonIfUnsupported) const
641{
642 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonQuantizedLstmWorkloadValidate,
643 reasonIfUnsupported,
644 input,
645 cellStateIn,
646 outputStateIn,
647 cellStateOut,
648 outputStateOut,
649 paramsInfo);
650}
651
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100652bool NeonLayerSupport::IsReshapeSupported(const TensorInfo& input,
Matteo Martincigh992d6dc2019-01-10 17:34:20 +0000653 const ReshapeDescriptor& descriptor,
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100654 Optional<std::string&> reasonIfUnsupported) const
655{
Matteo Martincigh992d6dc2019-01-10 17:34:20 +0000656 ignore_unused(descriptor);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100657 return IsSupportedForDataTypeNeon(reasonIfUnsupported,
658 input.GetDataType(),
659 &TrueFunc<>,
660 &TrueFunc<>);
661}
662
Aron Virginas-Tar169d2f12019-07-01 19:01:44 +0100663bool NeonLayerSupport::IsResizeSupported(const TensorInfo& input,
664 const TensorInfo& output,
665 const ResizeDescriptor& descriptor,
666 Optional<std::string&> reasonIfUnsupported) const
667{
Ellen Norris-Thompson37e68682019-07-15 14:23:30 +0100668 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonResizeWorkloadValidate,
669 reasonIfUnsupported,
670 input,
671 output,
672 descriptor);
Aron Virginas-Tar169d2f12019-07-01 19:01:44 +0100673}
674
Sadik Armaganc625f002018-12-17 11:32:16 +0000675bool NeonLayerSupport::IsResizeBilinearSupported(const TensorInfo& input,
676 const TensorInfo& output,
677 Optional<std::string&> reasonIfUnsupported) const
678{
Ellen Norris-Thompson37e68682019-07-15 14:23:30 +0100679 ResizeDescriptor descriptor;
680 descriptor.m_Method = ResizeMethod::Bilinear;
681 descriptor.m_DataLayout = DataLayout::NCHW;
682
683 const TensorShape& outputShape = output.GetShape();
684 descriptor.m_TargetHeight = outputShape[2];
685 descriptor.m_TargetWidth = outputShape[3];
686
687 return IsResizeSupported(input, output, descriptor, reasonIfUnsupported);
Sadik Armaganc625f002018-12-17 11:32:16 +0000688}
689
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +0100690bool NeonLayerSupport::IsRsqrtSupported(const TensorInfo& input,
691 const TensorInfo& output,
692 Optional<std::string&> reasonIfUnsupported) const
693{
josh minor4a3c6102020-01-06 16:40:46 -0600694 ElementwiseUnaryDescriptor descriptor(UnaryOperation::Rsqrt);
695 return IsElementwiseUnarySupported(input, output, descriptor, reasonIfUnsupported);
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +0100696}
697
josh minor036f02d2019-11-15 14:53:22 -0600698bool NeonLayerSupport::IsSliceSupported(const TensorInfo& input,
699 const TensorInfo& output,
700 const SliceDescriptor& descriptor,
701 Optional<std::string&> reasonIfUnsupported) const
702{
703 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSliceWorkloadValidate,
704 reasonIfUnsupported,
705 input,
706 output,
707 descriptor);
708}
709
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100710bool NeonLayerSupport::IsSoftmaxSupported(const TensorInfo& input,
711 const TensorInfo& output,
712 const SoftmaxDescriptor& descriptor,
713 Optional<std::string&> reasonIfUnsupported) const
714{
715 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSoftmaxWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
716}
717
Mike Kelly0be3a882020-01-24 11:27:50 +0000718bool NeonLayerSupport::IsSpaceToBatchNdSupported(const TensorInfo& input,
719 const TensorInfo& output,
720 const SpaceToBatchNdDescriptor& descriptor,
721 Optional<std::string&> reasonIfUnsupported) const
722{
723 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSpaceToBatchNdWorkloadValidate,
724 reasonIfUnsupported,
725 input,
726 output,
727 descriptor);
728}
729
Ellen Norris-Thompson29794572019-06-26 16:40:36 +0100730bool NeonLayerSupport::IsSpaceToDepthSupported(const TensorInfo& input,
Mike Kelly0be3a882020-01-24 11:27:50 +0000731 const TensorInfo& output,
732 const SpaceToDepthDescriptor& descriptor,
733 Optional<std::string&> reasonIfUnsupported) const
Ellen Norris-Thompson29794572019-06-26 16:40:36 +0100734{
735 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSpaceToDepthWorkloadValidate,
736 reasonIfUnsupported,
737 input,
738 output,
739 descriptor);
740}
741
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100742bool NeonLayerSupport::IsSplitterSupported(const TensorInfo& input,
743 const ViewsDescriptor& descriptor,
744 Optional<std::string&> reasonIfUnsupported) const
745{
746 ignore_unused(descriptor);
747 return IsSupportedForDataTypeNeon(reasonIfUnsupported,
748 input.GetDataType(),
749 &TrueFunc<>,
750 &TrueFunc<>);
751}
752
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +0100753bool NeonLayerSupport::IsSplitterSupported(const TensorInfo& input,
754 const std::vector<std::reference_wrapper<TensorInfo>>& outputs,
755 const ViewsDescriptor& descriptor,
756 Optional<std::string&> reasonIfUnsupported) const
757{
758#if defined(ARMCOMPUTENEON_ENABLED)
759 // Split along the last dimension, cannot use sub-tensors
760 // as width and height of the sub-tensors do not match
761 // the width and height of the parent tensor
762 // in case of input with more than 2D.
763 std::set<unsigned int> splitAxis = ComputeSplitAxis(descriptor, input.GetShape());
764 if (descriptor.GetNumDimensions() > 2 && splitAxis.size() == 1 &&
765 *splitAxis.begin() == descriptor.GetNumDimensions() - 1 )
766 {
767 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSplitterWorkloadValidate,
768 reasonIfUnsupported,
769 input,
770 outputs,
771 *splitAxis.begin());
772 }
773#endif
Derek Lamberti901ea112019-12-10 22:07:09 +0000774 boost::ignore_unused(descriptor);
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +0100775 for (auto output : outputs)
776 {
777 if (!input.IsTypeSpaceMatch(output)) // Cannot use sub-tensors if the types are not same space
778 {
779 SetValueChecked(reasonIfUnsupported, "Neon Splitter: Types and quantization parameters must match.");
780 return false;
781 }
782 }
783 return true;
784}
785
Matthew Jackson87f65ea2019-08-01 10:01:34 +0100786bool NeonLayerSupport::IsStackSupported(const std::vector<const TensorInfo*>& inputs,
787 const TensorInfo& output,
788 const StackDescriptor& descriptor,
789 Optional<std::string&> reasonIfUnsupported) const
790{
791 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonStackWorkloadValidate,
792 reasonIfUnsupported,
793 inputs,
794 output,
795 descriptor);
796}
797
FinnWilliamsArm1fa19192019-08-02 17:26:31 +0100798bool NeonLayerSupport::IsStridedSliceSupported(const TensorInfo& input,
799 const TensorInfo& output,
800 const StridedSliceDescriptor& descriptor,
801 Optional<std::string&> reasonIfUnsupported) const
802{
803 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonStridedSliceWorkloadValidate,
804 reasonIfUnsupported,
805 input,
806 output,
807 descriptor);
808}
809
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100810bool NeonLayerSupport::IsSubtractionSupported(const TensorInfo& input0,
811 const TensorInfo& input1,
812 const TensorInfo& output,
813 Optional<std::string&> reasonIfUnsupported) const
814{
815 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSubtractionWorkloadValidate,
816 reasonIfUnsupported,
817 input0,
818 input1,
819 output);
820}
821
Sadik Armagan581742d2019-08-12 14:11:37 +0100822bool NeonLayerSupport::IsTransposeConvolution2dSupported(const TensorInfo& input,
823 const TensorInfo& output,
824 const TransposeConvolution2dDescriptor& descriptor,
825 const TensorInfo& weights,
826 const Optional<TensorInfo>& biases,
827 Optional<std::string&> reasonIfUnsupported) const
828{
Aron Virginas-Tar710f6642019-11-27 14:48:32 +0000829 if (!IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights))
James Conroyb86a3822019-11-19 15:28:58 +0000830 {
831 return false;
832 }
833
Sadik Armagan581742d2019-08-12 14:11:37 +0100834 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonTransposeConvolution2dWorkloadValidate,
835 reasonIfUnsupported,
836 input,
837 output,
838 descriptor,
839 weights,
840 biases);
841}
842
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100843} // namespace armnn