blob: 47bcc2e79513ed576c68c194749aa0e660cdcf7e [file] [log] [blame]
telsoa014fcda012018-03-09 14:13:49 +00001//
2// Copyright © 2017 Arm Ltd. All rights reserved.
David Beckecb56cd2018-09-05 12:52:57 +01003// SPDX-License-Identifier: MIT
telsoa014fcda012018-03-09 14:13:49 +00004//
5
6#include "NeonLayerSupport.hpp"
David Beck3e9e1152018-10-17 14:17:50 +01007#include "NeonBackendId.hpp"
telsoa014fcda012018-03-09 14:13:49 +00008
telsoa014fcda012018-03-09 14:13:49 +00009#include <armnn/Descriptors.hpp>
telsoa014fcda012018-03-09 14:13:49 +000010#include <armnn/Tensor.hpp>
Aron Virginas-Tarfc824312018-10-15 15:00:13 +010011#include <armnn/Types.hpp>
Matteo Martincighc601aa62019-10-29 15:03:22 +000012#include <armnn/BackendRegistry.hpp>
telsoa014fcda012018-03-09 14:13:49 +000013
Matteo Martincighc601aa62019-10-29 15:03:22 +000014#include <InternalTypes.hpp>
15#include <LayerSupportCommon.hpp>
David Beck3e9e1152018-10-17 14:17:50 +010016
telsoa014fcda012018-03-09 14:13:49 +000017#include <boost/core/ignore_unused.hpp>
18
Matteo Martincighd95e9062019-01-31 15:35:59 +000019#if defined(ARMCOMPUTENEON_ENABLED)
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +010020#include <aclCommon/ArmComputeUtils.hpp>
Aron Virginas-Tar710f6642019-11-27 14:48:32 +000021#include <aclCommon/ArmComputeTensorUtils.hpp>
Aron Virginas-Tar914e4db2019-09-09 13:36:45 +010022#include "workloads/NeonAbsWorkload.hpp"
Matthew Bentham955258d2018-12-10 10:48:52 +000023#include "workloads/NeonAdditionWorkload.hpp"
Nattapat Chaimanowongd4b70592018-10-12 11:21:49 +010024#include "workloads/NeonActivationWorkload.hpp"
James Conroyd47a0642019-09-17 14:22:06 +010025#include "workloads/NeonArgMinMaxWorkload.hpp"
Matthew Benthamc48ac8c2018-12-12 16:15:59 +000026#include "workloads/NeonBatchNormalizationWorkload.hpp"
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +010027#include "workloads/NeonConvolution2dWorkload.hpp"
Aron Virginas-Tar2f00b742019-09-30 13:28:08 +010028#include "workloads/NeonDepthToSpaceWorkload.hpp"
Nattapat Chaimanowong77140882018-10-17 11:12:19 +010029#include "workloads/NeonDepthwiseConvolutionWorkload.hpp"
Narumol Prangnawarat01961a72019-05-30 16:47:12 +010030#include "workloads/NeonDequantizeWorkload.hpp"
Derek Lamberti6a5e5e82019-12-05 14:41:20 +000031#include "workloads/NeonDetectionPostProcessWorkload.hpp"
kevmay01eed85922019-01-28 08:37:25 +000032#include "workloads/NeonGreaterWorkload.hpp"
Sadik Armagan0d4863d2019-10-09 14:26:32 +010033#include "workloads/NeonInstanceNormalizationWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010034#include "workloads/NeonL2NormalizationFloatWorkload.hpp"
Jan Eilersad5293a2019-07-08 09:57:55 +010035#include "workloads/NeonLstmFloatWorkload.hpp"
Nattapat Chaimanowong4e6597a2018-12-20 14:14:06 +000036#include "workloads/NeonMaximumWorkload.hpp"
Matthew Benthamfd899962018-12-31 15:49:42 +000037#include "workloads/NeonMeanWorkload.hpp"
Jim Flynn39d487d2019-05-17 15:44:36 +010038#include "workloads/NeonConcatWorkload.hpp"
Conor Kennedy54b21692019-01-09 07:57:38 +000039#include "workloads/NeonMinimumWorkload.hpp"
Conor Kennedyb99480b2019-03-08 08:24:41 +000040#include "workloads/NeonMultiplicationWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010041#include "workloads/NeonNormalizationFloatWorkload.hpp"
42#include "workloads/NeonFullyConnectedWorkload.hpp"
Éanna Ó Catháin12055742019-01-25 10:01:40 +000043#include "workloads/NeonPadWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010044#include "workloads/NeonPermuteWorkload.hpp"
Nattapat Chaimanowong5d2e7002018-10-12 16:03:56 +010045#include "workloads/NeonPooling2dWorkload.hpp"
Nikhil Raj9b461482019-07-03 15:58:31 +010046#include "workloads/NeonPreluWorkload.hpp"
Sadik Armaganfabc2892019-05-31 09:05:11 +010047#include "workloads/NeonQuantizeWorkload.hpp"
Francis Murtagh4fc3c482019-08-02 13:20:54 +010048#include "workloads/NeonQuantizedLstmWorkload.hpp"
Ellen Norris-Thompson37e68682019-07-15 14:23:30 +010049#include "workloads/NeonResizeWorkload.hpp"
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +010050#include "workloads/NeonRsqrtWorkload.hpp"
josh minor036f02d2019-11-15 14:53:22 -060051#include "workloads/NeonSliceWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010052#include "workloads/NeonSoftmaxBaseWorkload.hpp"
Mike Kelly0be3a882020-01-24 11:27:50 +000053#include "workloads/NeonSpaceToBatchNdWorkload.hpp"
Ellen Norris-Thompson29794572019-06-26 16:40:36 +010054#include "workloads/NeonSpaceToDepthWorkload.hpp"
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +010055#include "workloads/NeonSplitterWorkload.hpp"
Matthew Jackson87f65ea2019-08-01 10:01:34 +010056#include "workloads/NeonStackWorkload.hpp"
FinnWilliamsArm1fa19192019-08-02 17:26:31 +010057#include "workloads/NeonStridedSliceWorkload.hpp"
Conor Kennedyb99480b2019-03-08 08:24:41 +000058#include "workloads/NeonSubtractionWorkload.hpp"
Sadik Armagan581742d2019-08-12 14:11:37 +010059#include "workloads/NeonTransposeConvolution2dWorkload.hpp"
telsoa014fcda012018-03-09 14:13:49 +000060#endif
61
62using namespace boost;
63
64namespace armnn
65{
telsoa014fcda012018-03-09 14:13:49 +000066
Aron Virginas-Tarfc824312018-10-15 15:00:13 +010067namespace
arovir017ff76c52018-10-09 09:40:58 +010068{
telsoa014fcda012018-03-09 14:13:49 +000069
Derek Lamberti901ea112019-12-10 22:07:09 +000070template< typename ... Args>
71bool IsNeonBackendSupported(Optional<std::string&> reasonIfUnsupported, Args... args)
telsoa014fcda012018-03-09 14:13:49 +000072{
Derek Lambertibaa177f2019-12-10 22:00:43 +000073 boost::ignore_unused(reasonIfUnsupported, (args)...);
Matteo Martincighd95e9062019-01-31 15:35:59 +000074#if defined(ARMCOMPUTENEON_ENABLED)
telsoa014fcda012018-03-09 14:13:49 +000075 return true;
76#else
Derek Lamberti0790dce2019-04-15 18:37:35 +010077 SetValueChecked(reasonIfUnsupported, "The armnn library has been built without NEON support");
telsoa014fcda012018-03-09 14:13:49 +000078 return false;
79#endif
80}
81
telsoa01c577f2c2018-08-31 09:22:23 +010082template<typename FloatFunc, typename Uint8Func, typename ... Params>
arovir01085f0a42018-10-08 14:48:19 +010083bool IsSupportedForDataTypeNeon(Optional<std::string&> reasonIfUnsupported,
telsoa014fcda012018-03-09 14:13:49 +000084 DataType dataType,
telsoa01c577f2c2018-08-31 09:22:23 +010085 FloatFunc floatFuncPtr,
telsoa014fcda012018-03-09 14:13:49 +000086 Uint8Func uint8FuncPtr,
87 Params&&... params)
88{
89 return IsNeonBackendSupported(reasonIfUnsupported) &&
90 IsSupportedForDataTypeGeneric(reasonIfUnsupported,
91 dataType,
92 floatFuncPtr,
telsoa01c577f2c2018-08-31 09:22:23 +010093 floatFuncPtr,
telsoa014fcda012018-03-09 14:13:49 +000094 uint8FuncPtr,
narpra01db2b1602019-01-23 15:23:11 +000095 &FalseFunc<>,
kevmay012b4d88e2019-01-24 14:05:09 +000096 &FalseFunc<>,
telsoa014fcda012018-03-09 14:13:49 +000097 std::forward<Params>(params)...);
98}
99
#if defined(ARMCOMPUTENEON_ENABLED)
// Calls an Arm Compute Library validate function with the forwarded arguments and turns
// the returned status into a bool. On failure the status' error description is written
// to reasonIfUnsupported, provided the caller supplied one.
template<class FuncType, class... Args>
inline bool IsWorkloadSupported(FuncType& func, Optional<std::string&> reasonIfUnsupported, Args&&... args)
{
    arm_compute::Status validationStatus = func(std::forward<Args>(args)...);
    if (validationStatus.error_code() == arm_compute::ErrorCode::OK)
    {
        return true;
    }

    if (reasonIfUnsupported)
    {
        reasonIfUnsupported.value() = validationStatus.error_description();
    }
    return false;
}

// NEON build: return the result of the given workload validate function.
// Note that the expansion is a complete return statement.
#define FORWARD_WORKLOAD_VALIDATE_FUNC(func, reasonIfUnsupported, ...) \
    return IsWorkloadSupported(func, reasonIfUnsupported, __VA_ARGS__);
#else
// Non-NEON build: the validate function is not referenced at all; the expansion simply
// returns the result of the backend availability check.
#define FORWARD_WORKLOAD_VALIDATE_FUNC(func, reasonIfUnsupported, ...) \
    return IsNeonBackendSupported(reasonIfUnsupported, __VA_ARGS__);
#endif
119
// Quantization multiplier check used by the convolution-style layers.
// NEON build: delegates to armcomputetensorutils::IsQuantMultiplierSupported.
// Non-NEON build: always evaluates to true, so the check never rejects a layer.
#if defined(ARMCOMPUTENEON_ENABLED)
#define IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights) \
    armcomputetensorutils::IsQuantMultiplierSupported(input, output, weights)
#else
#define IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights) true
#endif
126
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100127} // anonymous namespace
128
Aron Virginas-Tar914e4db2019-09-09 13:36:45 +0100129bool NeonLayerSupport::IsAbsSupported(const TensorInfo& input,
130 const TensorInfo& output,
131 Optional<std::string&> reasonIfUnsupported) const
132{
josh minor4a3c6102020-01-06 16:40:46 -0600133 ElementwiseUnaryDescriptor descriptor(UnaryOperation::Abs);
134 return IsElementwiseUnarySupported(input, output, descriptor, reasonIfUnsupported);
Aron Virginas-Tar914e4db2019-09-09 13:36:45 +0100135}
136
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100137bool NeonLayerSupport::IsActivationSupported(const TensorInfo& input,
138 const TensorInfo& output,
139 const ActivationDescriptor& descriptor,
140 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000141{
142 ignore_unused(descriptor);
telsoa01c577f2c2018-08-31 09:22:23 +0100143 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonActivationWorkloadValidate,
144 reasonIfUnsupported,
145 input,
146 output,
147 descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000148}
149
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100150bool NeonLayerSupport::IsAdditionSupported(const TensorInfo& input0,
151 const TensorInfo& input1,
152 const TensorInfo& output,
153 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000154{
telsoa01c577f2c2018-08-31 09:22:23 +0100155 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonAdditionWorkloadValidate,
156 reasonIfUnsupported,
157 input0,
158 input1,
159 output);
telsoa014fcda012018-03-09 14:13:49 +0000160}
161
James Conroyd47a0642019-09-17 14:22:06 +0100162bool NeonLayerSupport::IsArgMinMaxSupported(const TensorInfo& input,
163 const TensorInfo& output,
164 const ArgMinMaxDescriptor& descriptor,
165 Optional<std::string&> reasonIfUnsupported) const
166{
167 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonArgMinMaxWorkloadValidate,
168 reasonIfUnsupported,
169 input,
170 output,
171 descriptor);
172}
173
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100174bool NeonLayerSupport::IsBatchNormalizationSupported(const TensorInfo& input,
175 const TensorInfo& output,
176 const TensorInfo& mean,
177 const TensorInfo& var,
178 const TensorInfo& beta,
179 const TensorInfo& gamma,
180 const BatchNormalizationDescriptor& descriptor,
181 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000182{
telsoa01c577f2c2018-08-31 09:22:23 +0100183 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonBatchNormalizationValidate,
184 reasonIfUnsupported,
185 input,
186 output,
187 mean,
188 var,
189 beta,
190 gamma,
191 descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000192}
193
Aron Virginas-Tar77bfb5e2019-10-16 17:45:38 +0100194bool NeonLayerSupport::IsComparisonSupported(const TensorInfo& input0,
195 const TensorInfo& input1,
196 const TensorInfo& output,
197 const ComparisonDescriptor& descriptor,
198 Optional<std::string&> reasonIfUnsupported) const
199{
200 if (descriptor.m_Operation == ComparisonOperation::Greater)
201 {
202 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonGreaterWorkloadValidate,
203 reasonIfUnsupported,
204 input0,
205 input1,
206 output);
207 }
208
209 return false;
210}
211
Jim Flynn906f9462019-05-10 13:55:21 +0100212bool NeonLayerSupport::IsConcatSupported(const std::vector<const TensorInfo*> inputs,
213 const TensorInfo& output,
Jim Flynne242f2d2019-05-22 14:24:13 +0100214 const ConcatDescriptor& descriptor,
Jim Flynn906f9462019-05-10 13:55:21 +0100215 Optional<std::string&> reasonIfUnsupported) const
216{
Jim Flynne242f2d2019-05-22 14:24:13 +0100217 if (descriptor.GetNumDimensions() <= descriptor.GetConcatAxis())
218 {
219 SetValueChecked(reasonIfUnsupported, "Neon Concat: Concat axis > Number of dimensions.");
220 return false;
221 }
222
223 unsigned int concatInnerAxis = (descriptor.GetNumDimensions() - descriptor.GetConcatAxis()) - 1;
224 if(concatInnerAxis < 3) // Width, height, or channels
225 {
226 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonConcatWorkloadValidate,
227 reasonIfUnsupported,
228 inputs,
229 output,
230 descriptor);
231 }
232 else if (concatInnerAxis == 3)
233 {
234 for (auto& input : inputs)
235 {
236 if (input && !output.IsTypeSpaceMatch(*input)) // Cannot use sub-tensors if the types are not same space
237 {
238 SetValueChecked(reasonIfUnsupported, "Neon Concat: Types and quantization parameters must match.");
239 return false;
240 }
241 }
242 return true; // Sub-tensors support concat along batch
243 }
244 else // > 4 dimensions not supported.
245 {
246 SetValueChecked(reasonIfUnsupported, "Neon Concat: Maximum of 4 dimensions supported.");
247 return false;
248 }
Jim Flynn906f9462019-05-10 13:55:21 +0100249}
250
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100251bool NeonLayerSupport::IsConstantSupported(const TensorInfo& output,
252 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000253{
254 return IsSupportedForDataTypeNeon(reasonIfUnsupported,
255 output.GetDataType(),
256 &TrueFunc<>,
257 &TrueFunc<>);
258}
259
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100260bool NeonLayerSupport::IsConvertFp16ToFp32Supported(const TensorInfo& input,
261 const TensorInfo& output,
262 Optional<std::string&> reasonIfUnsupported) const
263{
264 ignore_unused(input);
265 ignore_unused(output);
266 ignore_unused(reasonIfUnsupported);
267 return true;
268}
269
270bool NeonLayerSupport::IsConvertFp32ToFp16Supported(const TensorInfo& input,
271 const TensorInfo& output,
272 Optional<std::string&> reasonIfUnsupported) const
273{
274 ignore_unused(input);
275 ignore_unused(output);
276 ignore_unused(reasonIfUnsupported);
277 return true;
278}
279
280bool NeonLayerSupport::IsConvolution2dSupported(const TensorInfo& input,
281 const TensorInfo& output,
282 const Convolution2dDescriptor& descriptor,
283 const TensorInfo& weights,
284 const Optional<TensorInfo>& biases,
285 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000286{
Aron Virginas-Tar710f6642019-11-27 14:48:32 +0000287 if (!IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights))
James Conroyb86a3822019-11-19 15:28:58 +0000288 {
289 return false;
290 }
291
surmeh013537c2c2018-05-18 16:31:43 +0100292 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonConvolution2dWorkloadValidate,
293 reasonIfUnsupported,
294 input,
295 output,
296 descriptor,
297 weights,
298 biases);
telsoa014fcda012018-03-09 14:13:49 +0000299}
300
Aron Virginas-Tar2f00b742019-09-30 13:28:08 +0100301bool NeonLayerSupport::IsDepthToSpaceSupported(const TensorInfo& input,
302 const TensorInfo& output,
303 const DepthToSpaceDescriptor& descriptor,
304 Optional<std::string&> reasonIfUnsupported) const
305{
306 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDepthToSpaceWorkloadValidate,
307 reasonIfUnsupported,
308 input,
309 output,
310 descriptor);
311}
312
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100313bool NeonLayerSupport::IsDepthwiseConvolutionSupported(const TensorInfo& input,
314 const TensorInfo& output,
315 const DepthwiseConvolution2dDescriptor& descriptor,
316 const TensorInfo& weights,
317 const Optional<TensorInfo>& biases,
318 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000319{
Aron Virginas-Tar710f6642019-11-27 14:48:32 +0000320 if (!IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights))
James Conroyb86a3822019-11-19 15:28:58 +0000321 {
322 return false;
323 }
324
telsoa01c577f2c2018-08-31 09:22:23 +0100325 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDepthwiseConvolutionWorkloadValidate,
326 reasonIfUnsupported,
327 input,
328 output,
329 descriptor,
330 weights,
331 biases);
telsoa014fcda012018-03-09 14:13:49 +0000332}
333
Narumol Prangnawarat01961a72019-05-30 16:47:12 +0100334bool NeonLayerSupport::IsDequantizeSupported(const TensorInfo& input,
335 const TensorInfo& output,
336 Optional<std::string&> reasonIfUnsupported) const
337{
338 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDequantizeWorkloadValidate,
339 reasonIfUnsupported,
340 input,
341 output);
342}
343
Derek Lamberti6a5e5e82019-12-05 14:41:20 +0000344bool NeonLayerSupport::IsDetectionPostProcessSupported(const TensorInfo& boxEncodings,
345 const TensorInfo& scores,
346 const TensorInfo& anchors,
347 const TensorInfo& detectionBoxes,
348 const TensorInfo& detectionClasses,
349 const TensorInfo& detectionScores,
350 const TensorInfo& numDetections,
351 const DetectionPostProcessDescriptor& descriptor,
352 Optional<std::string&> reasonIfUnsupported) const
353{
354 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDetectionPostProcessValidate,
355 reasonIfUnsupported,
356 boxEncodings,
357 scores,
358 anchors,
359 detectionBoxes,
360 detectionClasses,
361 detectionScores,
362 numDetections,
363 descriptor);
364}
365
366
Pablo Tellof0bd6832019-04-26 17:58:13 +0100367bool NeonLayerSupport::IsDilatedDepthwiseConvolutionSupported(const TensorInfo& input,
368 const TensorInfo& output,
369 const DepthwiseConvolution2dDescriptor& descriptor,
370 const TensorInfo& weights,
371 const Optional<TensorInfo>& biases,
372 Optional<std::string&> reasonIfUnsupported) const
373{
Aron Virginas-Tar710f6642019-11-27 14:48:32 +0000374 if (!IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights))
James Conroyb86a3822019-11-19 15:28:58 +0000375 {
376 return false;
377 }
378
Pablo Tellof0bd6832019-04-26 17:58:13 +0100379 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDepthwiseConvolutionWorkloadValidate,
380 reasonIfUnsupported,
381 input,
382 output,
383 descriptor,
384 weights,
385 biases);
386}
387
josh minor4a3c6102020-01-06 16:40:46 -0600388bool NeonLayerSupport::IsElementwiseUnarySupported(const TensorInfo& input,
389 const TensorInfo& output,
390 const ElementwiseUnaryDescriptor& descriptor,
391 Optional<std::string&> reasonIfUnsupported) const
392{
393 if (descriptor.m_Operation == UnaryOperation::Abs)
394 {
395 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonAbsWorkloadValidate,
396 reasonIfUnsupported,
397 input,
398 output);
399 }
400 else if (descriptor.m_Operation == UnaryOperation::Rsqrt)
401 {
402 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonRsqrtWorkloadValidate,
403 reasonIfUnsupported,
404 input,
405 output);
406 }
407
408 return false;
409}
410
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100411bool NeonLayerSupport::IsFloorSupported(const TensorInfo& input,
412 const TensorInfo& output,
413 Optional<std::string&> reasonIfUnsupported) const
414{
415 ignore_unused(output);
416 return IsNeonBackendSupported(reasonIfUnsupported) &&
417 IsSupportedForDataTypeGeneric(reasonIfUnsupported,
418 input.GetDataType(),
419 &FalseFuncF16<>,
420 &TrueFunc<>,
narpra01db2b1602019-01-23 15:23:11 +0000421 &FalseFuncU8<>,
kevmay012b4d88e2019-01-24 14:05:09 +0000422 &FalseFuncI32<>,
423 &FalseFuncU8<>);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100424}
425
426bool NeonLayerSupport::IsFullyConnectedSupported(const TensorInfo& input,
427 const TensorInfo& output,
428 const TensorInfo& weights,
429 const TensorInfo& biases,
430 const FullyConnectedDescriptor& descriptor,
431 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000432{
telsoa01c577f2c2018-08-31 09:22:23 +0100433 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonFullyConnectedWorkloadValidate,
434 reasonIfUnsupported,
435 input,
436 output,
437 weights,
438 biases,
439 descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000440}
441
kevmay01eed85922019-01-28 08:37:25 +0000442bool NeonLayerSupport::IsGreaterSupported(const armnn::TensorInfo& input0,
443 const armnn::TensorInfo& input1,
444 const armnn::TensorInfo& output,
445 armnn::Optional<std::string&> reasonIfUnsupported) const
446{
Aron Virginas-Tar77bfb5e2019-10-16 17:45:38 +0100447 ComparisonDescriptor descriptor(ComparisonOperation::Greater);
448 return IsComparisonSupported(input0, input1, output, descriptor, reasonIfUnsupported);
kevmay01eed85922019-01-28 08:37:25 +0000449}
450
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100451bool NeonLayerSupport::IsInputSupported(const TensorInfo& input,
452 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000453{
Derek Lamberti901ea112019-12-10 22:07:09 +0000454 return IsNeonBackendSupported(reasonIfUnsupported, input);
telsoa014fcda012018-03-09 14:13:49 +0000455}
456
Sadik Armagan0d4863d2019-10-09 14:26:32 +0100457bool NeonLayerSupport::IsInstanceNormalizationSupported(const TensorInfo& input,
458 const TensorInfo& output,
459 const InstanceNormalizationDescriptor& descriptor,
460 Optional<std::string&> reasonIfUnsupported) const
461{
462 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonInstanceNormalizationWorkloadValidate,
463 reasonIfUnsupported,
464 input,
465 output,
466 descriptor);
467}
468
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100469bool NeonLayerSupport::IsL2NormalizationSupported(const TensorInfo& input,
470 const TensorInfo& output,
471 const L2NormalizationDescriptor& descriptor,
472 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000473{
Matteo Martincighbcd3c852018-09-28 14:14:12 +0100474 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonL2NormalizationWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000475}
476
Jan Eilersad5293a2019-07-08 09:57:55 +0100477bool NeonLayerSupport::IsLstmSupported(const TensorInfo& input,
478 const TensorInfo& outputStateIn,
479 const TensorInfo& cellStateIn,
480 const TensorInfo& scratchBuffer,
481 const TensorInfo& outputStateOut,
482 const TensorInfo& cellStateOut,
483 const TensorInfo& output,
484 const LstmDescriptor& descriptor,
485 const LstmInputParamsInfo& paramsInfo,
486 Optional<std::string&> reasonIfUnsupported) const
487{
488 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonLstmFloatWorkloadValidate,
489 reasonIfUnsupported,
490 input,
491 outputStateIn,
492 cellStateIn,
493 scratchBuffer,
494 outputStateOut,
495 cellStateOut,
496 output,
497 descriptor,
498 paramsInfo);
499}
500
Nattapat Chaimanowong4e6597a2018-12-20 14:14:06 +0000501bool NeonLayerSupport::IsMaximumSupported(const TensorInfo& input0,
502 const TensorInfo& input1,
503 const TensorInfo& output,
504 Optional<std::string&> reasonIfUnsupported) const
505{
506 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMaximumWorkloadValidate,
507 reasonIfUnsupported,
508 input0,
509 input1,
510 output);
511}
512
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100513bool NeonLayerSupport::IsMeanSupported(const TensorInfo& input,
514 const TensorInfo& output,
515 const MeanDescriptor& descriptor,
516 Optional<std::string&> reasonIfUnsupported) const
narpra0132b90462018-09-13 11:07:48 +0100517{
Matthew Benthamfd899962018-12-31 15:49:42 +0000518 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMeanWorkloadValidate,
519 reasonIfUnsupported,
520 input,
521 output,
522 descriptor);
narpra0132b90462018-09-13 11:07:48 +0100523}
524
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100525bool NeonLayerSupport::IsMergerSupported(const std::vector<const TensorInfo*> inputs,
Nikhil Raj8599a412018-11-19 14:51:07 +0000526 const TensorInfo& output,
Jim Flynne242f2d2019-05-22 14:24:13 +0100527 const MergerDescriptor& descriptor,
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100528 Optional<std::string&> reasonIfUnsupported) const
529{
Jim Flynne242f2d2019-05-22 14:24:13 +0100530 return IsConcatSupported(inputs, output, descriptor, reasonIfUnsupported);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100531}
532
Conor Kennedy54b21692019-01-09 07:57:38 +0000533bool NeonLayerSupport::IsMinimumSupported(const TensorInfo& input0,
534 const TensorInfo& input1,
535 const TensorInfo& output,
536 Optional<std::string&> reasonIfUnsupported) const
537{
538 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMinimumWorkloadValidate,
539 reasonIfUnsupported,
540 input0,
541 input1,
542 output);
543}
544
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100545bool NeonLayerSupport::IsMultiplicationSupported(const TensorInfo& input0,
546 const TensorInfo& input1,
547 const TensorInfo& output,
548 Optional<std::string&> reasonIfUnsupported) const
549{
550 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMultiplicationWorkloadValidate,
551 reasonIfUnsupported,
552 input0,
553 input1,
554 output);
555}
556
557bool NeonLayerSupport::IsNormalizationSupported(const TensorInfo& input,
558 const TensorInfo& output,
559 const NormalizationDescriptor& descriptor,
560 Optional<std::string&> reasonIfUnsupported) const
561{
562 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonNormalizationWorkloadValidate,
563 reasonIfUnsupported,
564 input,
565 output,
566 descriptor);
567}
568
569bool NeonLayerSupport::IsOutputSupported(const TensorInfo& output,
570 Optional<std::string&> reasonIfUnsupported) const
571{
Derek Lamberti901ea112019-12-10 22:07:09 +0000572 return IsNeonBackendSupported(reasonIfUnsupported, output);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100573}
574
Éanna Ó Catháin12055742019-01-25 10:01:40 +0000575bool NeonLayerSupport::IsPadSupported(const TensorInfo& input,
576 const TensorInfo& output,
577 const PadDescriptor& descriptor,
578 Optional<std::string&> reasonIfUnsupported) const
579{
580 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPadWorkloadValidate,
581 reasonIfUnsupported,
582 input,
583 output,
584 descriptor);
585}
586
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100587bool NeonLayerSupport::IsPermuteSupported(const TensorInfo& input,
588 const TensorInfo& output,
589 const PermuteDescriptor& descriptor,
590 Optional<std::string&> reasonIfUnsupported) const
591{
592 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPermuteWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000593}
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100594
595bool NeonLayerSupport::IsPooling2dSupported(const TensorInfo& input,
596 const TensorInfo& output,
597 const Pooling2dDescriptor& descriptor,
598 Optional<std::string&> reasonIfUnsupported) const
599{
600 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPooling2dWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
601}
602
Nikhil Raj9b461482019-07-03 15:58:31 +0100603bool NeonLayerSupport::IsPreluSupported(const armnn::TensorInfo &input,
604 const armnn::TensorInfo &alpha,
605 const armnn::TensorInfo &output,
606 armnn::Optional<std::string &> reasonIfUnsupported) const
607{
608 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPreluWorkloadValidate, reasonIfUnsupported, input, alpha, output);
609}
610
Sadik Armaganfabc2892019-05-31 09:05:11 +0100611bool NeonLayerSupport::IsQuantizeSupported(const TensorInfo& input,
612 const TensorInfo& output,
613 Optional<std::string&> reasonIfUnsupported) const
614{
615 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonQuantizeWorkloadValidate,
616 reasonIfUnsupported,
617 input,
618 output);
619}
620
Francis Murtagh4fc3c482019-08-02 13:20:54 +0100621bool NeonLayerSupport::IsQuantizedLstmSupported(const TensorInfo& input,
622 const TensorInfo& cellStateIn,
623 const TensorInfo& outputStateIn,
624 const TensorInfo& cellStateOut,
625 const TensorInfo& outputStateOut,
626 const QuantizedLstmInputParamsInfo& paramsInfo,
627 Optional<std::string&> reasonIfUnsupported) const
628{
629 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonQuantizedLstmWorkloadValidate,
630 reasonIfUnsupported,
631 input,
632 cellStateIn,
633 outputStateIn,
634 cellStateOut,
635 outputStateOut,
636 paramsInfo);
637}
638
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100639bool NeonLayerSupport::IsReshapeSupported(const TensorInfo& input,
Matteo Martincigh992d6dc2019-01-10 17:34:20 +0000640 const ReshapeDescriptor& descriptor,
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100641 Optional<std::string&> reasonIfUnsupported) const
642{
Matteo Martincigh992d6dc2019-01-10 17:34:20 +0000643 ignore_unused(descriptor);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100644 return IsSupportedForDataTypeNeon(reasonIfUnsupported,
645 input.GetDataType(),
646 &TrueFunc<>,
647 &TrueFunc<>);
648}
649
Aron Virginas-Tar169d2f12019-07-01 19:01:44 +0100650bool NeonLayerSupport::IsResizeSupported(const TensorInfo& input,
651 const TensorInfo& output,
652 const ResizeDescriptor& descriptor,
653 Optional<std::string&> reasonIfUnsupported) const
654{
Ellen Norris-Thompson37e68682019-07-15 14:23:30 +0100655 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonResizeWorkloadValidate,
656 reasonIfUnsupported,
657 input,
658 output,
659 descriptor);
Aron Virginas-Tar169d2f12019-07-01 19:01:44 +0100660}
661
Sadik Armaganc625f002018-12-17 11:32:16 +0000662bool NeonLayerSupport::IsResizeBilinearSupported(const TensorInfo& input,
663 const TensorInfo& output,
664 Optional<std::string&> reasonIfUnsupported) const
665{
Ellen Norris-Thompson37e68682019-07-15 14:23:30 +0100666 ResizeDescriptor descriptor;
667 descriptor.m_Method = ResizeMethod::Bilinear;
668 descriptor.m_DataLayout = DataLayout::NCHW;
669
670 const TensorShape& outputShape = output.GetShape();
671 descriptor.m_TargetHeight = outputShape[2];
672 descriptor.m_TargetWidth = outputShape[3];
673
674 return IsResizeSupported(input, output, descriptor, reasonIfUnsupported);
Sadik Armaganc625f002018-12-17 11:32:16 +0000675}
676
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +0100677bool NeonLayerSupport::IsRsqrtSupported(const TensorInfo& input,
678 const TensorInfo& output,
679 Optional<std::string&> reasonIfUnsupported) const
680{
josh minor4a3c6102020-01-06 16:40:46 -0600681 ElementwiseUnaryDescriptor descriptor(UnaryOperation::Rsqrt);
682 return IsElementwiseUnarySupported(input, output, descriptor, reasonIfUnsupported);
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +0100683}
684
josh minor036f02d2019-11-15 14:53:22 -0600685bool NeonLayerSupport::IsSliceSupported(const TensorInfo& input,
686 const TensorInfo& output,
687 const SliceDescriptor& descriptor,
688 Optional<std::string&> reasonIfUnsupported) const
689{
690 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSliceWorkloadValidate,
691 reasonIfUnsupported,
692 input,
693 output,
694 descriptor);
695}
696
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100697bool NeonLayerSupport::IsSoftmaxSupported(const TensorInfo& input,
698 const TensorInfo& output,
699 const SoftmaxDescriptor& descriptor,
700 Optional<std::string&> reasonIfUnsupported) const
701{
702 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSoftmaxWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
703}
704
Mike Kelly0be3a882020-01-24 11:27:50 +0000705bool NeonLayerSupport::IsSpaceToBatchNdSupported(const TensorInfo& input,
706 const TensorInfo& output,
707 const SpaceToBatchNdDescriptor& descriptor,
708 Optional<std::string&> reasonIfUnsupported) const
709{
710 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSpaceToBatchNdWorkloadValidate,
711 reasonIfUnsupported,
712 input,
713 output,
714 descriptor);
715}
716
Ellen Norris-Thompson29794572019-06-26 16:40:36 +0100717bool NeonLayerSupport::IsSpaceToDepthSupported(const TensorInfo& input,
Mike Kelly0be3a882020-01-24 11:27:50 +0000718 const TensorInfo& output,
719 const SpaceToDepthDescriptor& descriptor,
720 Optional<std::string&> reasonIfUnsupported) const
Ellen Norris-Thompson29794572019-06-26 16:40:36 +0100721{
722 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSpaceToDepthWorkloadValidate,
723 reasonIfUnsupported,
724 input,
725 output,
726 descriptor);
727}
728
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100729bool NeonLayerSupport::IsSplitterSupported(const TensorInfo& input,
730 const ViewsDescriptor& descriptor,
731 Optional<std::string&> reasonIfUnsupported) const
732{
733 ignore_unused(descriptor);
734 return IsSupportedForDataTypeNeon(reasonIfUnsupported,
735 input.GetDataType(),
736 &TrueFunc<>,
737 &TrueFunc<>);
738}
739
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +0100740bool NeonLayerSupport::IsSplitterSupported(const TensorInfo& input,
741 const std::vector<std::reference_wrapper<TensorInfo>>& outputs,
742 const ViewsDescriptor& descriptor,
743 Optional<std::string&> reasonIfUnsupported) const
744{
745#if defined(ARMCOMPUTENEON_ENABLED)
746 // Split along the last dimension, cannot use sub-tensors
747 // as width and height of the sub-tensors do not match
748 // the width and height of the parent tensor
749 // in case of input with more than 2D.
750 std::set<unsigned int> splitAxis = ComputeSplitAxis(descriptor, input.GetShape());
751 if (descriptor.GetNumDimensions() > 2 && splitAxis.size() == 1 &&
752 *splitAxis.begin() == descriptor.GetNumDimensions() - 1 )
753 {
754 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSplitterWorkloadValidate,
755 reasonIfUnsupported,
756 input,
757 outputs,
758 *splitAxis.begin());
759 }
760#endif
Derek Lamberti901ea112019-12-10 22:07:09 +0000761 boost::ignore_unused(descriptor);
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +0100762 for (auto output : outputs)
763 {
764 if (!input.IsTypeSpaceMatch(output)) // Cannot use sub-tensors if the types are not same space
765 {
766 SetValueChecked(reasonIfUnsupported, "Neon Splitter: Types and quantization parameters must match.");
767 return false;
768 }
769 }
770 return true;
771}
772
Matthew Jackson87f65ea2019-08-01 10:01:34 +0100773bool NeonLayerSupport::IsStackSupported(const std::vector<const TensorInfo*>& inputs,
774 const TensorInfo& output,
775 const StackDescriptor& descriptor,
776 Optional<std::string&> reasonIfUnsupported) const
777{
778 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonStackWorkloadValidate,
779 reasonIfUnsupported,
780 inputs,
781 output,
782 descriptor);
783}
784
FinnWilliamsArm1fa19192019-08-02 17:26:31 +0100785bool NeonLayerSupport::IsStridedSliceSupported(const TensorInfo& input,
786 const TensorInfo& output,
787 const StridedSliceDescriptor& descriptor,
788 Optional<std::string&> reasonIfUnsupported) const
789{
790 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonStridedSliceWorkloadValidate,
791 reasonIfUnsupported,
792 input,
793 output,
794 descriptor);
795}
796
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100797bool NeonLayerSupport::IsSubtractionSupported(const TensorInfo& input0,
798 const TensorInfo& input1,
799 const TensorInfo& output,
800 Optional<std::string&> reasonIfUnsupported) const
801{
802 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSubtractionWorkloadValidate,
803 reasonIfUnsupported,
804 input0,
805 input1,
806 output);
807}
808
Sadik Armagan581742d2019-08-12 14:11:37 +0100809bool NeonLayerSupport::IsTransposeConvolution2dSupported(const TensorInfo& input,
810 const TensorInfo& output,
811 const TransposeConvolution2dDescriptor& descriptor,
812 const TensorInfo& weights,
813 const Optional<TensorInfo>& biases,
814 Optional<std::string&> reasonIfUnsupported) const
815{
Aron Virginas-Tar710f6642019-11-27 14:48:32 +0000816 if (!IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights))
James Conroyb86a3822019-11-19 15:28:58 +0000817 {
818 return false;
819 }
820
Sadik Armagan581742d2019-08-12 14:11:37 +0100821 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonTransposeConvolution2dWorkloadValidate,
822 reasonIfUnsupported,
823 input,
824 output,
825 descriptor,
826 weights,
827 biases);
828}
829
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100830} // namespace armnn