blob: 3fc323393e9f5508665997fe6c68b82c5103cf0a [file] [log] [blame]
telsoa014fcda012018-03-09 14:13:49 +00001//
2// Copyright © 2017 Arm Ltd. All rights reserved.
David Beckecb56cd2018-09-05 12:52:57 +01003// SPDX-License-Identifier: MIT
telsoa014fcda012018-03-09 14:13:49 +00004//
5
6#include "NeonLayerSupport.hpp"
David Beck3e9e1152018-10-17 14:17:50 +01007#include "NeonBackendId.hpp"
telsoa014fcda012018-03-09 14:13:49 +00008
telsoa014fcda012018-03-09 14:13:49 +00009#include <armnn/Descriptors.hpp>
telsoa014fcda012018-03-09 14:13:49 +000010#include <armnn/Tensor.hpp>
Aron Virginas-Tarfc824312018-10-15 15:00:13 +010011#include <armnn/Types.hpp>
Matteo Martincighc601aa62019-10-29 15:03:22 +000012#include <armnn/BackendRegistry.hpp>
telsoa014fcda012018-03-09 14:13:49 +000013
Matteo Martincighc601aa62019-10-29 15:03:22 +000014#include <InternalTypes.hpp>
15#include <LayerSupportCommon.hpp>
David Beck3e9e1152018-10-17 14:17:50 +010016
telsoa014fcda012018-03-09 14:13:49 +000017#include <boost/core/ignore_unused.hpp>
18
Matteo Martincighd95e9062019-01-31 15:35:59 +000019#if defined(ARMCOMPUTENEON_ENABLED)
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +010020#include <aclCommon/ArmComputeUtils.hpp>
Aron Virginas-Tar710f6642019-11-27 14:48:32 +000021#include <aclCommon/ArmComputeTensorUtils.hpp>
Aron Virginas-Tar914e4db2019-09-09 13:36:45 +010022#include "workloads/NeonAbsWorkload.hpp"
Matthew Bentham955258d2018-12-10 10:48:52 +000023#include "workloads/NeonAdditionWorkload.hpp"
Nattapat Chaimanowongd4b70592018-10-12 11:21:49 +010024#include "workloads/NeonActivationWorkload.hpp"
James Conroyd47a0642019-09-17 14:22:06 +010025#include "workloads/NeonArgMinMaxWorkload.hpp"
Matthew Benthamc48ac8c2018-12-12 16:15:59 +000026#include "workloads/NeonBatchNormalizationWorkload.hpp"
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +010027#include "workloads/NeonConvolution2dWorkload.hpp"
Aron Virginas-Tar2f00b742019-09-30 13:28:08 +010028#include "workloads/NeonDepthToSpaceWorkload.hpp"
Nattapat Chaimanowong77140882018-10-17 11:12:19 +010029#include "workloads/NeonDepthwiseConvolutionWorkload.hpp"
Narumol Prangnawarat01961a72019-05-30 16:47:12 +010030#include "workloads/NeonDequantizeWorkload.hpp"
Derek Lamberti6a5e5e82019-12-05 14:41:20 +000031#include "workloads/NeonDetectionPostProcessWorkload.hpp"
kevmay01eed85922019-01-28 08:37:25 +000032#include "workloads/NeonGreaterWorkload.hpp"
Sadik Armagan0d4863d2019-10-09 14:26:32 +010033#include "workloads/NeonInstanceNormalizationWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010034#include "workloads/NeonL2NormalizationFloatWorkload.hpp"
Jan Eilersad5293a2019-07-08 09:57:55 +010035#include "workloads/NeonLstmFloatWorkload.hpp"
Nattapat Chaimanowong4e6597a2018-12-20 14:14:06 +000036#include "workloads/NeonMaximumWorkload.hpp"
Matthew Benthamfd899962018-12-31 15:49:42 +000037#include "workloads/NeonMeanWorkload.hpp"
Jim Flynn39d487d2019-05-17 15:44:36 +010038#include "workloads/NeonConcatWorkload.hpp"
Conor Kennedy54b21692019-01-09 07:57:38 +000039#include "workloads/NeonMinimumWorkload.hpp"
Conor Kennedyb99480b2019-03-08 08:24:41 +000040#include "workloads/NeonMultiplicationWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010041#include "workloads/NeonNormalizationFloatWorkload.hpp"
42#include "workloads/NeonFullyConnectedWorkload.hpp"
Éanna Ó Catháin12055742019-01-25 10:01:40 +000043#include "workloads/NeonPadWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010044#include "workloads/NeonPermuteWorkload.hpp"
Nattapat Chaimanowong5d2e7002018-10-12 16:03:56 +010045#include "workloads/NeonPooling2dWorkload.hpp"
Nikhil Raj9b461482019-07-03 15:58:31 +010046#include "workloads/NeonPreluWorkload.hpp"
Sadik Armaganfabc2892019-05-31 09:05:11 +010047#include "workloads/NeonQuantizeWorkload.hpp"
Francis Murtagh4fc3c482019-08-02 13:20:54 +010048#include "workloads/NeonQuantizedLstmWorkload.hpp"
Ellen Norris-Thompson37e68682019-07-15 14:23:30 +010049#include "workloads/NeonResizeWorkload.hpp"
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +010050#include "workloads/NeonRsqrtWorkload.hpp"
josh minor036f02d2019-11-15 14:53:22 -060051#include "workloads/NeonSliceWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010052#include "workloads/NeonSoftmaxBaseWorkload.hpp"
Ellen Norris-Thompson29794572019-06-26 16:40:36 +010053#include "workloads/NeonSpaceToDepthWorkload.hpp"
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +010054#include "workloads/NeonSplitterWorkload.hpp"
Matthew Jackson87f65ea2019-08-01 10:01:34 +010055#include "workloads/NeonStackWorkload.hpp"
FinnWilliamsArm1fa19192019-08-02 17:26:31 +010056#include "workloads/NeonStridedSliceWorkload.hpp"
Conor Kennedyb99480b2019-03-08 08:24:41 +000057#include "workloads/NeonSubtractionWorkload.hpp"
Sadik Armagan581742d2019-08-12 14:11:37 +010058#include "workloads/NeonTransposeConvolution2dWorkload.hpp"
telsoa014fcda012018-03-09 14:13:49 +000059#endif
60
61using namespace boost;
62
63namespace armnn
64{
telsoa014fcda012018-03-09 14:13:49 +000065
Aron Virginas-Tarfc824312018-10-15 15:00:13 +010066namespace
arovir017ff76c52018-10-09 09:40:58 +010067{
telsoa014fcda012018-03-09 14:13:49 +000068
arovir01085f0a42018-10-08 14:48:19 +010069bool IsNeonBackendSupported(Optional<std::string&> reasonIfUnsupported)
telsoa014fcda012018-03-09 14:13:49 +000070{
Matteo Martincighd95e9062019-01-31 15:35:59 +000071#if defined(ARMCOMPUTENEON_ENABLED)
telsoa014fcda012018-03-09 14:13:49 +000072 return true;
73#else
Derek Lamberti0790dce2019-04-15 18:37:35 +010074 SetValueChecked(reasonIfUnsupported, "The armnn library has been built without NEON support");
telsoa014fcda012018-03-09 14:13:49 +000075 return false;
76#endif
77}
78
telsoa01c577f2c2018-08-31 09:22:23 +010079template<typename FloatFunc, typename Uint8Func, typename ... Params>
arovir01085f0a42018-10-08 14:48:19 +010080bool IsSupportedForDataTypeNeon(Optional<std::string&> reasonIfUnsupported,
telsoa014fcda012018-03-09 14:13:49 +000081 DataType dataType,
telsoa01c577f2c2018-08-31 09:22:23 +010082 FloatFunc floatFuncPtr,
telsoa014fcda012018-03-09 14:13:49 +000083 Uint8Func uint8FuncPtr,
84 Params&&... params)
85{
86 return IsNeonBackendSupported(reasonIfUnsupported) &&
87 IsSupportedForDataTypeGeneric(reasonIfUnsupported,
88 dataType,
89 floatFuncPtr,
telsoa01c577f2c2018-08-31 09:22:23 +010090 floatFuncPtr,
telsoa014fcda012018-03-09 14:13:49 +000091 uint8FuncPtr,
narpra01db2b1602019-01-23 15:23:11 +000092 &FalseFunc<>,
kevmay012b4d88e2019-01-24 14:05:09 +000093 &FalseFunc<>,
telsoa014fcda012018-03-09 14:13:49 +000094 std::forward<Params>(params)...);
95}
96
#if defined(ARMCOMPUTENEON_ENABLED)
/// Invokes a validate function and turns the arm_compute::Status it returns into a bool.
/// @param func                Callable invoked with the forwarded args; its result is stored as arm_compute::Status.
/// @param reasonIfUnsupported Optional string; receives the status' error description on failure.
/// @param args                Arguments forwarded unchanged to func.
/// @return true only when the status' error code is arm_compute::ErrorCode::OK.
template<class FuncType, class... Args>
inline bool IsWorkloadSupported(FuncType& func, Optional<std::string&> reasonIfUnsupported, Args&&... args)
{
    arm_compute::Status validationStatus = func(std::forward<Args>(args)...);
    if (validationStatus.error_code() == arm_compute::ErrorCode::OK)
    {
        return true;
    }

    if (reasonIfUnsupported)
    {
        reasonIfUnsupported.value() = validationStatus.error_description();
    }
    return false;
}

// Expands to a complete return statement: the enclosing function returns the outcome of passing the
// validate function and its arguments through IsWorkloadSupported.
#define FORWARD_WORKLOAD_VALIDATE_FUNC(func, reasonIfUnsupported, ...) \
    return IsWorkloadSupported(func, reasonIfUnsupported, __VA_ARGS__);
#else
// Without Neon support the validate function and its arguments are discarded; the enclosing function
// just returns IsNeonBackendSupported(reasonIfUnsupported).
#define FORWARD_WORKLOAD_VALIDATE_FUNC(func, reasonIfUnsupported, ...) \
    return IsNeonBackendSupported(reasonIfUnsupported);
#endif
116
// Quantization multiplier check used by the convolution-style queries below.
// Without Neon support the check is a constant true; otherwise it defers to
// armcomputetensorutils::IsQuantMultiplierSupported.
#if !defined(ARMCOMPUTENEON_ENABLED)
#define IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights) true
#else
#define IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights) \
armcomputetensorutils::IsQuantMultiplierSupported(input, output, weights)
#endif
123
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100124} // anonymous namespace
125
Aron Virginas-Tar914e4db2019-09-09 13:36:45 +0100126bool NeonLayerSupport::IsAbsSupported(const TensorInfo& input,
127 const TensorInfo& output,
128 Optional<std::string&> reasonIfUnsupported) const
129{
130 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonAbsWorkloadValidate,
131 reasonIfUnsupported,
132 input,
133 output);
134}
135
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100136bool NeonLayerSupport::IsActivationSupported(const TensorInfo& input,
137 const TensorInfo& output,
138 const ActivationDescriptor& descriptor,
139 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000140{
141 ignore_unused(descriptor);
telsoa01c577f2c2018-08-31 09:22:23 +0100142 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonActivationWorkloadValidate,
143 reasonIfUnsupported,
144 input,
145 output,
146 descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000147}
148
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100149bool NeonLayerSupport::IsAdditionSupported(const TensorInfo& input0,
150 const TensorInfo& input1,
151 const TensorInfo& output,
152 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000153{
telsoa01c577f2c2018-08-31 09:22:23 +0100154 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonAdditionWorkloadValidate,
155 reasonIfUnsupported,
156 input0,
157 input1,
158 output);
telsoa014fcda012018-03-09 14:13:49 +0000159}
160
James Conroyd47a0642019-09-17 14:22:06 +0100161bool NeonLayerSupport::IsArgMinMaxSupported(const TensorInfo& input,
162 const TensorInfo& output,
163 const ArgMinMaxDescriptor& descriptor,
164 Optional<std::string&> reasonIfUnsupported) const
165{
166 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonArgMinMaxWorkloadValidate,
167 reasonIfUnsupported,
168 input,
169 output,
170 descriptor);
171}
172
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100173bool NeonLayerSupport::IsBatchNormalizationSupported(const TensorInfo& input,
174 const TensorInfo& output,
175 const TensorInfo& mean,
176 const TensorInfo& var,
177 const TensorInfo& beta,
178 const TensorInfo& gamma,
179 const BatchNormalizationDescriptor& descriptor,
180 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000181{
telsoa01c577f2c2018-08-31 09:22:23 +0100182 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonBatchNormalizationValidate,
183 reasonIfUnsupported,
184 input,
185 output,
186 mean,
187 var,
188 beta,
189 gamma,
190 descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000191}
192
Aron Virginas-Tar77bfb5e2019-10-16 17:45:38 +0100193bool NeonLayerSupport::IsComparisonSupported(const TensorInfo& input0,
194 const TensorInfo& input1,
195 const TensorInfo& output,
196 const ComparisonDescriptor& descriptor,
197 Optional<std::string&> reasonIfUnsupported) const
198{
199 if (descriptor.m_Operation == ComparisonOperation::Greater)
200 {
201 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonGreaterWorkloadValidate,
202 reasonIfUnsupported,
203 input0,
204 input1,
205 output);
206 }
207
208 return false;
209}
210
Jim Flynn906f9462019-05-10 13:55:21 +0100211bool NeonLayerSupport::IsConcatSupported(const std::vector<const TensorInfo*> inputs,
212 const TensorInfo& output,
Jim Flynne242f2d2019-05-22 14:24:13 +0100213 const ConcatDescriptor& descriptor,
Jim Flynn906f9462019-05-10 13:55:21 +0100214 Optional<std::string&> reasonIfUnsupported) const
215{
Jim Flynne242f2d2019-05-22 14:24:13 +0100216 if (descriptor.GetNumDimensions() <= descriptor.GetConcatAxis())
217 {
218 SetValueChecked(reasonIfUnsupported, "Neon Concat: Concat axis > Number of dimensions.");
219 return false;
220 }
221
222 unsigned int concatInnerAxis = (descriptor.GetNumDimensions() - descriptor.GetConcatAxis()) - 1;
223 if(concatInnerAxis < 3) // Width, height, or channels
224 {
225 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonConcatWorkloadValidate,
226 reasonIfUnsupported,
227 inputs,
228 output,
229 descriptor);
230 }
231 else if (concatInnerAxis == 3)
232 {
233 for (auto& input : inputs)
234 {
235 if (input && !output.IsTypeSpaceMatch(*input)) // Cannot use sub-tensors if the types are not same space
236 {
237 SetValueChecked(reasonIfUnsupported, "Neon Concat: Types and quantization parameters must match.");
238 return false;
239 }
240 }
241 return true; // Sub-tensors support concat along batch
242 }
243 else // > 4 dimensions not supported.
244 {
245 SetValueChecked(reasonIfUnsupported, "Neon Concat: Maximum of 4 dimensions supported.");
246 return false;
247 }
Jim Flynn906f9462019-05-10 13:55:21 +0100248}
249
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100250bool NeonLayerSupport::IsConstantSupported(const TensorInfo& output,
251 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000252{
253 return IsSupportedForDataTypeNeon(reasonIfUnsupported,
254 output.GetDataType(),
255 &TrueFunc<>,
256 &TrueFunc<>);
257}
258
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100259bool NeonLayerSupport::IsConvertFp16ToFp32Supported(const TensorInfo& input,
260 const TensorInfo& output,
261 Optional<std::string&> reasonIfUnsupported) const
262{
263 ignore_unused(input);
264 ignore_unused(output);
265 ignore_unused(reasonIfUnsupported);
266 return true;
267}
268
269bool NeonLayerSupport::IsConvertFp32ToFp16Supported(const TensorInfo& input,
270 const TensorInfo& output,
271 Optional<std::string&> reasonIfUnsupported) const
272{
273 ignore_unused(input);
274 ignore_unused(output);
275 ignore_unused(reasonIfUnsupported);
276 return true;
277}
278
279bool NeonLayerSupport::IsConvolution2dSupported(const TensorInfo& input,
280 const TensorInfo& output,
281 const Convolution2dDescriptor& descriptor,
282 const TensorInfo& weights,
283 const Optional<TensorInfo>& biases,
284 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000285{
Aron Virginas-Tar710f6642019-11-27 14:48:32 +0000286 if (!IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights))
James Conroyb86a3822019-11-19 15:28:58 +0000287 {
288 return false;
289 }
290
surmeh013537c2c2018-05-18 16:31:43 +0100291 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonConvolution2dWorkloadValidate,
292 reasonIfUnsupported,
293 input,
294 output,
295 descriptor,
296 weights,
297 biases);
telsoa014fcda012018-03-09 14:13:49 +0000298}
299
Aron Virginas-Tar2f00b742019-09-30 13:28:08 +0100300bool NeonLayerSupport::IsDepthToSpaceSupported(const TensorInfo& input,
301 const TensorInfo& output,
302 const DepthToSpaceDescriptor& descriptor,
303 Optional<std::string&> reasonIfUnsupported) const
304{
305 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDepthToSpaceWorkloadValidate,
306 reasonIfUnsupported,
307 input,
308 output,
309 descriptor);
310}
311
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100312bool NeonLayerSupport::IsDepthwiseConvolutionSupported(const TensorInfo& input,
313 const TensorInfo& output,
314 const DepthwiseConvolution2dDescriptor& descriptor,
315 const TensorInfo& weights,
316 const Optional<TensorInfo>& biases,
317 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000318{
Aron Virginas-Tar710f6642019-11-27 14:48:32 +0000319 if (!IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights))
James Conroyb86a3822019-11-19 15:28:58 +0000320 {
321 return false;
322 }
323
telsoa01c577f2c2018-08-31 09:22:23 +0100324 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDepthwiseConvolutionWorkloadValidate,
325 reasonIfUnsupported,
326 input,
327 output,
328 descriptor,
329 weights,
330 biases);
telsoa014fcda012018-03-09 14:13:49 +0000331}
332
Narumol Prangnawarat01961a72019-05-30 16:47:12 +0100333bool NeonLayerSupport::IsDequantizeSupported(const TensorInfo& input,
334 const TensorInfo& output,
335 Optional<std::string&> reasonIfUnsupported) const
336{
337 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDequantizeWorkloadValidate,
338 reasonIfUnsupported,
339 input,
340 output);
341}
342
Derek Lamberti6a5e5e82019-12-05 14:41:20 +0000343bool NeonLayerSupport::IsDetectionPostProcessSupported(const TensorInfo& boxEncodings,
344 const TensorInfo& scores,
345 const TensorInfo& anchors,
346 const TensorInfo& detectionBoxes,
347 const TensorInfo& detectionClasses,
348 const TensorInfo& detectionScores,
349 const TensorInfo& numDetections,
350 const DetectionPostProcessDescriptor& descriptor,
351 Optional<std::string&> reasonIfUnsupported) const
352{
353 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDetectionPostProcessValidate,
354 reasonIfUnsupported,
355 boxEncodings,
356 scores,
357 anchors,
358 detectionBoxes,
359 detectionClasses,
360 detectionScores,
361 numDetections,
362 descriptor);
363}
364
365
Pablo Tellof0bd6832019-04-26 17:58:13 +0100366bool NeonLayerSupport::IsDilatedDepthwiseConvolutionSupported(const TensorInfo& input,
367 const TensorInfo& output,
368 const DepthwiseConvolution2dDescriptor& descriptor,
369 const TensorInfo& weights,
370 const Optional<TensorInfo>& biases,
371 Optional<std::string&> reasonIfUnsupported) const
372{
Aron Virginas-Tar710f6642019-11-27 14:48:32 +0000373 if (!IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights))
James Conroyb86a3822019-11-19 15:28:58 +0000374 {
375 return false;
376 }
377
Pablo Tellof0bd6832019-04-26 17:58:13 +0100378 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDepthwiseConvolutionWorkloadValidate,
379 reasonIfUnsupported,
380 input,
381 output,
382 descriptor,
383 weights,
384 biases);
385}
386
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100387bool NeonLayerSupport::IsFloorSupported(const TensorInfo& input,
388 const TensorInfo& output,
389 Optional<std::string&> reasonIfUnsupported) const
390{
391 ignore_unused(output);
392 return IsNeonBackendSupported(reasonIfUnsupported) &&
393 IsSupportedForDataTypeGeneric(reasonIfUnsupported,
394 input.GetDataType(),
395 &FalseFuncF16<>,
396 &TrueFunc<>,
narpra01db2b1602019-01-23 15:23:11 +0000397 &FalseFuncU8<>,
kevmay012b4d88e2019-01-24 14:05:09 +0000398 &FalseFuncI32<>,
399 &FalseFuncU8<>);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100400}
401
402bool NeonLayerSupport::IsFullyConnectedSupported(const TensorInfo& input,
403 const TensorInfo& output,
404 const TensorInfo& weights,
405 const TensorInfo& biases,
406 const FullyConnectedDescriptor& descriptor,
407 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000408{
telsoa01c577f2c2018-08-31 09:22:23 +0100409 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonFullyConnectedWorkloadValidate,
410 reasonIfUnsupported,
411 input,
412 output,
413 weights,
414 biases,
415 descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000416}
417
kevmay01eed85922019-01-28 08:37:25 +0000418bool NeonLayerSupport::IsGreaterSupported(const armnn::TensorInfo& input0,
419 const armnn::TensorInfo& input1,
420 const armnn::TensorInfo& output,
421 armnn::Optional<std::string&> reasonIfUnsupported) const
422{
Aron Virginas-Tar77bfb5e2019-10-16 17:45:38 +0100423 ComparisonDescriptor descriptor(ComparisonOperation::Greater);
424 return IsComparisonSupported(input0, input1, output, descriptor, reasonIfUnsupported);
kevmay01eed85922019-01-28 08:37:25 +0000425}
426
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100427bool NeonLayerSupport::IsInputSupported(const TensorInfo& input,
428 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000429{
Francis Murtaghb3fc2522019-08-09 13:20:50 +0100430 return IsNeonBackendSupported(reasonIfUnsupported);
telsoa014fcda012018-03-09 14:13:49 +0000431}
432
Sadik Armagan0d4863d2019-10-09 14:26:32 +0100433bool NeonLayerSupport::IsInstanceNormalizationSupported(const TensorInfo& input,
434 const TensorInfo& output,
435 const InstanceNormalizationDescriptor& descriptor,
436 Optional<std::string&> reasonIfUnsupported) const
437{
438 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonInstanceNormalizationWorkloadValidate,
439 reasonIfUnsupported,
440 input,
441 output,
442 descriptor);
443}
444
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100445bool NeonLayerSupport::IsL2NormalizationSupported(const TensorInfo& input,
446 const TensorInfo& output,
447 const L2NormalizationDescriptor& descriptor,
448 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000449{
Matteo Martincighbcd3c852018-09-28 14:14:12 +0100450 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonL2NormalizationWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000451}
452
Jan Eilersad5293a2019-07-08 09:57:55 +0100453bool NeonLayerSupport::IsLstmSupported(const TensorInfo& input,
454 const TensorInfo& outputStateIn,
455 const TensorInfo& cellStateIn,
456 const TensorInfo& scratchBuffer,
457 const TensorInfo& outputStateOut,
458 const TensorInfo& cellStateOut,
459 const TensorInfo& output,
460 const LstmDescriptor& descriptor,
461 const LstmInputParamsInfo& paramsInfo,
462 Optional<std::string&> reasonIfUnsupported) const
463{
464 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonLstmFloatWorkloadValidate,
465 reasonIfUnsupported,
466 input,
467 outputStateIn,
468 cellStateIn,
469 scratchBuffer,
470 outputStateOut,
471 cellStateOut,
472 output,
473 descriptor,
474 paramsInfo);
475}
476
Nattapat Chaimanowong4e6597a2018-12-20 14:14:06 +0000477bool NeonLayerSupport::IsMaximumSupported(const TensorInfo& input0,
478 const TensorInfo& input1,
479 const TensorInfo& output,
480 Optional<std::string&> reasonIfUnsupported) const
481{
482 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMaximumWorkloadValidate,
483 reasonIfUnsupported,
484 input0,
485 input1,
486 output);
487}
488
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100489bool NeonLayerSupport::IsMeanSupported(const TensorInfo& input,
490 const TensorInfo& output,
491 const MeanDescriptor& descriptor,
492 Optional<std::string&> reasonIfUnsupported) const
narpra0132b90462018-09-13 11:07:48 +0100493{
Matthew Benthamfd899962018-12-31 15:49:42 +0000494 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMeanWorkloadValidate,
495 reasonIfUnsupported,
496 input,
497 output,
498 descriptor);
narpra0132b90462018-09-13 11:07:48 +0100499}
500
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100501bool NeonLayerSupport::IsMergerSupported(const std::vector<const TensorInfo*> inputs,
Nikhil Raj8599a412018-11-19 14:51:07 +0000502 const TensorInfo& output,
Jim Flynne242f2d2019-05-22 14:24:13 +0100503 const MergerDescriptor& descriptor,
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100504 Optional<std::string&> reasonIfUnsupported) const
505{
Jim Flynne242f2d2019-05-22 14:24:13 +0100506 return IsConcatSupported(inputs, output, descriptor, reasonIfUnsupported);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100507}
508
Conor Kennedy54b21692019-01-09 07:57:38 +0000509bool NeonLayerSupport::IsMinimumSupported(const TensorInfo& input0,
510 const TensorInfo& input1,
511 const TensorInfo& output,
512 Optional<std::string&> reasonIfUnsupported) const
513{
514 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMinimumWorkloadValidate,
515 reasonIfUnsupported,
516 input0,
517 input1,
518 output);
519}
520
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100521bool NeonLayerSupport::IsMultiplicationSupported(const TensorInfo& input0,
522 const TensorInfo& input1,
523 const TensorInfo& output,
524 Optional<std::string&> reasonIfUnsupported) const
525{
526 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMultiplicationWorkloadValidate,
527 reasonIfUnsupported,
528 input0,
529 input1,
530 output);
531}
532
533bool NeonLayerSupport::IsNormalizationSupported(const TensorInfo& input,
534 const TensorInfo& output,
535 const NormalizationDescriptor& descriptor,
536 Optional<std::string&> reasonIfUnsupported) const
537{
538 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonNormalizationWorkloadValidate,
539 reasonIfUnsupported,
540 input,
541 output,
542 descriptor);
543}
544
545bool NeonLayerSupport::IsOutputSupported(const TensorInfo& output,
546 Optional<std::string&> reasonIfUnsupported) const
547{
Francis Murtaghb3fc2522019-08-09 13:20:50 +0100548 return IsNeonBackendSupported(reasonIfUnsupported);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100549}
550
Éanna Ó Catháin12055742019-01-25 10:01:40 +0000551bool NeonLayerSupport::IsPadSupported(const TensorInfo& input,
552 const TensorInfo& output,
553 const PadDescriptor& descriptor,
554 Optional<std::string&> reasonIfUnsupported) const
555{
556 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPadWorkloadValidate,
557 reasonIfUnsupported,
558 input,
559 output,
560 descriptor);
561}
562
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100563bool NeonLayerSupport::IsPermuteSupported(const TensorInfo& input,
564 const TensorInfo& output,
565 const PermuteDescriptor& descriptor,
566 Optional<std::string&> reasonIfUnsupported) const
567{
568 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPermuteWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000569}
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100570
571bool NeonLayerSupport::IsPooling2dSupported(const TensorInfo& input,
572 const TensorInfo& output,
573 const Pooling2dDescriptor& descriptor,
574 Optional<std::string&> reasonIfUnsupported) const
575{
576 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPooling2dWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
577}
578
Nikhil Raj9b461482019-07-03 15:58:31 +0100579bool NeonLayerSupport::IsPreluSupported(const armnn::TensorInfo &input,
580 const armnn::TensorInfo &alpha,
581 const armnn::TensorInfo &output,
582 armnn::Optional<std::string &> reasonIfUnsupported) const
583{
584 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPreluWorkloadValidate, reasonIfUnsupported, input, alpha, output);
585}
586
Sadik Armaganfabc2892019-05-31 09:05:11 +0100587bool NeonLayerSupport::IsQuantizeSupported(const TensorInfo& input,
588 const TensorInfo& output,
589 Optional<std::string&> reasonIfUnsupported) const
590{
591 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonQuantizeWorkloadValidate,
592 reasonIfUnsupported,
593 input,
594 output);
595}
596
Francis Murtagh4fc3c482019-08-02 13:20:54 +0100597bool NeonLayerSupport::IsQuantizedLstmSupported(const TensorInfo& input,
598 const TensorInfo& cellStateIn,
599 const TensorInfo& outputStateIn,
600 const TensorInfo& cellStateOut,
601 const TensorInfo& outputStateOut,
602 const QuantizedLstmInputParamsInfo& paramsInfo,
603 Optional<std::string&> reasonIfUnsupported) const
604{
605 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonQuantizedLstmWorkloadValidate,
606 reasonIfUnsupported,
607 input,
608 cellStateIn,
609 outputStateIn,
610 cellStateOut,
611 outputStateOut,
612 paramsInfo);
613}
614
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100615bool NeonLayerSupport::IsReshapeSupported(const TensorInfo& input,
Matteo Martincigh992d6dc2019-01-10 17:34:20 +0000616 const ReshapeDescriptor& descriptor,
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100617 Optional<std::string&> reasonIfUnsupported) const
618{
Matteo Martincigh992d6dc2019-01-10 17:34:20 +0000619 ignore_unused(descriptor);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100620 return IsSupportedForDataTypeNeon(reasonIfUnsupported,
621 input.GetDataType(),
622 &TrueFunc<>,
623 &TrueFunc<>);
624}
625
Aron Virginas-Tar169d2f12019-07-01 19:01:44 +0100626bool NeonLayerSupport::IsResizeSupported(const TensorInfo& input,
627 const TensorInfo& output,
628 const ResizeDescriptor& descriptor,
629 Optional<std::string&> reasonIfUnsupported) const
630{
Ellen Norris-Thompson37e68682019-07-15 14:23:30 +0100631 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonResizeWorkloadValidate,
632 reasonIfUnsupported,
633 input,
634 output,
635 descriptor);
Aron Virginas-Tar169d2f12019-07-01 19:01:44 +0100636}
637
Sadik Armaganc625f002018-12-17 11:32:16 +0000638bool NeonLayerSupport::IsResizeBilinearSupported(const TensorInfo& input,
639 const TensorInfo& output,
640 Optional<std::string&> reasonIfUnsupported) const
641{
Ellen Norris-Thompson37e68682019-07-15 14:23:30 +0100642 ResizeDescriptor descriptor;
643 descriptor.m_Method = ResizeMethod::Bilinear;
644 descriptor.m_DataLayout = DataLayout::NCHW;
645
646 const TensorShape& outputShape = output.GetShape();
647 descriptor.m_TargetHeight = outputShape[2];
648 descriptor.m_TargetWidth = outputShape[3];
649
650 return IsResizeSupported(input, output, descriptor, reasonIfUnsupported);
Sadik Armaganc625f002018-12-17 11:32:16 +0000651}
652
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +0100653bool NeonLayerSupport::IsRsqrtSupported(const TensorInfo& input,
654 const TensorInfo& output,
655 Optional<std::string&> reasonIfUnsupported) const
656{
657 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonRsqrtWorkloadValidate, reasonIfUnsupported, input, output);
658}
659
josh minor036f02d2019-11-15 14:53:22 -0600660bool NeonLayerSupport::IsSliceSupported(const TensorInfo& input,
661 const TensorInfo& output,
662 const SliceDescriptor& descriptor,
663 Optional<std::string&> reasonIfUnsupported) const
664{
665 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSliceWorkloadValidate,
666 reasonIfUnsupported,
667 input,
668 output,
669 descriptor);
670}
671
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100672bool NeonLayerSupport::IsSoftmaxSupported(const TensorInfo& input,
673 const TensorInfo& output,
674 const SoftmaxDescriptor& descriptor,
675 Optional<std::string&> reasonIfUnsupported) const
676{
677 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSoftmaxWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
678}
679
Ellen Norris-Thompson29794572019-06-26 16:40:36 +0100680bool NeonLayerSupport::IsSpaceToDepthSupported(const TensorInfo& input,
681 const TensorInfo& output,
682 const SpaceToDepthDescriptor& descriptor,
683 Optional<std::string&> reasonIfUnsupported) const
684{
685 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSpaceToDepthWorkloadValidate,
686 reasonIfUnsupported,
687 input,
688 output,
689 descriptor);
690}
691
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100692bool NeonLayerSupport::IsSplitterSupported(const TensorInfo& input,
693 const ViewsDescriptor& descriptor,
694 Optional<std::string&> reasonIfUnsupported) const
695{
696 ignore_unused(descriptor);
697 return IsSupportedForDataTypeNeon(reasonIfUnsupported,
698 input.GetDataType(),
699 &TrueFunc<>,
700 &TrueFunc<>);
701}
702
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +0100703bool NeonLayerSupport::IsSplitterSupported(const TensorInfo& input,
704 const std::vector<std::reference_wrapper<TensorInfo>>& outputs,
705 const ViewsDescriptor& descriptor,
706 Optional<std::string&> reasonIfUnsupported) const
707{
708#if defined(ARMCOMPUTENEON_ENABLED)
709 // Split along the last dimension, cannot use sub-tensors
710 // as width and height of the sub-tensors do not match
711 // the width and height of the parent tensor
712 // in case of input with more than 2D.
713 std::set<unsigned int> splitAxis = ComputeSplitAxis(descriptor, input.GetShape());
714 if (descriptor.GetNumDimensions() > 2 && splitAxis.size() == 1 &&
715 *splitAxis.begin() == descriptor.GetNumDimensions() - 1 )
716 {
717 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSplitterWorkloadValidate,
718 reasonIfUnsupported,
719 input,
720 outputs,
721 *splitAxis.begin());
722 }
723#endif
724 for (auto output : outputs)
725 {
726 if (!input.IsTypeSpaceMatch(output)) // Cannot use sub-tensors if the types are not same space
727 {
728 SetValueChecked(reasonIfUnsupported, "Neon Splitter: Types and quantization parameters must match.");
729 return false;
730 }
731 }
732 return true;
733}
734
Matthew Jackson87f65ea2019-08-01 10:01:34 +0100735bool NeonLayerSupport::IsStackSupported(const std::vector<const TensorInfo*>& inputs,
736 const TensorInfo& output,
737 const StackDescriptor& descriptor,
738 Optional<std::string&> reasonIfUnsupported) const
739{
740 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonStackWorkloadValidate,
741 reasonIfUnsupported,
742 inputs,
743 output,
744 descriptor);
745}
746
FinnWilliamsArm1fa19192019-08-02 17:26:31 +0100747bool NeonLayerSupport::IsStridedSliceSupported(const TensorInfo& input,
748 const TensorInfo& output,
749 const StridedSliceDescriptor& descriptor,
750 Optional<std::string&> reasonIfUnsupported) const
751{
752 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonStridedSliceWorkloadValidate,
753 reasonIfUnsupported,
754 input,
755 output,
756 descriptor);
757}
758
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100759bool NeonLayerSupport::IsSubtractionSupported(const TensorInfo& input0,
760 const TensorInfo& input1,
761 const TensorInfo& output,
762 Optional<std::string&> reasonIfUnsupported) const
763{
764 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSubtractionWorkloadValidate,
765 reasonIfUnsupported,
766 input0,
767 input1,
768 output);
769}
770
Sadik Armagan581742d2019-08-12 14:11:37 +0100771bool NeonLayerSupport::IsTransposeConvolution2dSupported(const TensorInfo& input,
772 const TensorInfo& output,
773 const TransposeConvolution2dDescriptor& descriptor,
774 const TensorInfo& weights,
775 const Optional<TensorInfo>& biases,
776 Optional<std::string&> reasonIfUnsupported) const
777{
Aron Virginas-Tar710f6642019-11-27 14:48:32 +0000778 if (!IS_QUANT_MULTIPLIER_SUPPORTED(input, output, weights))
James Conroyb86a3822019-11-19 15:28:58 +0000779 {
780 return false;
781 }
782
Sadik Armagan581742d2019-08-12 14:11:37 +0100783 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonTransposeConvolution2dWorkloadValidate,
784 reasonIfUnsupported,
785 input,
786 output,
787 descriptor,
788 weights,
789 biases);
790}
791
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100792} // namespace armnn