blob: cd4dca8edba05f9c4b0c91a2c83c1c623619e809 [file] [log] [blame]
//
// Copyright © 2017-2023 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//
5
6#include "NeonLayerSupport.hpp"
David Beck3e9e1152018-10-17 14:17:50 +01007#include "NeonBackendId.hpp"
Sadik Armagan045f6be2020-09-10 13:37:32 +01008#include "NeonBackendModelContext.hpp"
telsoa014fcda012018-03-09 14:13:49 +00009
Derek Lambertic77874a2020-04-28 13:34:56 +010010#include <armnn/Exceptions.hpp>
telsoa014fcda012018-03-09 14:13:49 +000011#include <armnn/Tensor.hpp>
Aron Virginas-Tarfc824312018-10-15 15:00:13 +010012#include <armnn/Types.hpp>
Matteo Martincighc601aa62019-10-29 15:03:22 +000013#include <armnn/BackendRegistry.hpp>
telsoa014fcda012018-03-09 14:13:49 +000014
Matteo Martincighc601aa62019-10-29 15:03:22 +000015#include <InternalTypes.hpp>
16#include <LayerSupportCommon.hpp>
Jan Eilers8eb25602020-03-09 12:13:48 +000017#include <armnn/utility/IgnoreUnused.hpp>
Sadik Armagan045f6be2020-09-10 13:37:32 +010018#include <armnn/utility/PolymorphicDowncast.hpp>
telsoa014fcda012018-03-09 14:13:49 +000019
Matteo Martincighd95e9062019-01-31 15:35:59 +000020#if defined(ARMCOMPUTENEON_ENABLED)
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +010021#include <aclCommon/ArmComputeUtils.hpp>
Aron Virginas-Tar710f6642019-11-27 14:48:32 +000022#include <aclCommon/ArmComputeTensorUtils.hpp>
Aron Virginas-Tar914e4db2019-09-09 13:36:45 +010023#include "workloads/NeonAbsWorkload.hpp"
Matthew Bentham955258d2018-12-10 10:48:52 +000024#include "workloads/NeonAdditionWorkload.hpp"
Nattapat Chaimanowongd4b70592018-10-12 11:21:49 +010025#include "workloads/NeonActivationWorkload.hpp"
James Conroyd47a0642019-09-17 14:22:06 +010026#include "workloads/NeonArgMinMaxWorkload.hpp"
Teresa Charlin0f86ecf2022-10-13 15:47:08 +010027#include "workloads/NeonBatchMatMulWorkload.hpp"
Matthew Benthamc48ac8c2018-12-12 16:15:59 +000028#include "workloads/NeonBatchNormalizationWorkload.hpp"
Mike Kelly56858022020-01-27 12:14:47 +000029#include "workloads/NeonBatchToSpaceNdWorkload.hpp"
Sadik Armagan48f011e2021-04-21 10:50:34 +010030#include "workloads/NeonCastWorkload.hpp"
Teresa Charline89dd692021-09-01 16:30:34 +010031#include "workloads/NeonChannelShuffleWorkload.hpp"
Teresa Charlincedd34f2020-03-30 11:17:30 +010032#include "workloads/NeonComparisonWorkload.hpp"
Teresa Charline89dd692021-09-01 16:30:34 +010033#include "workloads/NeonConcatWorkload.hpp"
Mike Kelly0886ac42020-04-27 09:55:40 +010034#include "workloads/NeonConstantWorkload.hpp"
Matthew Bentham34336f92023-04-27 12:13:50 +000035#include "workloads/NeonConvertFp16ToFp32Workload.hpp"
36#include "workloads/NeonConvertFp32ToFp16Workload.hpp"
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +010037#include "workloads/NeonConvolution2dWorkload.hpp"
Teresa Charlinec5f7d12021-10-22 17:15:00 +010038#include "workloads/NeonConvolution3dWorkload.hpp"
Aron Virginas-Tar2f00b742019-09-30 13:28:08 +010039#include "workloads/NeonDepthToSpaceWorkload.hpp"
Nattapat Chaimanowong77140882018-10-17 11:12:19 +010040#include "workloads/NeonDepthwiseConvolutionWorkload.hpp"
Narumol Prangnawarat01961a72019-05-30 16:47:12 +010041#include "workloads/NeonDequantizeWorkload.hpp"
Teresa Charline89dd692021-09-01 16:30:34 +010042#include "workloads/NeonExpWorkload.hpp"
Sadik Armagan0d4863d2019-10-09 14:26:32 +010043#include "workloads/NeonInstanceNormalizationWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010044#include "workloads/NeonL2NormalizationFloatWorkload.hpp"
Teresa Charlin50de4fa2021-05-31 18:47:33 +010045#include "workloads/NeonLogWorkload.hpp"
Keith Davis69e653f2020-07-02 11:49:26 +010046#include "workloads/NeonLogSoftmaxWorkload.hpp"
James Conroy177df1e2020-11-13 10:18:51 +000047#include "workloads/NeonLogicalAndWorkload.hpp"
48#include "workloads/NeonLogicalNotWorkload.hpp"
49#include "workloads/NeonLogicalOrWorkload.hpp"
Jan Eilersad5293a2019-07-08 09:57:55 +010050#include "workloads/NeonLstmFloatWorkload.hpp"
Nattapat Chaimanowong4e6597a2018-12-20 14:14:06 +000051#include "workloads/NeonMaximumWorkload.hpp"
Matthew Benthamfd899962018-12-31 15:49:42 +000052#include "workloads/NeonMeanWorkload.hpp"
Conor Kennedy54b21692019-01-09 07:57:38 +000053#include "workloads/NeonMinimumWorkload.hpp"
Conor Kennedyb99480b2019-03-08 08:24:41 +000054#include "workloads/NeonMultiplicationWorkload.hpp"
Pablo Telloe61f0712020-01-23 10:37:17 +000055#include "workloads/NeonDivisionWorkload.hpp"
Sadik Armaganac472102020-03-24 09:54:36 +000056#include "workloads/NeonNegWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010057#include "workloads/NeonNormalizationFloatWorkload.hpp"
58#include "workloads/NeonFullyConnectedWorkload.hpp"
Teresa Charlinf540eb82020-04-10 19:24:55 +010059#include "workloads/NeonGatherWorkload.hpp"
Teresa Charlinbd22c7d2022-04-26 18:14:12 +010060#include "workloads/NeonGatherNdWorkload.hpp"
Éanna Ó Catháin12055742019-01-25 10:01:40 +000061#include "workloads/NeonPadWorkload.hpp"
David Beck0dbe0ee2018-09-24 15:59:27 +010062#include "workloads/NeonPermuteWorkload.hpp"
Nattapat Chaimanowong5d2e7002018-10-12 16:03:56 +010063#include "workloads/NeonPooling2dWorkload.hpp"
Ryan OShea19e79422022-05-04 00:38:03 +010064#include "workloads/NeonPooling3dWorkload.hpp"
Nikhil Raj9b461482019-07-03 15:58:31 +010065#include "workloads/NeonPreluWorkload.hpp"
James Conroycc340932020-05-12 18:08:52 +010066#include "workloads/NeonQLstmWorkload.hpp"
Sadik Armaganfabc2892019-05-31 09:05:11 +010067#include "workloads/NeonQuantizeWorkload.hpp"
Francis Murtagh4fc3c482019-08-02 13:20:54 +010068#include "workloads/NeonQuantizedLstmWorkload.hpp"
Sadik Armagana2747482021-02-09 10:28:54 +000069#include "workloads/NeonReduceWorkload.hpp"
Kevin Maya023c402019-12-12 17:28:05 +000070#include "workloads/NeonReshapeWorkload.hpp"
Ellen Norris-Thompson37e68682019-07-15 14:23:30 +010071#include "workloads/NeonResizeWorkload.hpp"
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +010072#include "workloads/NeonRsqrtWorkload.hpp"
Teresa Charlin50de4fa2021-05-31 18:47:33 +010073#include "workloads/NeonSinWorkload.hpp"
josh minor036f02d2019-11-15 14:53:22 -060074#include "workloads/NeonSliceWorkload.hpp"
Sadik Armaganbe88a572020-04-30 11:39:37 +010075#include "workloads/NeonSoftmaxWorkload.hpp"
Mike Kelly0be3a882020-01-24 11:27:50 +000076#include "workloads/NeonSpaceToBatchNdWorkload.hpp"
Ellen Norris-Thompson29794572019-06-26 16:40:36 +010077#include "workloads/NeonSpaceToDepthWorkload.hpp"
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +010078#include "workloads/NeonSplitterWorkload.hpp"
Teresa Charlin06145cc2022-05-05 15:31:30 +010079#include "workloads/NeonSqrtWorkload.hpp"
Matthew Jackson87f65ea2019-08-01 10:01:34 +010080#include "workloads/NeonStackWorkload.hpp"
FinnWilliamsArm1fa19192019-08-02 17:26:31 +010081#include "workloads/NeonStridedSliceWorkload.hpp"
Conor Kennedyb99480b2019-03-08 08:24:41 +000082#include "workloads/NeonSubtractionWorkload.hpp"
Sadik Armagan581742d2019-08-12 14:11:37 +010083#include "workloads/NeonTransposeConvolution2dWorkload.hpp"
Mike Kellyc9ea45a2020-02-28 18:11:58 +000084#include "workloads/NeonTransposeWorkload.hpp"
Cathal Corbettfd5bec42022-03-03 15:13:23 +000085#include "workloads/NeonUnidirectionalSequenceLstmFloatWorkload.hpp"
Mike Kelly12994962022-04-21 11:57:09 +010086#include "workloads/NeonUnidirectionalSequenceLstmWorkload.hpp"
telsoa014fcda012018-03-09 14:13:49 +000087#endif
88
telsoa014fcda012018-03-09 14:13:49 +000089namespace armnn
90{
telsoa014fcda012018-03-09 14:13:49 +000091
Aron Virginas-Tarfc824312018-10-15 15:00:13 +010092namespace
arovir017ff76c52018-10-09 09:40:58 +010093{
telsoa014fcda012018-03-09 14:13:49 +000094
Cathal Corbett80f71a82022-12-20 18:25:40 +000095const TensorInfo OverrideDataType(const TensorInfo& info, Optional<DataType> type)
96{
97 if (!type)
98 {
99 return info;
100 }
101 return TensorInfo(info.GetShape(),
102 type.value(),
103 info.GetQuantizationScale(),
104 info.GetQuantizationOffset(),
105 info.IsConstant());
106}
107
Derek Lamberti901ea112019-12-10 22:07:09 +0000108template< typename ... Args>
109bool IsNeonBackendSupported(Optional<std::string&> reasonIfUnsupported, Args... args)
telsoa014fcda012018-03-09 14:13:49 +0000110{
Jan Eilers8eb25602020-03-09 12:13:48 +0000111 IgnoreUnused(reasonIfUnsupported, (args)...);
Matteo Martincighd95e9062019-01-31 15:35:59 +0000112#if defined(ARMCOMPUTENEON_ENABLED)
telsoa014fcda012018-03-09 14:13:49 +0000113 return true;
114#else
Derek Lamberti0790dce2019-04-15 18:37:35 +0100115 SetValueChecked(reasonIfUnsupported, "The armnn library has been built without NEON support");
telsoa014fcda012018-03-09 14:13:49 +0000116 return false;
117#endif
118}
119
telsoa01c577f2c2018-08-31 09:22:23 +0100120template<typename FloatFunc, typename Uint8Func, typename ... Params>
arovir01085f0a42018-10-08 14:48:19 +0100121bool IsSupportedForDataTypeNeon(Optional<std::string&> reasonIfUnsupported,
telsoa014fcda012018-03-09 14:13:49 +0000122 DataType dataType,
telsoa01c577f2c2018-08-31 09:22:23 +0100123 FloatFunc floatFuncPtr,
telsoa014fcda012018-03-09 14:13:49 +0000124 Uint8Func uint8FuncPtr,
125 Params&&... params)
126{
127 return IsNeonBackendSupported(reasonIfUnsupported) &&
128 IsSupportedForDataTypeGeneric(reasonIfUnsupported,
129 dataType,
130 floatFuncPtr,
telsoa01c577f2c2018-08-31 09:22:23 +0100131 floatFuncPtr,
telsoa014fcda012018-03-09 14:13:49 +0000132 uint8FuncPtr,
narpra01db2b1602019-01-23 15:23:11 +0000133 &FalseFunc<>,
kevmay012b4d88e2019-01-24 14:05:09 +0000134 &FalseFunc<>,
telsoa014fcda012018-03-09 14:13:49 +0000135 std::forward<Params>(params)...);
136}
137
#if defined(ARMCOMPUTENEON_ENABLED)
// Invokes an Arm Compute Library validate function and converts its status to a bool.
//
// `func` is called with the forwarded `args` and must return an arm_compute::Status.
// Returns true when the status error code is ErrorCode::OK. On failure, if the caller
// supplied `reasonIfUnsupported`, it is overwritten with the status error description.
template<class FuncType, class... Args>
inline bool IsWorkloadSupported(FuncType& func, Optional<std::string&> reasonIfUnsupported, Args&&... args)
{
    arm_compute::Status aclStatus = func(std::forward<Args>(args)...);
    const bool supported = (aclStatus.error_code() == arm_compute::ErrorCode::OK);
    if (!supported && reasonIfUnsupported)
    {
        reasonIfUnsupported.value() = aclStatus.error_description();
    }
    return supported;
}

// NEON build: expands to a `return` statement that validates through `func`.
// The macro leaves the enclosing function, so nothing after it in the same scope runs.
#define FORWARD_WORKLOAD_VALIDATE_FUNC(func, reasonIfUnsupported, ...) \
    return IsWorkloadSupported(func, reasonIfUnsupported, __VA_ARGS__);
#else
// Non-NEON build: `func` is not referenced; expands to a `return` of
// IsNeonBackendSupported, which reports that NEON support was not compiled in.
#define FORWARD_WORKLOAD_VALIDATE_FUNC(func, reasonIfUnsupported, ...) \
    return IsNeonBackendSupported(reasonIfUnsupported, __VA_ARGS__);
#endif
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100157} // anonymous namespace
158
Sadik Armagan045f6be2020-09-10 13:37:32 +0100159NeonLayerSupport::NeonLayerSupport(const IBackendInternal::IBackendSpecificModelContextPtr& modelContextPtr)
160 : m_ModelContextPtr(modelContextPtr)
161{
162}
163
164NeonLayerSupport::NeonLayerSupport()
165 : m_ModelContextPtr(nullptr)
166{
167}
168
Cathal Corbett80f71a82022-12-20 18:25:40 +0000169bool IsLayerTypeSupported(const LayerType& type,
170 const std::vector<TensorInfo>& infos,
171 const BaseDescriptor& descriptor,
172 const Optional<LstmInputParamsInfo>& lstmParamsInfo,
173 const Optional<QuantizedLstmInputParamsInfo>& quantizedLstmParamsInfo,
174 Optional<std::string&> reasonIfUnsupported,
175 const NeonLayerSupport& support)
Cathal Corbett34b429c2021-12-24 12:24:40 +0000176{
177 switch (type)
178 {
179 case LayerType::Activation:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000180 return support.IsActivationSupported(infos[0],
181 infos[1],
182 *(PolymorphicDowncast<const ActivationDescriptor*>(&descriptor)),
183 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000184 case LayerType::Addition:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000185 return support.IsAdditionSupported(infos[0], infos[1], infos[2], reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000186 case LayerType::ArgMinMax:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000187 return support.IsArgMinMaxSupported(infos[0],
188 infos[1],
189 *(PolymorphicDowncast<const ArgMinMaxDescriptor*>(&descriptor)),
190 reasonIfUnsupported);
Teresa Charlin0f86ecf2022-10-13 15:47:08 +0100191 case LayerType::BatchMatMul:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000192 return support.IsBatchMatMulSupported(infos[0],
193 infos[1],
194 infos[2],
195 *(PolymorphicDowncast<const BatchMatMulDescriptor*>(&descriptor)),
196 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000197 case LayerType::BatchNormalization:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000198 return support.IsBatchNormalizationSupported(infos[0],
199 infos[1],
200 infos[2],
201 infos[3],
202 infos[4],
203 infos[5],
204 *(PolymorphicDowncast<const
205 BatchNormalizationDescriptor*>(&descriptor)),
206 reasonIfUnsupported);
207 case LayerType::BatchToSpaceNd:
208 return support.IsBatchToSpaceNdSupported(infos[0],
209 infos[1],
210 *(PolymorphicDowncast<const
211 BatchToSpaceNdDescriptor*>(&descriptor)),
212 reasonIfUnsupported);
213 case LayerType::Cast:
214 return support.IsCastSupported(infos[0], infos[1], reasonIfUnsupported);
215 case LayerType::ChannelShuffle:
216 return support.IsChannelShuffleSupported(infos[0],
217 infos[1],
218 *(PolymorphicDowncast<const
219 ChannelShuffleDescriptor*>(&descriptor)),
220 reasonIfUnsupported);
221 case LayerType::Comparison:
222 return support.IsComparisonSupported(infos[0],
Cathal Corbett34b429c2021-12-24 12:24:40 +0000223 infos[1],
224 infos[2],
Cathal Corbett80f71a82022-12-20 18:25:40 +0000225 *(PolymorphicDowncast<const ComparisonDescriptor*>(&descriptor)),
Cathal Corbett34b429c2021-12-24 12:24:40 +0000226 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000227 case LayerType::Concat:
228 {
229 std::vector<const TensorInfo*> inputInfos;
230 for (uint32_t i = 0; i < (infos.size() - 1); i++)
231 {
232 inputInfos.push_back(&infos[i]);
233 }
Cathal Corbett80f71a82022-12-20 18:25:40 +0000234 return support.IsConcatSupported(inputInfos,
235 infos[infos.size() - 1],
236 *(PolymorphicDowncast<const OriginsDescriptor*>(&descriptor)),
237 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000238 }
239 case LayerType::Constant:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000240 return support.IsConstantSupported(infos[0], reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000241 case LayerType::ConvertFp16ToFp32:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000242 return support.IsConvertFp16ToFp32Supported(infos[0], infos[1], reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000243 case LayerType::ConvertFp32ToFp16:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000244 return support.IsConvertFp32ToFp16Supported(infos[0], infos[1], reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000245 case LayerType::Convolution2d:
246 {
247 if (infos.size() != 4)
248 {
249 throw InvalidArgumentException("Invalid number of TransposeConvolution2d TensorInfos. "
250 "TensorInfos should be of format: {input, output, weights, biases}.");
251 }
252
253 auto desc = *(PolymorphicDowncast<const Convolution2dDescriptor*>(&descriptor));
254 if (infos[3] == TensorInfo())
255 {
Cathal Corbett80f71a82022-12-20 18:25:40 +0000256 return support.IsConvolution2dSupported(infos[0],
257 infos[1],
258 desc,
259 infos[2],
260 EmptyOptional(),
261 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000262 }
263 else
264 {
Cathal Corbett80f71a82022-12-20 18:25:40 +0000265 return support.IsConvolution2dSupported(infos[0],
266 infos[1],
267 desc,
268 infos[2],
269 infos[3],
270 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000271 }
272 }
Cathal Corbett4952a3e2022-03-03 15:14:18 +0000273 case LayerType::Convolution3d:
274 {
275 if (infos.size() != 4)
276 {
277 throw InvalidArgumentException("Invalid number of Convolution3d TensorInfos. "
278 "TensorInfos should be of format: {input, output, weights, biases}.");
279 }
280
281 auto desc = *(PolymorphicDowncast<const Convolution3dDescriptor*>(&descriptor));
282 if (infos[3] == TensorInfo())
283 {
Cathal Corbett80f71a82022-12-20 18:25:40 +0000284 return support.IsConvolution3dSupported(infos[0],
285 infos[1],
286 desc,
287 infos[2],
288 EmptyOptional(),
289 reasonIfUnsupported);
Cathal Corbett4952a3e2022-03-03 15:14:18 +0000290 }
291 else
292 {
Cathal Corbett80f71a82022-12-20 18:25:40 +0000293 return support.IsConvolution3dSupported(infos[0],
294 infos[1],
295 desc,
296 infos[2],
297 infos[3],
298 reasonIfUnsupported);
Cathal Corbett4952a3e2022-03-03 15:14:18 +0000299 }
300 }
Cathal Corbett34b429c2021-12-24 12:24:40 +0000301 case LayerType::DepthToSpace:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000302 return support.IsDepthToSpaceSupported(infos[0],
303 infos[1],
304 *(PolymorphicDowncast<const DepthToSpaceDescriptor*>(&descriptor)),
305 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000306 case LayerType::DepthwiseConvolution2d:
307 {
308 if (infos.size() != 4)
309 {
310 throw InvalidArgumentException("Invalid number of DepthwiseConvolution2d TensorInfos. "
311 "TensorInfos should be of format: {input, output, weights, biases}.");
312 }
313
314 auto desc = *(PolymorphicDowncast<const DepthwiseConvolution2dDescriptor*>(&descriptor));
315 if (infos[3] == TensorInfo())
316 {
Cathal Corbett80f71a82022-12-20 18:25:40 +0000317 return support.IsDepthwiseConvolutionSupported(infos[0],
318 infos[1],
319 desc,
320 infos[2],
321 EmptyOptional(),
322 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000323 }
324 else
325 {
Cathal Corbett80f71a82022-12-20 18:25:40 +0000326 return support.IsDepthwiseConvolutionSupported(infos[0],
327 infos[1],
328 desc,
329 infos[2],
330 infos[3],
331 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000332 }
333 }
334 case LayerType::Dequantize:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000335 return support.IsDequantizeSupported(infos[0], infos[1], reasonIfUnsupported);
Cathal Corbett4952a3e2022-03-03 15:14:18 +0000336 case LayerType::DetectionPostProcess:
337 {
338 auto desc = *(PolymorphicDowncast<const DetectionPostProcessDescriptor*>(&descriptor));
Cathal Corbett80f71a82022-12-20 18:25:40 +0000339 return support.IsDetectionPostProcessSupported(infos[0],
340 infos[1],
341 infos[2],
342 infos[3],
343 infos[4],
344 infos[5],
345 infos[6],
346 desc,
347 reasonIfUnsupported);
Cathal Corbett4952a3e2022-03-03 15:14:18 +0000348 }
Cathal Corbett34b429c2021-12-24 12:24:40 +0000349 case LayerType::Division:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000350 return support.IsDivisionSupported(infos[0], infos[1], infos[2], reasonIfUnsupported);
Mike Kelly3ec30772023-03-08 13:47:17 +0000351 case LayerType::ElementwiseBinary:
352 {
353 auto desc = *(PolymorphicDowncast<const ElementwiseBinaryDescriptor *>(&descriptor));
354
355 switch (desc.m_Operation)
356 {
357 case BinaryOperation::Add:
358 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonAdditionWorkloadValidate,
359 reasonIfUnsupported,
360 infos[0],
361 infos[1],
362 infos[2],
363 nullptr);
364 case BinaryOperation::Div:
365 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDivisionWorkloadValidate,
366 reasonIfUnsupported,
367 infos[0],
368 infos[1],
369 infos[2],
370 nullptr);
371 case BinaryOperation::Maximum:
372 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMaximumWorkloadValidate,
373 reasonIfUnsupported,
374 infos[0],
375 infos[1],
376 infos[2]);
377 case BinaryOperation::Minimum:
378 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMinimumWorkloadValidate,
379 reasonIfUnsupported,
380 infos[0],
381 infos[1],
382 infos[2]);
383 case BinaryOperation::Mul:
384 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMultiplicationWorkloadValidate,
385 reasonIfUnsupported,
386 infos[0],
387 infos[1],
388 infos[2],
389 nullptr);
390 case BinaryOperation::Sub:
391 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSubtractionWorkloadValidate,
392 reasonIfUnsupported,
393 infos[0],
394 infos[1],
395 infos[2],
396 nullptr);
397 default:
398 return false;
399 }
400 }
Cathal Corbett34b429c2021-12-24 12:24:40 +0000401 case LayerType::ElementwiseUnary:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000402 return support.IsElementwiseUnarySupported(infos[0],
403 infos[1],
404 *(PolymorphicDowncast<const
405 ElementwiseUnaryDescriptor*>(&descriptor)),
406 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000407 case LayerType::Fill:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000408 return support.IsFillSupported(infos[0],
409 infos[1],
410 *(PolymorphicDowncast<const FillDescriptor*>(&descriptor)),
411 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000412 case LayerType::Floor:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000413 return support.IsFloorSupported(infos[0], infos[1], reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000414 case LayerType::FullyConnected:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000415 return support.IsFullyConnectedSupported(infos[0],
416 infos[1],
417 infos[2],
418 infos[3],
419 *(PolymorphicDowncast<const
420 FullyConnectedDescriptor*>(&descriptor)),
421 reasonIfUnsupported);
422 case LayerType::Gather:
423 return support.IsGatherSupported(infos[0],
Cathal Corbett34b429c2021-12-24 12:24:40 +0000424 infos[1],
425 infos[2],
Cathal Corbett80f71a82022-12-20 18:25:40 +0000426 *(PolymorphicDowncast<const GatherDescriptor*>(&descriptor)),
Cathal Corbett34b429c2021-12-24 12:24:40 +0000427 reasonIfUnsupported);
Teresa Charlinbd22c7d2022-04-26 18:14:12 +0100428 case LayerType::GatherNd:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000429 return support.IsGatherNdSupported(infos[0],
430 infos[1],
431 infos[2],
432 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000433 case LayerType::Input:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000434 return support.IsInputSupported(infos[0], reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000435 case LayerType::InstanceNormalization:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000436 return support.IsInstanceNormalizationSupported(infos[0],
437 infos[1],
438 *(PolymorphicDowncast<const
439 InstanceNormalizationDescriptor*>(&descriptor)),
440 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000441 case LayerType::L2Normalization:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000442 return support.IsL2NormalizationSupported(infos[0],
443 infos[1],
444 *(PolymorphicDowncast<const
445 L2NormalizationDescriptor*>(&descriptor)),
446 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000447 case LayerType::LogicalBinary:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000448 return support.IsLogicalBinarySupported(infos[0],
449 infos[1],
450 infos[2],
451 *(PolymorphicDowncast<const
452 LogicalBinaryDescriptor*>(&descriptor)),
453 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000454 case LayerType::LogSoftmax:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000455 return support.IsLogSoftmaxSupported(infos[0],
456 infos[1],
457 *(PolymorphicDowncast<const LogSoftmaxDescriptor*>(&descriptor)),
458 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000459 case LayerType::Lstm:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000460 return support.IsLstmSupported(infos[0],
461 infos[1],
462 infos[2],
463 infos[3],
464 infos[4],
465 infos[5],
466 infos[6],
467 *(PolymorphicDowncast<const LstmDescriptor*>(&descriptor)),
468 lstmParamsInfo.value(),
469 reasonIfUnsupported);
Cathal Corbett4952a3e2022-03-03 15:14:18 +0000470 case LayerType::Map:
471 return true;
Cathal Corbett34b429c2021-12-24 12:24:40 +0000472 case LayerType::Maximum:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000473 return support.IsMaximumSupported(infos[0], infos[1], infos[2], reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000474 case LayerType::Mean:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000475 return support.IsMeanSupported(infos[0],
476 infos[1],
477 *(PolymorphicDowncast<const MeanDescriptor*>(&descriptor)),
478 reasonIfUnsupported);
Cathal Corbett4952a3e2022-03-03 15:14:18 +0000479 case LayerType::MemCopy:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000480 return support.IsMemCopySupported(infos[0], infos[1], reasonIfUnsupported);
Cathal Corbett4952a3e2022-03-03 15:14:18 +0000481 case LayerType::MemImport:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000482 return support.IsMemImportSupported(infos[0], infos[1], reasonIfUnsupported);
Cathal Corbett4952a3e2022-03-03 15:14:18 +0000483 case LayerType::Merge:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000484 return support.IsMergeSupported(infos[0],
Cathal Corbett4952a3e2022-03-03 15:14:18 +0000485 infos[1],
486 infos[2],
487 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000488 case LayerType::Minimum:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000489 return support.IsMinimumSupported(infos[0], infos[1], infos[2], reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000490 case LayerType::Multiplication:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000491 return support.IsMultiplicationSupported(infos[0], infos[1], infos[2], reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000492 case LayerType::Normalization:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000493 return support.IsNormalizationSupported(infos[0],
494 infos[1],
495 *(PolymorphicDowncast<const
496 NormalizationDescriptor*>(&descriptor)),
497 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000498 case LayerType::Output:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000499 return support.IsOutputSupported(infos[0], reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000500 case LayerType::Pad:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000501 return support.IsPadSupported(infos[0],
502 infos[1],
503 *(PolymorphicDowncast<const PadDescriptor*>(&descriptor)),
504 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000505 case LayerType::Permute:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000506 return support.IsPermuteSupported(infos[0],
507 infos[1],
508 *(PolymorphicDowncast<const PermuteDescriptor*>(&descriptor)),
509 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000510 case LayerType::Pooling2d:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000511 return support.IsPooling2dSupported(infos[0],
512 infos[1],
513 *(PolymorphicDowncast<const Pooling2dDescriptor*>(&descriptor)),
514 reasonIfUnsupported);
Ryan OShea19e79422022-05-04 00:38:03 +0100515 case LayerType::Pooling3d:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000516 return support.IsPooling3dSupported(infos[0],
517 infos[1],
518 *(PolymorphicDowncast<const Pooling3dDescriptor*>(&descriptor)),
519 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000520 case LayerType::Prelu:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000521 return support.IsPreluSupported(infos[0], infos[1], infos[2], reasonIfUnsupported);
Cathal Corbett4952a3e2022-03-03 15:14:18 +0000522 case LayerType::QLstm:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000523 return support.IsQLstmSupported(infos[0],
Cathal Corbett34b429c2021-12-24 12:24:40 +0000524 infos[1],
525 infos[2],
526 infos[3],
527 infos[4],
Cathal Corbett80f71a82022-12-20 18:25:40 +0000528 infos[5],
529 *(PolymorphicDowncast<const QLstmDescriptor*>(&descriptor)),
530 lstmParamsInfo.value(),
Cathal Corbett34b429c2021-12-24 12:24:40 +0000531 reasonIfUnsupported);
Cathal Corbett80f71a82022-12-20 18:25:40 +0000532 case LayerType::Quantize:
533 return support.IsQuantizeSupported(infos[0], infos[1], reasonIfUnsupported);
534 case LayerType::QuantizedLstm:
535 return support.IsQuantizedLstmSupported(infos[0],
536 infos[1],
537 infos[2],
538 infos[3],
539 infos[4],
540 quantizedLstmParamsInfo.value(),
541 reasonIfUnsupported);
Cathal Corbett4952a3e2022-03-03 15:14:18 +0000542 case LayerType::Rank:
543 return true;
Cathal Corbett34b429c2021-12-24 12:24:40 +0000544 case LayerType::Reshape:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000545 return support.IsReshapeSupported(infos[0],
546 infos[1],
547 *(PolymorphicDowncast<const ReshapeDescriptor*>(&descriptor)),
548 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000549 case LayerType::Resize:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000550 return support.IsResizeSupported(infos[0],
Cathal Corbett34b429c2021-12-24 12:24:40 +0000551 infos[1],
Cathal Corbett80f71a82022-12-20 18:25:40 +0000552 *(PolymorphicDowncast<const ResizeDescriptor*>(&descriptor)),
Cathal Corbett34b429c2021-12-24 12:24:40 +0000553 reasonIfUnsupported);
Cathal Corbett80f71a82022-12-20 18:25:40 +0000554 case LayerType::Reduce:
555 return support.IsReduceSupported(infos[0],
556 infos[1],
557 *(PolymorphicDowncast<const ReduceDescriptor*>(&descriptor)),
558 reasonIfUnsupported);
559 case LayerType::Shape:
560 return support.IsShapeSupported(infos[0],
561 infos[1],
562 reasonIfUnsupported);
563 case LayerType::Slice:
564 return support.IsSliceSupported(infos[0],
565 infos[1],
566 *(PolymorphicDowncast<const SliceDescriptor*>(&descriptor)),
567 reasonIfUnsupported);
568 case LayerType::Softmax:
569 return support.IsSoftmaxSupported(infos[0],
570 infos[1],
571 *(PolymorphicDowncast<const SoftmaxDescriptor*>(&descriptor)),
572 reasonIfUnsupported);
573 case LayerType::SpaceToBatchNd:
574 return support.IsSpaceToBatchNdSupported(infos[0],
575 infos[1],
576 *(PolymorphicDowncast<const
577 SpaceToBatchNdDescriptor*>(&descriptor)),
578 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000579 case LayerType::SpaceToDepth:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000580 return support.IsSpaceToDepthSupported(infos[0],
581 infos[1],
582 *(PolymorphicDowncast<const SpaceToDepthDescriptor*>(&descriptor)),
583 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000584 case LayerType::Splitter:
585 {
586 std::vector<TensorInfo> outputInfos;
587 for (uint32_t i = 1; i < infos.size(); i++)
588 {
589 outputInfos.push_back(infos[i]);
590 }
Cathal Corbett80f71a82022-12-20 18:25:40 +0000591 return support.IsSplitterSupported(infos[0],
592 {outputInfos.begin(), outputInfos.end()},
593 *(PolymorphicDowncast<const ViewsDescriptor*>(&descriptor)),
594 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000595 }
596 case LayerType::Stack:
597 {
598 std::vector<const TensorInfo*> inputInfos;
599 for (uint32_t i = 0; i < infos.size() - 1; i++)
600 {
601 inputInfos.push_back(&infos[i]);
602 }
Cathal Corbett80f71a82022-12-20 18:25:40 +0000603 return support.IsStackSupported(inputInfos,
604 infos[infos.size() - 1],
605 *(PolymorphicDowncast<const StackDescriptor*>(&descriptor)),
606 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000607 }
608 case LayerType::StridedSlice:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000609 return support.IsStridedSliceSupported(infos[0],
610 infos[1],
611 *(PolymorphicDowncast<const StridedSliceDescriptor*>(&descriptor)),
612 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000613 case LayerType::Subtraction:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000614 return support.IsSubtractionSupported(infos[0], infos[1], infos[2], reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000615 case LayerType::Transpose:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000616 return support.IsTransposeSupported(infos[0],
617 infos[1],
618 *(PolymorphicDowncast<const TransposeDescriptor*>(&descriptor)),
619 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000620 case LayerType::TransposeConvolution2d:
621 {
622 if (infos.size() != 4)
623 {
624 throw InvalidArgumentException("Invalid number of TransposeConvolution2d TensorInfos. "
625 "TensorInfos should be of format: {input, output, weights, biases}.");
626 }
627
628 auto desc = *(PolymorphicDowncast<const TransposeConvolution2dDescriptor*>(&descriptor));
629 if (infos[3] == TensorInfo())
630 {
Cathal Corbett80f71a82022-12-20 18:25:40 +0000631 return support.IsTransposeConvolution2dSupported(infos[0],
632 infos[1],
633 desc,
634 infos[2],
635 EmptyOptional(),
636 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000637 }
638 else
639 {
Cathal Corbett80f71a82022-12-20 18:25:40 +0000640 return support.IsTransposeConvolution2dSupported(infos[0],
641 infos[1],
642 desc,
643 infos[2],
644 infos[3],
645 reasonIfUnsupported);
Cathal Corbett34b429c2021-12-24 12:24:40 +0000646 }
647 }
Cathal Corbett4952a3e2022-03-03 15:14:18 +0000648 case LayerType::UnidirectionalSequenceLstm:
Cathal Corbett80f71a82022-12-20 18:25:40 +0000649 {
650 auto desc = *(PolymorphicDowncast<const UnidirectionalSequenceLstmDescriptor*>(&descriptor));
651 return support.IsUnidirectionalSequenceLstmSupported(infos[0],
652 infos[1],
653 infos[2],
654 infos[3],
655 infos[4],
656 infos[5],
657 desc,
658 lstmParamsInfo.value(),
659 reasonIfUnsupported);
660 }
Cathal Corbett34b429c2021-12-24 12:24:40 +0000661 case LayerType::Unmap:
662 return true;
Cathal Corbett34b429c2021-12-24 12:24:40 +0000663 default:
664 // layers not supported in neon by default:
Cathal Corbett4952a3e2022-03-03 15:14:18 +0000665 // debug, fakequantization, precompiled,
Ryan OShea19e79422022-05-04 00:38:03 +0100666 // standin, switch
Cathal Corbett34b429c2021-12-24 12:24:40 +0000667 return false;
668 }
669}
670
Cathal Corbett80f71a82022-12-20 18:25:40 +0000671bool NeonLayerSupport::IsLayerSupported(const LayerType& type,
672 const std::vector<TensorInfo>& infos,
673 const BaseDescriptor& descriptor,
674 const Optional<LstmInputParamsInfo>& lstmParamsInfo,
675 const Optional<QuantizedLstmInputParamsInfo>& quantizedLstmParamsInfo,
676 Optional<std::string&> reasonIfUnsupported) const
677{
678 bool isSupported = IsLayerTypeSupported(type,
679 infos,
680 descriptor,
681 lstmParamsInfo,
682 quantizedLstmParamsInfo,
683 reasonIfUnsupported,
684 *this);
685
686 // For android-nn-driver and support library, to run FP16 operations on CpuAcc we need at least v8.2
687 // architecture. If the available architecture is older than v8.2, we can check if the operator is
688 // supported by changing operator inputs & outputs to be FP32.
689 // This does not change the operator datatype in the above parsers to be FP32. We are simply reporting
690 // to the parsers if the operator can supported in ArmNN. We will then re-enter ArmNN (Network.cpp)
691 // where we will recheck IsLayerSupported() on the FP16 datatype, update the operator to be FP32,
692 // and, insert convert layers around the FP32 operator.
693 if (reasonIfUnsupported.has_value())
694 {
695 std::string checkStr = "This CPU architecture does not support F16 data type, you need v8.2 or above";
696 if (!isSupported
697 && reasonIfUnsupported.value().find(checkStr) != std::string::npos)
698 {
699 std::vector<TensorInfo> newInfos;
700 for (auto info: infos)
701 {
702 newInfos.emplace_back(OverrideDataType(info, DataType::Float32));
703 }
704
705 std::string tmpString;
706 return IsLayerTypeSupported(type,
707 newInfos,
708 descriptor,
709 lstmParamsInfo,
710 quantizedLstmParamsInfo,
711 tmpString,
712 *this);
713 }
714 }
715
716 return isSupported;
717}
718
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100719bool NeonLayerSupport::IsActivationSupported(const TensorInfo& input,
720 const TensorInfo& output,
721 const ActivationDescriptor& descriptor,
722 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000723{
Jan Eilers8eb25602020-03-09 12:13:48 +0000724 IgnoreUnused(descriptor);
telsoa01c577f2c2018-08-31 09:22:23 +0100725 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonActivationWorkloadValidate,
726 reasonIfUnsupported,
727 input,
728 output,
729 descriptor);
telsoa014fcda012018-03-09 14:13:49 +0000730}
731
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100732bool NeonLayerSupport::IsAdditionSupported(const TensorInfo& input0,
733 const TensorInfo& input1,
734 const TensorInfo& output,
735 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000736{
telsoa01c577f2c2018-08-31 09:22:23 +0100737 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonAdditionWorkloadValidate,
738 reasonIfUnsupported,
739 input0,
740 input1,
Mike Kelly07810fc2020-11-12 10:58:48 +0000741 output,
742 nullptr);
telsoa014fcda012018-03-09 14:13:49 +0000743}
744
James Conroyd47a0642019-09-17 14:22:06 +0100745bool NeonLayerSupport::IsArgMinMaxSupported(const TensorInfo& input,
746 const TensorInfo& output,
747 const ArgMinMaxDescriptor& descriptor,
748 Optional<std::string&> reasonIfUnsupported) const
749{
750 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonArgMinMaxWorkloadValidate,
751 reasonIfUnsupported,
752 input,
753 output,
754 descriptor);
755}
756
Teresa Charlin0f86ecf2022-10-13 15:47:08 +0100757bool NeonLayerSupport::IsBatchMatMulSupported(const TensorInfo& inputX,
758 const TensorInfo& inputY,
759 const TensorInfo& output,
760 const BatchMatMulDescriptor& descriptor,
761 Optional<std::string&> reasonIfUnsupported) const
762{
Teresa Charlin1fe6c812022-11-01 15:59:50 +0000763 bool isFastMathEnabled = false;
764#if defined(ARMCOMPUTENEON_ENABLED)
765 if (m_ModelContextPtr)
766 {
767 if (m_ModelContextPtr.get() != nullptr)
768 {
769 auto modelOptions = dynamic_cast<NeonBackendModelContext*>(m_ModelContextPtr.get());
770 if (modelOptions)
771 {
772 isFastMathEnabled = modelOptions->IsFastMathEnabled();
773 }
774 }
775 }
776#endif
Teresa Charlin0f86ecf2022-10-13 15:47:08 +0100777 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonBatchMatMulValidate,
778 reasonIfUnsupported,
779 inputX,
780 inputY,
781 output,
Teresa Charlin1fe6c812022-11-01 15:59:50 +0000782 descriptor,
783 isFastMathEnabled,
784 nullptr);
Teresa Charlin0f86ecf2022-10-13 15:47:08 +0100785}
786
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100787bool NeonLayerSupport::IsBatchNormalizationSupported(const TensorInfo& input,
788 const TensorInfo& output,
789 const TensorInfo& mean,
790 const TensorInfo& var,
791 const TensorInfo& beta,
792 const TensorInfo& gamma,
793 const BatchNormalizationDescriptor& descriptor,
794 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000795{
telsoa01c577f2c2018-08-31 09:22:23 +0100796 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonBatchNormalizationValidate,
797 reasonIfUnsupported,
798 input,
799 output,
800 mean,
801 var,
802 beta,
803 gamma,
Mike Kelly07810fc2020-11-12 10:58:48 +0000804 descriptor,
805 nullptr);
telsoa014fcda012018-03-09 14:13:49 +0000806}
807
Mike Kelly56858022020-01-27 12:14:47 +0000808bool NeonLayerSupport::IsBatchToSpaceNdSupported(const TensorInfo& input,
809 const TensorInfo& output,
810 const BatchToSpaceNdDescriptor& descriptor,
811 Optional<std::string&> reasonIfUnsupported) const
812{
813 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonBatchToSpaceNdWorkloadValidate,
814 reasonIfUnsupported,
815 input,
816 output,
817 descriptor);
818}
819
Sadik Armagan48f011e2021-04-21 10:50:34 +0100820bool NeonLayerSupport::IsCastSupported(const TensorInfo& input,
821 const TensorInfo& output,
822 Optional<std::string&> reasonIfUnsupported) const
823{
824 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonCastValidate,
825 reasonIfUnsupported,
826 input,
827 output);
828}
829
Teresa Charline89dd692021-09-01 16:30:34 +0100830bool NeonLayerSupport::IsChannelShuffleSupported(const TensorInfo& input,
831 const TensorInfo& output,
832 const ChannelShuffleDescriptor& descriptor,
833 Optional<std::string&> reasonIfUnsupported) const
834{
835 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonChannelShuffleValidate,
836 reasonIfUnsupported,
837 input,
838 output,
839 descriptor);
840}
841
Aron Virginas-Tar77bfb5e2019-10-16 17:45:38 +0100842bool NeonLayerSupport::IsComparisonSupported(const TensorInfo& input0,
843 const TensorInfo& input1,
844 const TensorInfo& output,
845 const ComparisonDescriptor& descriptor,
846 Optional<std::string&> reasonIfUnsupported) const
847{
Aron Virginas-Tar77bfb5e2019-10-16 17:45:38 +0100848
Teresa Charlincedd34f2020-03-30 11:17:30 +0100849 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonComparisonWorkloadValidate,
850 reasonIfUnsupported,
851 input0,
852 input1,
853 output,
854 descriptor);
Aron Virginas-Tar77bfb5e2019-10-16 17:45:38 +0100855}
856
Jim Flynn906f9462019-05-10 13:55:21 +0100857bool NeonLayerSupport::IsConcatSupported(const std::vector<const TensorInfo*> inputs,
858 const TensorInfo& output,
Cathal Corbett34b429c2021-12-24 12:24:40 +0000859 const OriginsDescriptor& descriptor,
Jim Flynn906f9462019-05-10 13:55:21 +0100860 Optional<std::string&> reasonIfUnsupported) const
861{
Jim Flynne242f2d2019-05-22 14:24:13 +0100862 if (descriptor.GetNumDimensions() <= descriptor.GetConcatAxis())
863 {
864 SetValueChecked(reasonIfUnsupported, "Neon Concat: Concat axis > Number of dimensions.");
865 return false;
866 }
867
868 unsigned int concatInnerAxis = (descriptor.GetNumDimensions() - descriptor.GetConcatAxis()) - 1;
869 if(concatInnerAxis < 3) // Width, height, or channels
870 {
871 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonConcatWorkloadValidate,
872 reasonIfUnsupported,
873 inputs,
874 output,
875 descriptor);
876 }
877 else if (concatInnerAxis == 3)
878 {
879 for (auto& input : inputs)
880 {
881 if (input && !output.IsTypeSpaceMatch(*input)) // Cannot use sub-tensors if the types are not same space
882 {
883 SetValueChecked(reasonIfUnsupported, "Neon Concat: Types and quantization parameters must match.");
884 return false;
885 }
886 }
887 return true; // Sub-tensors support concat along batch
888 }
889 else // > 4 dimensions not supported.
890 {
891 SetValueChecked(reasonIfUnsupported, "Neon Concat: Maximum of 4 dimensions supported.");
892 return false;
893 }
Jim Flynn906f9462019-05-10 13:55:21 +0100894}
895
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100896bool NeonLayerSupport::IsConstantSupported(const TensorInfo& output,
897 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000898{
Mike Kelly0886ac42020-04-27 09:55:40 +0100899 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonConstantWorkloadValidate,
900 reasonIfUnsupported,
901 output);
telsoa014fcda012018-03-09 14:13:49 +0000902}
903
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100904bool NeonLayerSupport::IsConvertFp16ToFp32Supported(const TensorInfo& input,
905 const TensorInfo& output,
906 Optional<std::string&> reasonIfUnsupported) const
907{
Matthew Bentham34336f92023-04-27 12:13:50 +0000908 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonConvertFp16ToFp32WorkloadValidate,
909 reasonIfUnsupported,
910 input,
911 output);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100912}
913
914bool NeonLayerSupport::IsConvertFp32ToFp16Supported(const TensorInfo& input,
915 const TensorInfo& output,
916 Optional<std::string&> reasonIfUnsupported) const
917{
Matthew Bentham34336f92023-04-27 12:13:50 +0000918 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonConvertFp32ToFp16WorkloadValidate,
919 reasonIfUnsupported,
920 input,
921 output);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +0100922}
923
924bool NeonLayerSupport::IsConvolution2dSupported(const TensorInfo& input,
925 const TensorInfo& output,
926 const Convolution2dDescriptor& descriptor,
927 const TensorInfo& weights,
928 const Optional<TensorInfo>& biases,
929 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +0000930{
Sadik Armagan045f6be2020-09-10 13:37:32 +0100931 bool isFastMathEnabled = false;
932#if defined(ARMCOMPUTENEON_ENABLED)
933 if (m_ModelContextPtr)
934 {
935 if (m_ModelContextPtr.get() != nullptr)
936 {
Sadik Armagan04a72972020-09-14 15:44:18 +0100937 auto modelOptions = dynamic_cast<NeonBackendModelContext*>(m_ModelContextPtr.get());
Sadik Armagan045f6be2020-09-10 13:37:32 +0100938 if (modelOptions)
939 {
940 isFastMathEnabled = modelOptions->IsFastMathEnabled();
941 }
942 }
943 }
944#endif
945
surmeh013537c2c2018-05-18 16:31:43 +0100946 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonConvolution2dWorkloadValidate,
947 reasonIfUnsupported,
948 input,
949 output,
950 descriptor,
951 weights,
Sadik Armagan045f6be2020-09-10 13:37:32 +0100952 biases,
Mike Kelly07810fc2020-11-12 10:58:48 +0000953 isFastMathEnabled,
954 nullptr);
telsoa014fcda012018-03-09 14:13:49 +0000955}
956
Teresa Charlinec5f7d12021-10-22 17:15:00 +0100957bool NeonLayerSupport::IsConvolution3dSupported(const TensorInfo& input,
958 const TensorInfo& output,
959 const Convolution3dDescriptor& descriptor,
960 const TensorInfo& weights,
961 const Optional<TensorInfo>& biases,
962 Optional<std::string&> reasonIfUnsupported) const
963{
964 bool isFastMathEnabled = false;
965#if defined(ARMCOMPUTENEON_ENABLED)
966 if (m_ModelContextPtr)
967 {
968 if (m_ModelContextPtr.get() != nullptr)
969 {
970 auto modelOptions = dynamic_cast<NeonBackendModelContext*>(m_ModelContextPtr.get());
971 if (modelOptions)
972 {
973 isFastMathEnabled = modelOptions->IsFastMathEnabled();
974 }
975 }
976 }
977#endif
978
979 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonConvolution3dWorkloadValidate,
980 reasonIfUnsupported,
981 input,
982 output,
983 descriptor,
984 weights,
985 biases,
986 isFastMathEnabled,
987 nullptr);
988}
989
Aron Virginas-Tar2f00b742019-09-30 13:28:08 +0100990bool NeonLayerSupport::IsDepthToSpaceSupported(const TensorInfo& input,
991 const TensorInfo& output,
992 const DepthToSpaceDescriptor& descriptor,
993 Optional<std::string&> reasonIfUnsupported) const
994{
995 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDepthToSpaceWorkloadValidate,
996 reasonIfUnsupported,
997 input,
998 output,
999 descriptor);
1000}
1001
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001002bool NeonLayerSupport::IsDepthwiseConvolutionSupported(const TensorInfo& input,
1003 const TensorInfo& output,
1004 const DepthwiseConvolution2dDescriptor& descriptor,
1005 const TensorInfo& weights,
1006 const Optional<TensorInfo>& biases,
1007 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +00001008{
telsoa01c577f2c2018-08-31 09:22:23 +01001009 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDepthwiseConvolutionWorkloadValidate,
1010 reasonIfUnsupported,
1011 input,
1012 output,
1013 descriptor,
1014 weights,
Mike Kelly07810fc2020-11-12 10:58:48 +00001015 biases,
1016 nullptr);
telsoa014fcda012018-03-09 14:13:49 +00001017}
1018
Narumol Prangnawarat01961a72019-05-30 16:47:12 +01001019bool NeonLayerSupport::IsDequantizeSupported(const TensorInfo& input,
1020 const TensorInfo& output,
1021 Optional<std::string&> reasonIfUnsupported) const
1022{
1023 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDequantizeWorkloadValidate,
1024 reasonIfUnsupported,
1025 input,
1026 output);
1027}
1028
Pablo Tellof0bd6832019-04-26 17:58:13 +01001029bool NeonLayerSupport::IsDilatedDepthwiseConvolutionSupported(const TensorInfo& input,
1030 const TensorInfo& output,
1031 const DepthwiseConvolution2dDescriptor& descriptor,
1032 const TensorInfo& weights,
1033 const Optional<TensorInfo>& biases,
1034 Optional<std::string&> reasonIfUnsupported) const
1035{
1036 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDepthwiseConvolutionWorkloadValidate,
1037 reasonIfUnsupported,
1038 input,
1039 output,
1040 descriptor,
1041 weights,
Mike Kelly07810fc2020-11-12 10:58:48 +00001042 biases,
1043 nullptr);
Pablo Tellof0bd6832019-04-26 17:58:13 +01001044}
1045
josh minor4a3c6102020-01-06 16:40:46 -06001046bool NeonLayerSupport::IsElementwiseUnarySupported(const TensorInfo& input,
1047 const TensorInfo& output,
1048 const ElementwiseUnaryDescriptor& descriptor,
1049 Optional<std::string&> reasonIfUnsupported) const
1050{
Derek Lambertic77874a2020-04-28 13:34:56 +01001051 switch(descriptor.m_Operation)
josh minor4a3c6102020-01-06 16:40:46 -06001052 {
Derek Lambertic77874a2020-04-28 13:34:56 +01001053 case UnaryOperation::Abs:
1054 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonAbsWorkloadValidate,
1055 reasonIfUnsupported,
1056 input,
1057 output);
1058 case UnaryOperation::Exp:
1059 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonExpWorkloadValidate,
1060 reasonIfUnsupported,
1061 input,
1062 output);
Teresa Charlin50de4fa2021-05-31 18:47:33 +01001063 case UnaryOperation::LogicalNot:
1064 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonLogicalNotWorkloadValidate,
1065 reasonIfUnsupported,
1066 input,
1067 output);
1068 case UnaryOperation::Log:
1069 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonLogWorkloadValidate,
1070 reasonIfUnsupported,
1071 input,
1072 output);
Derek Lambertic77874a2020-04-28 13:34:56 +01001073 case UnaryOperation::Neg:
1074 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonNegWorkloadValidate,
1075 reasonIfUnsupported,
1076 input,
1077 output);
1078 case UnaryOperation::Rsqrt:
1079 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonRsqrtWorkloadValidate,
1080 reasonIfUnsupported,
1081 input,
1082 output);
ryan.oshea3cff135b2021-10-07 15:28:14 +00001083 case UnaryOperation::Sin:
1084 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSinWorkloadValidate,
1085 reasonIfUnsupported,
1086 input,
1087 output);
Teresa Charlin06145cc2022-05-05 15:31:30 +01001088 case UnaryOperation::Sqrt:
1089 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSqrtWorkloadValidate,
1090 reasonIfUnsupported,
1091 input,
1092 output);
Derek Lambertic77874a2020-04-28 13:34:56 +01001093 default:
1094 return false;
josh minor4a3c6102020-01-06 16:40:46 -06001095 }
josh minor4a3c6102020-01-06 16:40:46 -06001096}
1097
Teresa Charlin4b10fef2020-07-29 09:36:41 +01001098bool NeonLayerSupport::IsFillSupported(const TensorInfo& input,
1099 const TensorInfo& output,
1100 const FillDescriptor& descriptor,
1101 Optional<std::string&> reasonIfUnsupported) const
Sadik Armagana792a052020-06-23 16:22:23 +01001102{
Teresa Charlin4b10fef2020-07-29 09:36:41 +01001103 armnn::IgnoreUnused(input);
1104 armnn::IgnoreUnused(output);
1105 armnn::IgnoreUnused(descriptor);
1106
1107 return IsNeonBackendSupported(reasonIfUnsupported);
Sadik Armagana792a052020-06-23 16:22:23 +01001108}
1109
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001110bool NeonLayerSupport::IsFloorSupported(const TensorInfo& input,
1111 const TensorInfo& output,
1112 Optional<std::string&> reasonIfUnsupported) const
1113{
Jan Eilers8eb25602020-03-09 12:13:48 +00001114 armnn::IgnoreUnused(output);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001115 return IsNeonBackendSupported(reasonIfUnsupported) &&
1116 IsSupportedForDataTypeGeneric(reasonIfUnsupported,
1117 input.GetDataType(),
1118 &FalseFuncF16<>,
1119 &TrueFunc<>,
narpra01db2b1602019-01-23 15:23:11 +00001120 &FalseFuncU8<>,
kevmay012b4d88e2019-01-24 14:05:09 +00001121 &FalseFuncI32<>,
1122 &FalseFuncU8<>);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001123}
1124
1125bool NeonLayerSupport::IsFullyConnectedSupported(const TensorInfo& input,
1126 const TensorInfo& output,
1127 const TensorInfo& weights,
1128 const TensorInfo& biases,
1129 const FullyConnectedDescriptor& descriptor,
1130 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +00001131{
telsoa01c577f2c2018-08-31 09:22:23 +01001132 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonFullyConnectedWorkloadValidate,
1133 reasonIfUnsupported,
1134 input,
1135 output,
1136 weights,
1137 biases,
Mike Kelly07810fc2020-11-12 10:58:48 +00001138 descriptor,
1139 nullptr);
telsoa014fcda012018-03-09 14:13:49 +00001140}
1141
Teresa Charlinf540eb82020-04-10 19:24:55 +01001142bool NeonLayerSupport::IsGatherSupported(const TensorInfo& input0,
1143 const TensorInfo& input1,
1144 const TensorInfo& output,
Teresa Charlin52664732020-06-29 16:27:03 +01001145 const GatherDescriptor& descriptor,
Teresa Charlinf540eb82020-04-10 19:24:55 +01001146 Optional<std::string&> reasonIfUnsupported) const
1147{
1148 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonGatherWorkloadValidate,
1149 reasonIfUnsupported,
1150 input0,
1151 input1,
Teresa Charlin52664732020-06-29 16:27:03 +01001152 output,
1153 descriptor);
Teresa Charlinf540eb82020-04-10 19:24:55 +01001154}
1155
Teresa Charlinbd22c7d2022-04-26 18:14:12 +01001156bool NeonLayerSupport::IsGatherNdSupported(const TensorInfo& input0,
1157 const TensorInfo& input1,
1158 const TensorInfo& output,
1159 Optional<std::string&> reasonIfUnsupported) const
1160{
1161 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonGatherNdWorkloadValidate,
1162 reasonIfUnsupported,
1163 input0,
1164 input1,
1165 output);
1166}
1167
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001168bool NeonLayerSupport::IsInputSupported(const TensorInfo& input,
1169 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +00001170{
Derek Lamberti901ea112019-12-10 22:07:09 +00001171 return IsNeonBackendSupported(reasonIfUnsupported, input);
telsoa014fcda012018-03-09 14:13:49 +00001172}
1173
Sadik Armagan0d4863d2019-10-09 14:26:32 +01001174bool NeonLayerSupport::IsInstanceNormalizationSupported(const TensorInfo& input,
1175 const TensorInfo& output,
1176 const InstanceNormalizationDescriptor& descriptor,
1177 Optional<std::string&> reasonIfUnsupported) const
1178{
1179 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonInstanceNormalizationWorkloadValidate,
1180 reasonIfUnsupported,
1181 input,
1182 output,
1183 descriptor);
1184}
1185
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001186bool NeonLayerSupport::IsL2NormalizationSupported(const TensorInfo& input,
1187 const TensorInfo& output,
1188 const L2NormalizationDescriptor& descriptor,
1189 Optional<std::string&> reasonIfUnsupported) const
telsoa014fcda012018-03-09 14:13:49 +00001190{
Matteo Martincighbcd3c852018-09-28 14:14:12 +01001191 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonL2NormalizationWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
telsoa014fcda012018-03-09 14:13:49 +00001192}
1193
James Conroy177df1e2020-11-13 10:18:51 +00001194bool NeonLayerSupport::IsLogicalBinarySupported(const TensorInfo& input0,
1195 const TensorInfo& input1,
1196 const TensorInfo& output,
1197 const LogicalBinaryDescriptor& descriptor,
1198 Optional<std::string&> reasonIfUnsupported) const
1199{
1200 switch(descriptor.m_Operation)
1201 {
1202 case LogicalBinaryOperation::LogicalAnd:
1203 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonLogicalAndWorkloadValidate,
1204 reasonIfUnsupported,
1205 input0,
1206 input1,
1207 output);
1208 case LogicalBinaryOperation::LogicalOr:
1209 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonLogicalOrWorkloadValidate,
1210 reasonIfUnsupported,
1211 input0,
1212 input1,
1213 output);
1214 default:
1215 return false;
1216 }
1217}
1218
Keith Davis69e653f2020-07-02 11:49:26 +01001219bool NeonLayerSupport::IsLogSoftmaxSupported(const TensorInfo& input,
1220 const TensorInfo& output,
1221 const LogSoftmaxDescriptor& descriptor,
1222 Optional<std::string&> reasonIfUnsupported) const
1223{
1224 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonLogSoftmaxWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
1225}
1226
Jan Eilersad5293a2019-07-08 09:57:55 +01001227bool NeonLayerSupport::IsLstmSupported(const TensorInfo& input,
1228 const TensorInfo& outputStateIn,
1229 const TensorInfo& cellStateIn,
1230 const TensorInfo& scratchBuffer,
1231 const TensorInfo& outputStateOut,
1232 const TensorInfo& cellStateOut,
1233 const TensorInfo& output,
1234 const LstmDescriptor& descriptor,
1235 const LstmInputParamsInfo& paramsInfo,
1236 Optional<std::string&> reasonIfUnsupported) const
1237{
1238 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonLstmFloatWorkloadValidate,
1239 reasonIfUnsupported,
1240 input,
1241 outputStateIn,
1242 cellStateIn,
1243 scratchBuffer,
1244 outputStateOut,
1245 cellStateOut,
1246 output,
1247 descriptor,
1248 paramsInfo);
1249}
1250
Nattapat Chaimanowong4e6597a2018-12-20 14:14:06 +00001251bool NeonLayerSupport::IsMaximumSupported(const TensorInfo& input0,
1252 const TensorInfo& input1,
1253 const TensorInfo& output,
1254 Optional<std::string&> reasonIfUnsupported) const
1255{
1256 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMaximumWorkloadValidate,
1257 reasonIfUnsupported,
1258 input0,
1259 input1,
1260 output);
1261}
1262
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001263bool NeonLayerSupport::IsMeanSupported(const TensorInfo& input,
1264 const TensorInfo& output,
1265 const MeanDescriptor& descriptor,
1266 Optional<std::string&> reasonIfUnsupported) const
narpra0132b90462018-09-13 11:07:48 +01001267{
Matthew Benthamfd899962018-12-31 15:49:42 +00001268 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMeanWorkloadValidate,
1269 reasonIfUnsupported,
1270 input,
1271 output,
1272 descriptor);
narpra0132b90462018-09-13 11:07:48 +01001273}
1274
Conor Kennedy54b21692019-01-09 07:57:38 +00001275bool NeonLayerSupport::IsMinimumSupported(const TensorInfo& input0,
1276 const TensorInfo& input1,
1277 const TensorInfo& output,
1278 Optional<std::string&> reasonIfUnsupported) const
1279{
1280 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMinimumWorkloadValidate,
1281 reasonIfUnsupported,
1282 input0,
1283 input1,
1284 output);
1285}
1286
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001287bool NeonLayerSupport::IsMultiplicationSupported(const TensorInfo& input0,
1288 const TensorInfo& input1,
1289 const TensorInfo& output,
1290 Optional<std::string&> reasonIfUnsupported) const
1291{
1292 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonMultiplicationWorkloadValidate,
1293 reasonIfUnsupported,
1294 input0,
1295 input1,
Mike Kelly07810fc2020-11-12 10:58:48 +00001296 output,
1297 nullptr);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001298}
1299
Pablo Telloe61f0712020-01-23 10:37:17 +00001300bool NeonLayerSupport::IsDivisionSupported(const TensorInfo& input0,
1301 const TensorInfo& input1,
1302 const TensorInfo& output,
1303 Optional<std::string&> reasonIfUnsupported) const
1304{
1305 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonDivisionWorkloadValidate,
1306 reasonIfUnsupported,
1307 input0,
1308 input1,
Mike Kelly07810fc2020-11-12 10:58:48 +00001309 output,
1310 nullptr);
Pablo Telloe61f0712020-01-23 10:37:17 +00001311}
1312
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001313bool NeonLayerSupport::IsNormalizationSupported(const TensorInfo& input,
1314 const TensorInfo& output,
1315 const NormalizationDescriptor& descriptor,
1316 Optional<std::string&> reasonIfUnsupported) const
1317{
1318 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonNormalizationWorkloadValidate,
1319 reasonIfUnsupported,
1320 input,
1321 output,
1322 descriptor);
1323}
1324
1325bool NeonLayerSupport::IsOutputSupported(const TensorInfo& output,
1326 Optional<std::string&> reasonIfUnsupported) const
1327{
Derek Lamberti901ea112019-12-10 22:07:09 +00001328 return IsNeonBackendSupported(reasonIfUnsupported, output);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001329}
1330
Éanna Ó Catháin12055742019-01-25 10:01:40 +00001331bool NeonLayerSupport::IsPadSupported(const TensorInfo& input,
1332 const TensorInfo& output,
1333 const PadDescriptor& descriptor,
1334 Optional<std::string&> reasonIfUnsupported) const
1335{
1336 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPadWorkloadValidate,
1337 reasonIfUnsupported,
1338 input,
1339 output,
1340 descriptor);
1341}
1342
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001343bool NeonLayerSupport::IsPermuteSupported(const TensorInfo& input,
1344 const TensorInfo& output,
1345 const PermuteDescriptor& descriptor,
1346 Optional<std::string&> reasonIfUnsupported) const
1347{
1348 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPermuteWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
telsoa014fcda012018-03-09 14:13:49 +00001349}
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001350
1351bool NeonLayerSupport::IsPooling2dSupported(const TensorInfo& input,
1352 const TensorInfo& output,
1353 const Pooling2dDescriptor& descriptor,
1354 Optional<std::string&> reasonIfUnsupported) const
1355{
1356 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPooling2dWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
1357}
1358
Ryan OShea19e79422022-05-04 00:38:03 +01001359bool NeonLayerSupport::IsPooling3dSupported(const TensorInfo& input,
1360 const TensorInfo& output,
1361 const Pooling3dDescriptor& descriptor,
1362 Optional<std::string&> reasonIfUnsupported) const
1363{
1364 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPooling3dWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
1365}
1366
Nikhil Raj9b461482019-07-03 15:58:31 +01001367bool NeonLayerSupport::IsPreluSupported(const armnn::TensorInfo &input,
1368 const armnn::TensorInfo &alpha,
1369 const armnn::TensorInfo &output,
1370 armnn::Optional<std::string &> reasonIfUnsupported) const
1371{
1372 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonPreluWorkloadValidate, reasonIfUnsupported, input, alpha, output);
1373}
1374
James Conroycc340932020-05-12 18:08:52 +01001375bool NeonLayerSupport::IsQLstmSupported(const TensorInfo& input,
1376 const TensorInfo& previousOutputIn,
1377 const TensorInfo& previousCellStateIn,
1378 const TensorInfo& outputStateOut,
1379 const TensorInfo& cellStateOut,
1380 const TensorInfo& output,
1381 const QLstmDescriptor& descriptor,
1382 const LstmInputParamsInfo& paramsInfo,
1383 Optional<std::string&> reasonIfUnsupported) const
1384{
1385 // Check required here in order to pass IsLayerSupported for datatypes tests
1386 if (input.GetDataType() == armnn::DataType::QAsymmS8 &&
1387 previousOutputIn.GetDataType() == armnn::DataType::QAsymmS8 &&
1388 previousCellStateIn.GetDataType() == armnn::DataType::QSymmS16 &&
1389 outputStateOut.GetDataType() == armnn::DataType::QAsymmS8 &&
1390 cellStateOut.GetDataType() == armnn::DataType::QSymmS16 &&
1391 output.GetDataType() == armnn::DataType::QAsymmS8)
1392 {
1393 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonQLstmWorkloadValidate,
1394 reasonIfUnsupported,
1395 input,
1396 previousCellStateIn,
1397 previousOutputIn,
1398 cellStateOut,
1399 outputStateOut,
1400 output,
1401 descriptor,
1402 paramsInfo);
1403 }
1404 else
1405 {
1406 return false;
1407 }
1408}
1409
Sadik Armaganfabc2892019-05-31 09:05:11 +01001410bool NeonLayerSupport::IsQuantizeSupported(const TensorInfo& input,
1411 const TensorInfo& output,
1412 Optional<std::string&> reasonIfUnsupported) const
1413{
1414 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonQuantizeWorkloadValidate,
1415 reasonIfUnsupported,
1416 input,
1417 output);
1418}
1419
Francis Murtagh4fc3c482019-08-02 13:20:54 +01001420bool NeonLayerSupport::IsQuantizedLstmSupported(const TensorInfo& input,
1421 const TensorInfo& cellStateIn,
1422 const TensorInfo& outputStateIn,
1423 const TensorInfo& cellStateOut,
1424 const TensorInfo& outputStateOut,
1425 const QuantizedLstmInputParamsInfo& paramsInfo,
1426 Optional<std::string&> reasonIfUnsupported) const
1427{
1428 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonQuantizedLstmWorkloadValidate,
1429 reasonIfUnsupported,
1430 input,
1431 cellStateIn,
1432 outputStateIn,
1433 cellStateOut,
1434 outputStateOut,
1435 paramsInfo);
1436}
1437
Sadik Armagana2747482021-02-09 10:28:54 +00001438bool NeonLayerSupport::IsReduceSupported(const TensorInfo& input,
1439 const TensorInfo& output,
1440 const ReduceDescriptor& descriptor,
1441 Optional<std::string&> reasonIfUnsupported) const
1442{
1443 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonReduceWorkloadValidate,
1444 reasonIfUnsupported,
1445 input,
1446 output,
1447 descriptor);
1448}
1449
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001450bool NeonLayerSupport::IsReshapeSupported(const TensorInfo& input,
Kevin Maya023c402019-12-12 17:28:05 +00001451 const TensorInfo& output,
Matteo Martincigh992d6dc2019-01-10 17:34:20 +00001452 const ReshapeDescriptor& descriptor,
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001453 Optional<std::string&> reasonIfUnsupported) const
1454{
Jan Eilers8eb25602020-03-09 12:13:48 +00001455 armnn::IgnoreUnused(descriptor);
Kevin Maya023c402019-12-12 17:28:05 +00001456 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonReshapeWorkloadValidate,
1457 reasonIfUnsupported,
1458 input,
1459 output);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001460}
1461
Aron Virginas-Tar169d2f12019-07-01 19:01:44 +01001462bool NeonLayerSupport::IsResizeSupported(const TensorInfo& input,
1463 const TensorInfo& output,
1464 const ResizeDescriptor& descriptor,
1465 Optional<std::string&> reasonIfUnsupported) const
1466{
Ellen Norris-Thompson37e68682019-07-15 14:23:30 +01001467 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonResizeWorkloadValidate,
1468 reasonIfUnsupported,
1469 input,
1470 output,
1471 descriptor);
Aron Virginas-Tar169d2f12019-07-01 19:01:44 +01001472}
1473
josh minor036f02d2019-11-15 14:53:22 -06001474bool NeonLayerSupport::IsSliceSupported(const TensorInfo& input,
1475 const TensorInfo& output,
1476 const SliceDescriptor& descriptor,
1477 Optional<std::string&> reasonIfUnsupported) const
1478{
1479 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSliceWorkloadValidate,
1480 reasonIfUnsupported,
1481 input,
1482 output,
1483 descriptor);
1484}
1485
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001486bool NeonLayerSupport::IsSoftmaxSupported(const TensorInfo& input,
1487 const TensorInfo& output,
1488 const SoftmaxDescriptor& descriptor,
1489 Optional<std::string&> reasonIfUnsupported) const
1490{
1491 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSoftmaxWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
1492}
1493
Mike Kelly0be3a882020-01-24 11:27:50 +00001494bool NeonLayerSupport::IsSpaceToBatchNdSupported(const TensorInfo& input,
1495 const TensorInfo& output,
1496 const SpaceToBatchNdDescriptor& descriptor,
1497 Optional<std::string&> reasonIfUnsupported) const
1498{
1499 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSpaceToBatchNdWorkloadValidate,
1500 reasonIfUnsupported,
1501 input,
1502 output,
1503 descriptor);
1504}
1505
Ellen Norris-Thompson29794572019-06-26 16:40:36 +01001506bool NeonLayerSupport::IsSpaceToDepthSupported(const TensorInfo& input,
Mike Kelly0be3a882020-01-24 11:27:50 +00001507 const TensorInfo& output,
1508 const SpaceToDepthDescriptor& descriptor,
1509 Optional<std::string&> reasonIfUnsupported) const
Ellen Norris-Thompson29794572019-06-26 16:40:36 +01001510{
1511 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSpaceToDepthWorkloadValidate,
1512 reasonIfUnsupported,
1513 input,
1514 output,
1515 descriptor);
1516}
1517
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001518bool NeonLayerSupport::IsSplitterSupported(const TensorInfo& input,
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +01001519 const std::vector<std::reference_wrapper<TensorInfo>>& outputs,
1520 const ViewsDescriptor& descriptor,
1521 Optional<std::string&> reasonIfUnsupported) const
1522{
1523#if defined(ARMCOMPUTENEON_ENABLED)
1524 // Split along the last dimension, cannot use sub-tensors
1525 // as width and height of the sub-tensors do not match
1526 // the width and height of the parent tensor
1527 // in case of input with more than 2D.
1528 std::set<unsigned int> splitAxis = ComputeSplitAxis(descriptor, input.GetShape());
1529 if (descriptor.GetNumDimensions() > 2 && splitAxis.size() == 1 &&
1530 *splitAxis.begin() == descriptor.GetNumDimensions() - 1 )
1531 {
1532 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSplitterWorkloadValidate,
1533 reasonIfUnsupported,
1534 input,
1535 outputs,
1536 *splitAxis.begin());
1537 }
1538#endif
Jan Eilers8eb25602020-03-09 12:13:48 +00001539 IgnoreUnused(descriptor);
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +01001540 for (auto output : outputs)
1541 {
1542 if (!input.IsTypeSpaceMatch(output)) // Cannot use sub-tensors if the types are not same space
1543 {
1544 SetValueChecked(reasonIfUnsupported, "Neon Splitter: Types and quantization parameters must match.");
1545 return false;
1546 }
1547 }
1548 return true;
1549}
1550
Matthew Jackson87f65ea2019-08-01 10:01:34 +01001551bool NeonLayerSupport::IsStackSupported(const std::vector<const TensorInfo*>& inputs,
1552 const TensorInfo& output,
1553 const StackDescriptor& descriptor,
1554 Optional<std::string&> reasonIfUnsupported) const
1555{
1556 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonStackWorkloadValidate,
1557 reasonIfUnsupported,
1558 inputs,
1559 output,
1560 descriptor);
1561}
1562
FinnWilliamsArm1fa19192019-08-02 17:26:31 +01001563bool NeonLayerSupport::IsStridedSliceSupported(const TensorInfo& input,
1564 const TensorInfo& output,
1565 const StridedSliceDescriptor& descriptor,
1566 Optional<std::string&> reasonIfUnsupported) const
1567{
1568 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonStridedSliceWorkloadValidate,
1569 reasonIfUnsupported,
1570 input,
1571 output,
1572 descriptor);
1573}
1574
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001575bool NeonLayerSupport::IsSubtractionSupported(const TensorInfo& input0,
1576 const TensorInfo& input1,
1577 const TensorInfo& output,
1578 Optional<std::string&> reasonIfUnsupported) const
1579{
1580 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonSubtractionWorkloadValidate,
1581 reasonIfUnsupported,
1582 input0,
1583 input1,
Mike Kelly07810fc2020-11-12 10:58:48 +00001584 output,
1585 nullptr);
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001586}
1587
Sadik Armagan581742d2019-08-12 14:11:37 +01001588bool NeonLayerSupport::IsTransposeConvolution2dSupported(const TensorInfo& input,
1589 const TensorInfo& output,
1590 const TransposeConvolution2dDescriptor& descriptor,
1591 const TensorInfo& weights,
1592 const Optional<TensorInfo>& biases,
1593 Optional<std::string&> reasonIfUnsupported) const
1594{
1595 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonTransposeConvolution2dWorkloadValidate,
1596 reasonIfUnsupported,
1597 input,
1598 output,
1599 descriptor,
1600 weights,
1601 biases);
1602}
1603
Mike Kellyc9ea45a2020-02-28 18:11:58 +00001604bool NeonLayerSupport::IsTransposeSupported(const TensorInfo& input,
1605 const TensorInfo& output,
1606 const TransposeDescriptor& descriptor,
1607 Optional<std::string&> reasonIfUnsupported) const
1608{
1609 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonTransposeWorkloadValidate, reasonIfUnsupported, input, output, descriptor);
1610}
1611
Cathal Corbettfd5bec42022-03-03 15:13:23 +00001612bool NeonLayerSupport::IsUnidirectionalSequenceLstmSupported(const TensorInfo& input,
1613 const TensorInfo& outputStateIn,
1614 const TensorInfo& cellStateIn,
Mike Kelly12994962022-04-21 11:57:09 +01001615 const TensorInfo& outputStateOut,
1616 const TensorInfo& cellStateOut,
Cathal Corbettfd5bec42022-03-03 15:13:23 +00001617 const TensorInfo& output,
Cathal Corbettfd5bec42022-03-03 15:13:23 +00001618 const UnidirectionalSequenceLstmDescriptor& descriptor,
1619 const LstmInputParamsInfo& paramsInfo,
1620 Optional<std::string&> reasonIfUnsupported) const
1621{
Mike Kelly12994962022-04-21 11:57:09 +01001622 if (input.GetDataType() == armnn::DataType::QAsymmS8 &&
1623 outputStateIn.GetDataType() == armnn::DataType::QAsymmS8 &&
1624 cellStateIn.GetDataType() == armnn::DataType::QSymmS16 &&
1625 outputStateOut.GetDataType() == armnn::DataType::QAsymmS8 &&
1626 cellStateOut.GetDataType() == armnn::DataType::QSymmS16 &&
1627 output.GetDataType() == armnn::DataType::QAsymmS8)
1628 {
1629 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonUnidirectionalSequenceLstmWorkloadValidate,
1630 reasonIfUnsupported,
1631 input,
1632 outputStateIn,
1633 cellStateIn,
1634 outputStateOut,
1635 cellStateOut,
1636 output,
1637 descriptor,
1638 paramsInfo);
1639 }
1640 else
1641 {
1642 FORWARD_WORKLOAD_VALIDATE_FUNC(NeonUnidirectionalSequenceLstmFloatWorkloadValidate,
1643 reasonIfUnsupported,
1644 input,
1645 outputStateIn,
1646 cellStateIn,
1647 outputStateOut,
1648 cellStateOut,
1649 output,
1650 descriptor,
1651 paramsInfo);
1652 }
Cathal Corbettfd5bec42022-03-03 15:13:23 +00001653}
1654
Aron Virginas-Tarfc824312018-10-15 15:00:13 +01001655} // namespace armnn