blob: 968bce48c810b4502adebf12bfdf2c542aac32a1 [file] [log] [blame]
//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//
5
6#include "NeonBackend.hpp"
David Beck3e9e1152018-10-17 14:17:50 +01007#include "NeonBackendId.hpp"
Sadik Armagan045f6be2020-09-10 13:37:32 +01008#include "NeonBackendModelContext.hpp"
arovir01a0944792018-10-11 15:00:58 +01009#include "NeonWorkloadFactory.hpp"
David Beck111b5d92018-11-12 14:59:37 +000010#include "NeonLayerSupport.hpp"
Narumol Prangnawarat4e3e8182019-08-14 12:25:50 +010011#include "NeonTensorHandleFactory.hpp"
arovir01a0944792018-10-11 15:00:58 +010012
Matteo Martincighc601aa62019-10-29 15:03:22 +000013#include <armnn/BackendRegistry.hpp>
Mike Kelly07810fc2020-11-12 10:58:48 +000014#include <armnn/Descriptors.hpp>
Matteo Martincighc601aa62019-10-29 15:03:22 +000015
Mike Kelly07810fc2020-11-12 10:58:48 +000016#include <aclCommon/ArmComputeSubgraphUtils.hpp>
17#include <aclCommon/ArmComputeUtils.hpp>
Aron Virginas-Tar56055192018-11-12 18:10:43 +000018#include <aclCommon/BaseMemoryManager.hpp>
19
Matteo Martincighe5b8eb92019-11-28 15:45:42 +000020#include <armnn/backends/IBackendContext.hpp>
21#include <armnn/backends/IMemoryManager.hpp>
Aron Virginas-Tar56055192018-11-12 18:10:43 +000022
Jan Eilers3c9e0452020-04-10 13:00:44 +010023#include <armnn/utility/PolymorphicDowncast.hpp>
24
Francis Murtaghe8d7ccb2021-10-14 17:30:24 +010025#include <neon/workloads/NeonAdditionWorkload.hpp>
26#include <neon/workloads/NeonBatchNormalizationWorkload.hpp>
27#include <neon/workloads/NeonConvolution2dWorkload.hpp>
28#include <neon/workloads/NeonDepthwiseConvolutionWorkload.hpp>
29#include <neon/workloads/NeonDivisionWorkload.hpp>
30#include <neon/workloads/NeonFullyConnectedWorkload.hpp>
31#include <neon/workloads/NeonMultiplicationWorkload.hpp>
32#include <neon/workloads/NeonReduceWorkload.hpp>
33#include <neon/workloads/NeonSubtractionWorkload.hpp>
34#include <backendsCommon/DefaultAllocator.hpp>
Mike Kelly07810fc2020-11-12 10:58:48 +000035
David Beck263e3492018-11-09 14:46:40 +000036#include <Optimizer.hpp>
arovir01a0944792018-10-11 15:00:58 +010037
Mike Kelly07810fc2020-11-12 10:58:48 +000038#include <arm_compute/core/Types.h>
Aron Virginas-Tar56055192018-11-12 18:10:43 +000039#include <arm_compute/runtime/Allocator.h>
40
arovir014424b0a2018-10-04 10:46:04 +010041namespace armnn
42{
43
David Beck3cc9a622018-10-12 10:38:31 +010044const BackendId& NeonBackend::GetIdStatic()
arovir014424b0a2018-10-04 10:46:04 +010045{
David Beck3e9e1152018-10-17 14:17:50 +010046 static const BackendId s_Id{NeonBackendId()};
arovir014424b0a2018-10-04 10:46:04 +010047 return s_Id;
48}
49
Aron Virginas-Tar56055192018-11-12 18:10:43 +000050IBackendInternal::IMemoryManagerUniquePtr NeonBackend::CreateMemoryManager() const
arovir014424b0a2018-10-04 10:46:04 +010051{
Aron Virginas-Tar56055192018-11-12 18:10:43 +000052 return std::make_unique<NeonMemoryManager>(std::make_unique<arm_compute::Allocator>(),
Sadik Armagan13a9fa62019-04-26 16:04:34 +010053 BaseMemoryManager::MemoryAffinity::Offset);
Aron Virginas-Tar56055192018-11-12 18:10:43 +000054}
55
56IBackendInternal::IWorkloadFactoryPtr NeonBackend::CreateWorkloadFactory(
57 const IBackendInternal::IMemoryManagerSharedPtr& memoryManager) const
58{
59 return std::make_unique<NeonWorkloadFactory>(
Jan Eilers3c9e0452020-04-10 13:00:44 +010060 PolymorphicPointerDowncast<NeonMemoryManager>(memoryManager));
arovir014424b0a2018-10-04 10:46:04 +010061}
62
Narumol Prangnawarat4e3e8182019-08-14 12:25:50 +010063IBackendInternal::IWorkloadFactoryPtr NeonBackend::CreateWorkloadFactory(
Sadik Armagan04a72972020-09-14 15:44:18 +010064 const IBackendInternal::IMemoryManagerSharedPtr& memoryManager, const ModelOptions& modelOptions) const
65{
66 return std::make_unique<NeonWorkloadFactory>(
67 PolymorphicPointerDowncast<NeonMemoryManager>(memoryManager), CreateBackendSpecificModelContext(modelOptions));
68}
69
70IBackendInternal::IWorkloadFactoryPtr NeonBackend::CreateWorkloadFactory(
Narumol Prangnawarat4e3e8182019-08-14 12:25:50 +010071 class TensorHandleFactoryRegistry& tensorHandleFactoryRegistry) const
72{
73 auto memoryManager = std::make_shared<NeonMemoryManager>(std::make_unique<arm_compute::Allocator>(),
74 BaseMemoryManager::MemoryAffinity::Offset);
75
76 tensorHandleFactoryRegistry.RegisterMemoryManager(memoryManager);
Narumol Prangnawarat77400452022-01-13 17:43:41 +000077
78 auto factory = std::make_unique<NeonTensorHandleFactory>(memoryManager);
79 // Register copy and import factory pair
80 tensorHandleFactoryRegistry.RegisterCopyAndImportFactoryPair(factory->GetId(), factory->GetId());
81 // Register the factory
82 tensorHandleFactoryRegistry.RegisterFactory(std::move(factory));
83
Narumol Prangnawarat549cb7a2020-07-10 17:50:53 +010084
Narumol Prangnawarat4e3e8182019-08-14 12:25:50 +010085 return std::make_unique<NeonWorkloadFactory>(
Jan Eilers3c9e0452020-04-10 13:00:44 +010086 PolymorphicPointerDowncast<NeonMemoryManager>(memoryManager));
Narumol Prangnawarat4e3e8182019-08-14 12:25:50 +010087}
88
Sadik Armagan04a72972020-09-14 15:44:18 +010089IBackendInternal::IWorkloadFactoryPtr NeonBackend::CreateWorkloadFactory(
90 TensorHandleFactoryRegistry& tensorHandleFactoryRegistry, const ModelOptions& modelOptions) const
91{
92 auto memoryManager = std::make_shared<NeonMemoryManager>(std::make_unique<arm_compute::Allocator>(),
93 BaseMemoryManager::MemoryAffinity::Offset);
94
95 tensorHandleFactoryRegistry.RegisterMemoryManager(memoryManager);
Narumol Prangnawarat77400452022-01-13 17:43:41 +000096
97 auto factory = std::make_unique<NeonTensorHandleFactory>(memoryManager);
98 // Register copy and import factory pair
99 tensorHandleFactoryRegistry.RegisterCopyAndImportFactoryPair(factory->GetId(), factory->GetId());
100 // Register the factory
101 tensorHandleFactoryRegistry.RegisterFactory(std::move(factory));
Sadik Armagan04a72972020-09-14 15:44:18 +0100102
103 return std::make_unique<NeonWorkloadFactory>(
104 PolymorphicPointerDowncast<NeonMemoryManager>(memoryManager), CreateBackendSpecificModelContext(modelOptions));
105}
106
David Beck263e3492018-11-09 14:46:40 +0000107IBackendInternal::IBackendContextPtr NeonBackend::CreateBackendContext(const IRuntime::CreationOptions&) const
108{
109 return IBackendContextPtr{};
110}
111
Colm Donelane49755b2020-01-29 15:22:43 +0000112IBackendInternal::IBackendProfilingContextPtr NeonBackend::CreateBackendProfilingContext(
Colm Donelan1aff3932020-02-05 17:48:59 +0000113 const IRuntime::CreationOptions&, IBackendProfilingPtr&)
Colm Donelane49755b2020-01-29 15:22:43 +0000114{
115 return IBackendProfilingContextPtr{};
116}
117
Sadik Armagan045f6be2020-09-10 13:37:32 +0100118IBackendInternal::IBackendSpecificModelContextPtr NeonBackend::CreateBackendSpecificModelContext(
119 const ModelOptions& modelOptions) const
120{
121 return IBackendSpecificModelContextPtr{new NeonBackendModelContext{modelOptions}};
122}
123
David Beck111b5d92018-11-12 14:59:37 +0000124IBackendInternal::ILayerSupportSharedPtr NeonBackend::GetLayerSupport() const
125{
Sadik Armagan045f6be2020-09-10 13:37:32 +0100126 static ILayerSupportSharedPtr layerSupport
127 {
128 new NeonLayerSupport(IBackendInternal::IBackendSpecificModelContextPtr{})
129 };
130 return layerSupport;
131}
132
133IBackendInternal::ILayerSupportSharedPtr NeonBackend::GetLayerSupport(const ModelOptions& modelOptions) const
134{
135 static ILayerSupportSharedPtr layerSupport
136 {
137 new NeonLayerSupport(CreateBackendSpecificModelContext(modelOptions))
138 };
David Beck111b5d92018-11-12 14:59:37 +0000139 return layerSupport;
140}
141
Mike Kelly80512b02022-05-16 23:10:42 +0100142OptimizationViews NeonBackend::OptimizeSubgraphView(const SubgraphView& subgraph,
143 const ModelOptions& modelOptions) const
Matteo Martincighadddddb2019-01-24 14:06:23 +0000144{
Mike Kelly80512b02022-05-16 23:10:42 +0100145 OptimizationViews optimizationViews(modelOptions);
Matteo Martincighadddddb2019-01-24 14:06:23 +0000146
Francis Murtagh56ccf682021-12-13 18:48:12 +0000147 auto it = subgraph.endIConnectable();
Mike Kelly1ac690a2020-11-17 11:41:38 +0000148 std::map<LayerGuid, Layer*> untouched;
Mike Kelly07810fc2020-11-12 10:58:48 +0000149
Francis Murtagh56ccf682021-12-13 18:48:12 +0000150 while (it != subgraph.beginIConnectable())
Mike Kelly07810fc2020-11-12 10:58:48 +0000151 {
152 --it;
Francis Murtagh56ccf682021-12-13 18:48:12 +0000153 Layer& base = *(PolymorphicDowncast<Layer*>(*it));
Mike Kelly1ac690a2020-11-17 11:41:38 +0000154 untouched.insert({base.GetGuid(), &base});
155 }
156
Francis Murtagh56ccf682021-12-13 18:48:12 +0000157 it = subgraph.endIConnectable();
158 while (it != subgraph.beginIConnectable())
Mike Kelly1ac690a2020-11-17 11:41:38 +0000159 {
160 --it;
Francis Murtagh56ccf682021-12-13 18:48:12 +0000161 Layer& base = *(PolymorphicDowncast<Layer*>(*it));
Mike Kelly07810fc2020-11-12 10:58:48 +0000162
Matthew Sloyan5fc0fd62021-05-03 12:22:03 +0100163 // Fuse activation into previous layer if supported by backend
Mike Kelly07810fc2020-11-12 10:58:48 +0000164 if ((base.GetType() == LayerType::DepthwiseConvolution2d || base.GetType() == LayerType::Convolution2d
165 || base.GetType() == LayerType::BatchNormalization || base.GetType() == LayerType::FullyConnected
166 || base.GetType() == LayerType::Addition || base.GetType() == LayerType::Multiplication
Matthew Sloyanae123062021-05-07 14:18:01 +0000167 || base.GetType() == LayerType::Subtraction || base.GetType() == LayerType::Division)
Mike Kelly07810fc2020-11-12 10:58:48 +0000168 && (base.GetAdditionalInformation<ActivationDescriptor>() == nullptr))
169 {
170 for (auto output = base.BeginOutputSlots(); output != base.EndOutputSlots(); ++output)
171 {
172 if (output->GetNumConnections() == 1)
173 {
174 for (auto&& childInput : output->GetConnections())
175 {
Teresa Charlind672f5d2021-01-18 18:07:57 +0000176 if ((childInput->GetOwningLayer().GetType() == LayerType::Activation) &&
177 (checkDataTypeInputandOutput(childInput->GetOwningLayer())))
Mike Kelly07810fc2020-11-12 10:58:48 +0000178 {
179 Layer& child = childInput->GetOwningLayer();
180
181 auto* activationLayer = PolymorphicDowncast<ActivationLayer*>(&child);
182
183 const std::string name = std::string("fused-") + child.GetName() + std::string("-into-") +
184 base.GetName();
185
186 // Get params from activation layer
187 ActivationDescriptor activationDesc = activationLayer->GetParameters();
188
189 if (base.GetType() == LayerType::Convolution2d)
190 {
191 Convolution2dLayer* baseLayer = PolymorphicDowncast<Convolution2dLayer*>(&base);
192
193 Optional<TensorInfo> biases;
194
195 if (baseLayer->GetParameters().m_BiasEnabled)
196 {
Keith Davisb4dd5cc2022-04-07 11:32:00 +0100197 biases = baseLayer->GetInputSlot(2).GetConnectedOutputSlot()->GetTensorInfo();
Mike Kelly07810fc2020-11-12 10:58:48 +0000198 }
199
200 arm_compute::Status status = NeonConvolution2dWorkloadValidate(
201 baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
202 activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
203 baseLayer->GetParameters(),
Keith Davisb4dd5cc2022-04-07 11:32:00 +0100204 baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
Mike Kelly07810fc2020-11-12 10:58:48 +0000205 biases,
206 false,
207 &activationDesc);
208
209 if (status)
210 {
Cathal Corbettcbfd7182021-12-15 17:12:59 +0000211 FuseConvolution2dLayer<Convolution2dLayer>(optimizationViews,
212 baseLayer,
213 activationLayer,
214 activationDesc,
215 name);
Mike Kelly1ac690a2020-11-17 11:41:38 +0000216 untouched.erase(baseLayer->GetGuid());
217 untouched.erase(activationLayer->GetGuid());
Mike Kelly07810fc2020-11-12 10:58:48 +0000218 }
219 }
220 else if (base.GetType() == LayerType::DepthwiseConvolution2d)
221 {
222 DepthwiseConvolution2dLayer* baseLayer =
223 PolymorphicDowncast<DepthwiseConvolution2dLayer*>(&base);
224
225 Optional<TensorInfo> biases;
226
227 if (baseLayer->GetParameters().m_BiasEnabled)
228 {
Cathal Corbett06902652022-04-14 17:55:11 +0100229 biases = baseLayer->GetInputSlot(2).GetConnectedOutputSlot()->GetTensorInfo();
Mike Kelly07810fc2020-11-12 10:58:48 +0000230 }
231
232 arm_compute::Status status = NeonDepthwiseConvolutionWorkloadValidate(
233 baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
234 activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
235 baseLayer->GetParameters(),
Cathal Corbett06902652022-04-14 17:55:11 +0100236 baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
Mike Kelly07810fc2020-11-12 10:58:48 +0000237 biases,
238 &activationDesc);
239
240 if (status)
241 {
Cathal Corbettcbfd7182021-12-15 17:12:59 +0000242 FuseDepthwiseConvolution2dLayer<DepthwiseConvolution2dLayer>(optimizationViews,
243 baseLayer,
244 activationLayer,
245 activationDesc,
246 name);
Mike Kelly1ac690a2020-11-17 11:41:38 +0000247 untouched.erase(baseLayer->GetGuid());
248 untouched.erase(activationLayer->GetGuid());
Mike Kelly07810fc2020-11-12 10:58:48 +0000249 }
250 }
251 else if (base.GetType() == LayerType::FullyConnected)
252 {
253 FullyConnectedLayer* baseLayer = PolymorphicDowncast<FullyConnectedLayer*>(&base);
Cathal Corbett4452baf2022-05-13 09:55:59 +0100254 FullyConnectedDescriptor descriptor = baseLayer->GetParameters();
Matthew Bentham67d63902022-02-08 15:03:07 +0000255
Cathal Corbett4452baf2022-05-13 09:55:59 +0100256 // As bias is optional only try to get TensorInfo from input if bias is enabled.
257 Optional<TensorInfo> biases;
258 if (descriptor.m_BiasEnabled)
Matthew Bentham67d63902022-02-08 15:03:07 +0000259 {
Cathal Corbett4452baf2022-05-13 09:55:59 +0100260 biases = baseLayer->GetInputSlot(2).GetConnectedOutputSlot()->GetTensorInfo();
Matthew Bentham67d63902022-02-08 15:03:07 +0000261 }
Mike Kelly07810fc2020-11-12 10:58:48 +0000262
263 arm_compute::Status status = NeonFullyConnectedWorkloadValidate(
264 baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
265 activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
Cathal Corbett4452baf2022-05-13 09:55:59 +0100266 baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
Matthew Bentham67d63902022-02-08 15:03:07 +0000267 biases,
Mike Kelly07810fc2020-11-12 10:58:48 +0000268 baseLayer->GetParameters(),
269 &activationDesc);
270
271 if (status)
272 {
Cathal Corbettcbfd7182021-12-15 17:12:59 +0000273 FuseFullyConnectedLayer<FullyConnectedLayer>(optimizationViews,
274 baseLayer,
275 activationLayer,
276 activationDesc,
277 name);
Mike Kelly1ac690a2020-11-17 11:41:38 +0000278 untouched.erase(baseLayer->GetGuid());
279 untouched.erase(activationLayer->GetGuid());
Mike Kelly07810fc2020-11-12 10:58:48 +0000280 }
281 }
282 else if (base.GetType() == LayerType::BatchNormalization)
283 {
284 BatchNormalizationLayer* baseLayer =
285 PolymorphicDowncast<BatchNormalizationLayer*>(&base);
286
287 arm_compute::Status status = NeonBatchNormalizationValidate(
288 baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
289 activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
290 baseLayer->m_Mean->GetTensorInfo(),
291 baseLayer->m_Variance->GetTensorInfo(),
292 baseLayer->m_Beta->GetTensorInfo(),
293 baseLayer->m_Gamma->GetTensorInfo(),
294 baseLayer->GetParameters(),
295 &activationDesc);
296
297 if (status)
298 {
299 BatchNormalizationLayer* replacementLayer =
Cathal Corbettcbfd7182021-12-15 17:12:59 +0000300 FuseBatchNormalizationLayer<BatchNormalizationLayer>(optimizationViews,
301 baseLayer,
302 activationLayer,
303 activationDesc,
304 name);
Mike Kelly07810fc2020-11-12 10:58:48 +0000305
306 replacementLayer->m_Beta = std::move(baseLayer->m_Beta);
307 replacementLayer->m_Gamma = std::move(baseLayer->m_Gamma);
308 replacementLayer->m_Mean = std::move(baseLayer->m_Mean);
309 replacementLayer->m_Variance = std::move(baseLayer->m_Variance);
Mike Kelly1ac690a2020-11-17 11:41:38 +0000310 untouched.erase(baseLayer->GetGuid());
311 untouched.erase(activationLayer->GetGuid());
Mike Kelly07810fc2020-11-12 10:58:48 +0000312 }
313 }
314 else if (base.GetType() == LayerType::Addition)
315 {
316 AdditionLayer* baseLayer = PolymorphicDowncast<AdditionLayer*>(&base);
317
318 arm_compute::Status status = NeonAdditionWorkloadValidate(
319 baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
320 baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
321 activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
322 &activationDesc);
323
324 if (status)
325 {
Cathal Corbettcbfd7182021-12-15 17:12:59 +0000326 FuseAdditionLayer<AdditionLayer>(optimizationViews,
327 baseLayer,
328 activationLayer,
329 activationDesc,
330 name);
Mike Kelly1ac690a2020-11-17 11:41:38 +0000331 untouched.erase(baseLayer->GetGuid());
332 untouched.erase(activationLayer->GetGuid());
Mike Kelly07810fc2020-11-12 10:58:48 +0000333 }
334 }
335 else if (base.GetType() == LayerType::Division)
336 {
337 DivisionLayer* baseLayer = PolymorphicDowncast<DivisionLayer*>(&base);
338
339 arm_compute::Status status = NeonDivisionWorkloadValidate(
340 baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
341 baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
342 activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
343 &activationDesc);
344
345 if (status)
346 {
Cathal Corbettcbfd7182021-12-15 17:12:59 +0000347 FuseDivisionLayer<DivisionLayer>(optimizationViews,
348 baseLayer,
349 activationLayer,
350 activationDesc,
351 name);
Mike Kelly1ac690a2020-11-17 11:41:38 +0000352 untouched.erase(baseLayer->GetGuid());
353 untouched.erase(activationLayer->GetGuid());
Mike Kelly07810fc2020-11-12 10:58:48 +0000354 }
355 }
356 else if (base.GetType() == LayerType::Multiplication)
357 {
358 MultiplicationLayer* baseLayer = PolymorphicDowncast<MultiplicationLayer*>(&base);
359
360 arm_compute::Status status = NeonMultiplicationWorkloadValidate(
361 baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
362 baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
363 activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
364 &activationDesc);
365
366 if (status)
367 {
Cathal Corbettcbfd7182021-12-15 17:12:59 +0000368 FuseMultiplicationLayer<MultiplicationLayer>(optimizationViews,
369 baseLayer,
370 activationLayer,
371 activationDesc,
372 name);
Mike Kelly1ac690a2020-11-17 11:41:38 +0000373 untouched.erase(baseLayer->GetGuid());
374 untouched.erase(activationLayer->GetGuid());
Mike Kelly07810fc2020-11-12 10:58:48 +0000375 }
376 }
377 else if (base.GetType() == LayerType::Subtraction)
378 {
379 SubtractionLayer* baseLayer = PolymorphicDowncast<SubtractionLayer*>(&base);
380
381 arm_compute::Status status = NeonSubtractionWorkloadValidate(
382 baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
383 baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
384 activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
385 &activationDesc);
386
387 if (status)
388 {
Cathal Corbettcbfd7182021-12-15 17:12:59 +0000389 FuseSubtractionLayer<SubtractionLayer>(optimizationViews,
390 baseLayer,
391 activationLayer,
392 activationDesc,
393 name);
Mike Kelly1ac690a2020-11-17 11:41:38 +0000394 untouched.erase(baseLayer->GetGuid());
395 untouched.erase(activationLayer->GetGuid());
Mike Kelly07810fc2020-11-12 10:58:48 +0000396 }
397 }
398 }
399 }
400 }
401 }
402 }
Matthew Sloyan5fc0fd62021-05-03 12:22:03 +0100403
404 // Separate reduce layer with multiple axes into multiple reduce layers with 1 axis.
405 if (base.GetType() == LayerType::Reduce)
406 {
407 ReduceLayer* baseLayer = PolymorphicDowncast<ReduceLayer*>(&base);
408 ReduceDescriptor reduceDescriptor = baseLayer->GetParameters();
409
410 if (!reduceDescriptor.m_vAxis.empty() && reduceDescriptor.m_vAxis.size() > 1)
411 {
412 // Add new layers to the graph and connect them.
Francis Murtagh56ccf682021-12-13 18:48:12 +0000413 std::vector<IConnectableLayer*> layers = ChainReduceLayers<ReduceLayer>(optimizationViews,
414 baseLayer,
415 reduceDescriptor);
Matthew Sloyan5fc0fd62021-05-03 12:22:03 +0100416
417 // Replace existing baselayer with new subgraph.
418 ReplaceLayers<ReduceLayer>(optimizationViews, baseLayer, layers);
419 untouched.erase(baseLayer->GetGuid());
420 }
421 }
Mike Kelly07810fc2020-11-12 10:58:48 +0000422 }
423
424 if (optimizationViews.GetSubstitutions().empty())
425 {
426 optimizationViews.AddUntouchedSubgraph(SubgraphView(subgraph));
427 }
Mike Kelly1ac690a2020-11-17 11:41:38 +0000428 else
429 {
430 ReportUntouchedLayers(optimizationViews, untouched);
431 }
Matteo Martincighc3ba50e2019-05-22 14:28:16 +0100432
433 return optimizationViews;
Matteo Martincighadddddb2019-01-24 14:06:23 +0000434}
435
Narumol Prangnawarat4e3e8182019-08-14 12:25:50 +0100436std::vector<ITensorHandleFactory::FactoryId> NeonBackend::GetHandleFactoryPreferences() const
437{
Narumol Prangnawarat265e53e2020-10-30 16:06:55 +0000438 return std::vector<ITensorHandleFactory::FactoryId>() = { NeonTensorHandleFactory::GetIdStatic() };
Narumol Prangnawarat4e3e8182019-08-14 12:25:50 +0100439}
440
441void NeonBackend::RegisterTensorHandleFactories(class TensorHandleFactoryRegistry& registry)
442{
443 auto memoryManager = std::make_shared<NeonMemoryManager>(std::make_unique<arm_compute::Allocator>(),
444 BaseMemoryManager::MemoryAffinity::Offset);
445
446 registry.RegisterMemoryManager(memoryManager);
Narumol Prangnawarat77400452022-01-13 17:43:41 +0000447
448 auto factory = std::make_unique<NeonTensorHandleFactory>(memoryManager);
449 // Register copy and import factory pair
450 registry.RegisterCopyAndImportFactoryPair(factory->GetId(), factory->GetId());
451 // Register the factory
452 registry.RegisterFactory(std::move(factory));
Narumol Prangnawarat4e3e8182019-08-14 12:25:50 +0100453}
454
Francis Murtaghe8d7ccb2021-10-14 17:30:24 +0100455std::unique_ptr<ICustomAllocator> NeonBackend::GetDefaultAllocator() const
456{
457 return std::make_unique<DefaultAllocator>();
458}
459
460
Matthew Bentham42bad952018-12-17 09:23:36 +0000461} // namespace armnn