blob: b5719db007fa7e5498b35b1f8e856eeb7d8bbcaa [file] [log] [blame]
arovir014424b0a2018-10-04 10:46:04 +01001//
Mike Kelly3ec30772023-03-08 13:47:17 +00002// Copyright © 2017-2023 Arm Ltd and Contributors. All rights reserved.
arovir014424b0a2018-10-04 10:46:04 +01003// SPDX-License-Identifier: MIT
4//
5
6#include "NeonBackend.hpp"
David Beck3e9e1152018-10-17 14:17:50 +01007#include "NeonBackendId.hpp"
Sadik Armagan045f6be2020-09-10 13:37:32 +01008#include "NeonBackendModelContext.hpp"
arovir01a0944792018-10-11 15:00:58 +01009#include "NeonWorkloadFactory.hpp"
David Beck111b5d92018-11-12 14:59:37 +000010#include "NeonLayerSupport.hpp"
Narumol Prangnawarat4e3e8182019-08-14 12:25:50 +010011#include "NeonTensorHandleFactory.hpp"
arovir01a0944792018-10-11 15:00:58 +010012
Matteo Martincighc601aa62019-10-29 15:03:22 +000013#include <armnn/BackendRegistry.hpp>
Mike Kelly07810fc2020-11-12 10:58:48 +000014#include <armnn/Descriptors.hpp>
Matteo Martincighc601aa62019-10-29 15:03:22 +000015
Mike Kelly07810fc2020-11-12 10:58:48 +000016#include <aclCommon/ArmComputeSubgraphUtils.hpp>
17#include <aclCommon/ArmComputeUtils.hpp>
Aron Virginas-Tar56055192018-11-12 18:10:43 +000018#include <aclCommon/BaseMemoryManager.hpp>
19
Matteo Martincighe5b8eb92019-11-28 15:45:42 +000020#include <armnn/backends/IBackendContext.hpp>
21#include <armnn/backends/IMemoryManager.hpp>
Aron Virginas-Tar56055192018-11-12 18:10:43 +000022
Jan Eilers3c9e0452020-04-10 13:00:44 +010023#include <armnn/utility/PolymorphicDowncast.hpp>
24
Francis Murtaghe8d7ccb2021-10-14 17:30:24 +010025#include <neon/workloads/NeonAdditionWorkload.hpp>
26#include <neon/workloads/NeonBatchNormalizationWorkload.hpp>
27#include <neon/workloads/NeonConvolution2dWorkload.hpp>
28#include <neon/workloads/NeonDepthwiseConvolutionWorkload.hpp>
29#include <neon/workloads/NeonDivisionWorkload.hpp>
30#include <neon/workloads/NeonFullyConnectedWorkload.hpp>
31#include <neon/workloads/NeonMultiplicationWorkload.hpp>
32#include <neon/workloads/NeonReduceWorkload.hpp>
33#include <neon/workloads/NeonSubtractionWorkload.hpp>
34#include <backendsCommon/DefaultAllocator.hpp>
Mike Kelly07810fc2020-11-12 10:58:48 +000035
David Beck263e3492018-11-09 14:46:40 +000036#include <Optimizer.hpp>
arovir01a0944792018-10-11 15:00:58 +010037
Mike Kelly07810fc2020-11-12 10:58:48 +000038#include <arm_compute/core/Types.h>
Aron Virginas-Tar56055192018-11-12 18:10:43 +000039#include <arm_compute/runtime/Allocator.h>
40
arovir014424b0a2018-10-04 10:46:04 +010041namespace armnn
42{
43
David Beck3cc9a622018-10-12 10:38:31 +010044const BackendId& NeonBackend::GetIdStatic()
arovir014424b0a2018-10-04 10:46:04 +010045{
David Beck3e9e1152018-10-17 14:17:50 +010046 static const BackendId s_Id{NeonBackendId()};
arovir014424b0a2018-10-04 10:46:04 +010047 return s_Id;
48}
49
Aron Virginas-Tar56055192018-11-12 18:10:43 +000050IBackendInternal::IMemoryManagerUniquePtr NeonBackend::CreateMemoryManager() const
arovir014424b0a2018-10-04 10:46:04 +010051{
Aron Virginas-Tar56055192018-11-12 18:10:43 +000052 return std::make_unique<NeonMemoryManager>(std::make_unique<arm_compute::Allocator>(),
Sadik Armagan13a9fa62019-04-26 16:04:34 +010053 BaseMemoryManager::MemoryAffinity::Offset);
Aron Virginas-Tar56055192018-11-12 18:10:43 +000054}
55
56IBackendInternal::IWorkloadFactoryPtr NeonBackend::CreateWorkloadFactory(
57 const IBackendInternal::IMemoryManagerSharedPtr& memoryManager) const
58{
59 return std::make_unique<NeonWorkloadFactory>(
Jan Eilers3c9e0452020-04-10 13:00:44 +010060 PolymorphicPointerDowncast<NeonMemoryManager>(memoryManager));
arovir014424b0a2018-10-04 10:46:04 +010061}
62
Narumol Prangnawarat4e3e8182019-08-14 12:25:50 +010063IBackendInternal::IWorkloadFactoryPtr NeonBackend::CreateWorkloadFactory(
Sadik Armagan04a72972020-09-14 15:44:18 +010064 const IBackendInternal::IMemoryManagerSharedPtr& memoryManager, const ModelOptions& modelOptions) const
65{
66 return std::make_unique<NeonWorkloadFactory>(
67 PolymorphicPointerDowncast<NeonMemoryManager>(memoryManager), CreateBackendSpecificModelContext(modelOptions));
68}
69
70IBackendInternal::IWorkloadFactoryPtr NeonBackend::CreateWorkloadFactory(
Narumol Prangnawarat4e3e8182019-08-14 12:25:50 +010071 class TensorHandleFactoryRegistry& tensorHandleFactoryRegistry) const
72{
73 auto memoryManager = std::make_shared<NeonMemoryManager>(std::make_unique<arm_compute::Allocator>(),
74 BaseMemoryManager::MemoryAffinity::Offset);
75
76 tensorHandleFactoryRegistry.RegisterMemoryManager(memoryManager);
Narumol Prangnawarat77400452022-01-13 17:43:41 +000077
78 auto factory = std::make_unique<NeonTensorHandleFactory>(memoryManager);
79 // Register copy and import factory pair
80 tensorHandleFactoryRegistry.RegisterCopyAndImportFactoryPair(factory->GetId(), factory->GetId());
81 // Register the factory
82 tensorHandleFactoryRegistry.RegisterFactory(std::move(factory));
83
Narumol Prangnawarat549cb7a2020-07-10 17:50:53 +010084
Narumol Prangnawarat4e3e8182019-08-14 12:25:50 +010085 return std::make_unique<NeonWorkloadFactory>(
Jan Eilers3c9e0452020-04-10 13:00:44 +010086 PolymorphicPointerDowncast<NeonMemoryManager>(memoryManager));
Narumol Prangnawarat4e3e8182019-08-14 12:25:50 +010087}
88
Sadik Armagan04a72972020-09-14 15:44:18 +010089IBackendInternal::IWorkloadFactoryPtr NeonBackend::CreateWorkloadFactory(
90 TensorHandleFactoryRegistry& tensorHandleFactoryRegistry, const ModelOptions& modelOptions) const
91{
92 auto memoryManager = std::make_shared<NeonMemoryManager>(std::make_unique<arm_compute::Allocator>(),
93 BaseMemoryManager::MemoryAffinity::Offset);
94
95 tensorHandleFactoryRegistry.RegisterMemoryManager(memoryManager);
Narumol Prangnawarat77400452022-01-13 17:43:41 +000096
97 auto factory = std::make_unique<NeonTensorHandleFactory>(memoryManager);
98 // Register copy and import factory pair
99 tensorHandleFactoryRegistry.RegisterCopyAndImportFactoryPair(factory->GetId(), factory->GetId());
100 // Register the factory
101 tensorHandleFactoryRegistry.RegisterFactory(std::move(factory));
Sadik Armagan04a72972020-09-14 15:44:18 +0100102
103 return std::make_unique<NeonWorkloadFactory>(
104 PolymorphicPointerDowncast<NeonMemoryManager>(memoryManager), CreateBackendSpecificModelContext(modelOptions));
105}
106
David Beck263e3492018-11-09 14:46:40 +0000107IBackendInternal::IBackendContextPtr NeonBackend::CreateBackendContext(const IRuntime::CreationOptions&) const
108{
109 return IBackendContextPtr{};
110}
111
Colm Donelane49755b2020-01-29 15:22:43 +0000112IBackendInternal::IBackendProfilingContextPtr NeonBackend::CreateBackendProfilingContext(
Colm Donelan1aff3932020-02-05 17:48:59 +0000113 const IRuntime::CreationOptions&, IBackendProfilingPtr&)
Colm Donelane49755b2020-01-29 15:22:43 +0000114{
115 return IBackendProfilingContextPtr{};
116}
117
Sadik Armagan045f6be2020-09-10 13:37:32 +0100118IBackendInternal::IBackendSpecificModelContextPtr NeonBackend::CreateBackendSpecificModelContext(
119 const ModelOptions& modelOptions) const
120{
121 return IBackendSpecificModelContextPtr{new NeonBackendModelContext{modelOptions}};
122}
123
David Beck111b5d92018-11-12 14:59:37 +0000124IBackendInternal::ILayerSupportSharedPtr NeonBackend::GetLayerSupport() const
125{
Sadik Armagan045f6be2020-09-10 13:37:32 +0100126 static ILayerSupportSharedPtr layerSupport
127 {
128 new NeonLayerSupport(IBackendInternal::IBackendSpecificModelContextPtr{})
129 };
130 return layerSupport;
131}
132
133IBackendInternal::ILayerSupportSharedPtr NeonBackend::GetLayerSupport(const ModelOptions& modelOptions) const
134{
135 static ILayerSupportSharedPtr layerSupport
136 {
137 new NeonLayerSupport(CreateBackendSpecificModelContext(modelOptions))
138 };
David Beck111b5d92018-11-12 14:59:37 +0000139 return layerSupport;
140}
141
// Performs Neon-specific optimizations on the given subgraph:
//   1. Fuses a directly-following Activation layer into supported compute layers
//      (convolutions, fully connected, batch norm, elementwise arithmetic) whenever
//      the corresponding ACL workload validates the fused configuration.
//   2. Splits a Reduce layer with multiple axes into a chain of single-axis reductions.
//   3. Removes Reshape layers where it is safe to do so.
// Layers not consumed by any substitution are reported back as untouched.
OptimizationViews NeonBackend::OptimizeSubgraphView(const SubgraphView& subgraph,
                                                    const ModelOptions& modelOptions) const
{
    OptimizationViews optimizationViews(modelOptions);

    auto it = subgraph.end();
    // Layers (keyed by GUID) not yet absorbed by a fusion/substitution below.
    std::map<LayerGuid, Layer*> untouched;

    // First reverse walk: record every layer of the subgraph as initially untouched.
    while (it != subgraph.begin())
    {
        --it;
        Layer& base = *(PolymorphicDowncast<Layer*>(*it));
        untouched.insert({base.GetGuid(), &base});
    }

    // Second reverse walk: look for optimization opportunities layer by layer.
    it = subgraph.end();
    while (it != subgraph.begin())
    {
        --it;
        Layer& base = *(PolymorphicDowncast<Layer*>(*it));

        // Fuse activation into previous layer if supported by backend
        // (only when the base layer does not already carry a fused activation).
        if ((base.GetType() == LayerType::DepthwiseConvolution2d || base.GetType() == LayerType::Convolution2d
            || base.GetType() == LayerType::BatchNormalization || base.GetType() == LayerType::FullyConnected
            || base.GetType() == LayerType::Addition || base.GetType() == LayerType::Multiplication
            || base.GetType() == LayerType::Subtraction || base.GetType() == LayerType::Division
            || base.GetType() == LayerType::ElementwiseBinary)
            && (base.GetAdditionalInformation<ActivationDescriptor>() == nullptr))
        {
            for (auto output = base.BeginOutputSlots(); output != base.EndOutputSlots(); ++output)
            {
                // Only fuse when the activation is the sole consumer of this output.
                if (output->GetNumConnections() == 1)
                {
                    for (auto&& childInput : output->GetConnections())
                    {
                        if ((childInput->GetOwningLayer().GetType() == LayerType::Activation) &&
                            (checkDataTypeInputandOutput(childInput->GetOwningLayer())))
                        {
                            Layer& child = childInput->GetOwningLayer();

                            auto* activationLayer = PolymorphicDowncast<ActivationLayer*>(&child);

                            const std::string name = std::string("fused-") + child.GetName() + std::string("-into-") +
                                                     base.GetName();

                            // Get params from activation layer
                            ActivationDescriptor activationDesc = activationLayer->GetParameters();

                            if (base.GetType() == LayerType::Convolution2d)
                            {
                                Convolution2dLayer* baseLayer = PolymorphicDowncast<Convolution2dLayer*>(&base);

                                Optional<TensorInfo> biases;

                                if (baseLayer->GetParameters().m_BiasEnabled)
                                {
                                    biases = baseLayer->GetInputSlot(2).GetConnectedOutputSlot()->GetTensorInfo();
                                }

                                // Ask ACL whether conv2d + this activation is a valid fused workload.
                                arm_compute::Status status = NeonConvolution2dWorkloadValidate(
                                        baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                        activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                        baseLayer->GetParameters(),
                                        baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
                                        biases,
                                        false,
                                        &activationDesc);

                                if (status)
                                {
                                    FuseConvolution2dLayer<Convolution2dLayer>(optimizationViews,
                                                                               baseLayer,
                                                                               activationLayer,
                                                                               activationDesc,
                                                                               name);
                                    untouched.erase(baseLayer->GetGuid());
                                    untouched.erase(activationLayer->GetGuid());
                                }
                            }
                            else if (base.GetType() == LayerType::DepthwiseConvolution2d)
                            {
                                DepthwiseConvolution2dLayer* baseLayer =
                                    PolymorphicDowncast<DepthwiseConvolution2dLayer*>(&base);

                                Optional<TensorInfo> biases;

                                if (baseLayer->GetParameters().m_BiasEnabled)
                                {
                                    biases = baseLayer->GetInputSlot(2).GetConnectedOutputSlot()->GetTensorInfo();
                                }

                                arm_compute::Status status = NeonDepthwiseConvolutionWorkloadValidate(
                                        baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                        activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                        baseLayer->GetParameters(),
                                        baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
                                        biases,
                                        &activationDesc);

                                if (status)
                                {
                                    FuseDepthwiseConvolution2dLayer<DepthwiseConvolution2dLayer>(optimizationViews,
                                                                                                 baseLayer,
                                                                                                 activationLayer,
                                                                                                 activationDesc,
                                                                                                 name);
                                    untouched.erase(baseLayer->GetGuid());
                                    untouched.erase(activationLayer->GetGuid());
                                }
                            }
                            else if (base.GetType() == LayerType::FullyConnected)
                            {
                                FullyConnectedLayer* baseLayer = PolymorphicDowncast<FullyConnectedLayer*>(&base);
                                FullyConnectedDescriptor descriptor = baseLayer->GetParameters();

                                // As bias is optional only try to get TensorInfo from input if bias is enabled.
                                Optional<TensorInfo> biases;
                                if (descriptor.m_BiasEnabled)
                                {
                                    biases = baseLayer->GetInputSlot(2).GetConnectedOutputSlot()->GetTensorInfo();
                                }

                                arm_compute::Status status = NeonFullyConnectedWorkloadValidate(
                                        baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                        activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                        baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
                                        biases,
                                        baseLayer->GetParameters(),
                                        &activationDesc);

                                if (status)
                                {
                                    FuseFullyConnectedLayer<FullyConnectedLayer>(optimizationViews,
                                                                                 baseLayer,
                                                                                 activationLayer,
                                                                                 activationDesc,
                                                                                 name);
                                    untouched.erase(baseLayer->GetGuid());
                                    untouched.erase(activationLayer->GetGuid());
                                }
                            }
                            else if (base.GetType() == LayerType::BatchNormalization)
                            {
                                BatchNormalizationLayer* baseLayer =
                                    PolymorphicDowncast<BatchNormalizationLayer*>(&base);

                                arm_compute::Status status = NeonBatchNormalizationValidate(
                                        baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                        activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                        baseLayer->m_Mean->GetTensorInfo(),
                                        baseLayer->m_Variance->GetTensorInfo(),
                                        baseLayer->m_Beta->GetTensorInfo(),
                                        baseLayer->m_Gamma->GetTensorInfo(),
                                        baseLayer->GetParameters(),
                                        &activationDesc);

                                if (status)
                                {
                                    BatchNormalizationLayer* replacementLayer =
                                        FuseBatchNormalizationLayer<BatchNormalizationLayer>(optimizationViews,
                                                                                             baseLayer,
                                                                                             activationLayer,
                                                                                             activationDesc,
                                                                                             name);

                                    // The fused replacement takes ownership of the original
                                    // layer's constant tensors (mean/variance/beta/gamma).
                                    replacementLayer->m_Beta = std::move(baseLayer->m_Beta);
                                    replacementLayer->m_Gamma = std::move(baseLayer->m_Gamma);
                                    replacementLayer->m_Mean = std::move(baseLayer->m_Mean);
                                    replacementLayer->m_Variance = std::move(baseLayer->m_Variance);
                                    untouched.erase(baseLayer->GetGuid());
                                    untouched.erase(activationLayer->GetGuid());
                                }
                            }
                            else if (base.GetType() == LayerType::Addition)
                            {
                                AdditionLayer* baseLayer = PolymorphicDowncast<AdditionLayer*>(&base);

                                arm_compute::Status status = NeonAdditionWorkloadValidate(
                                        baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                        baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
                                        activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                        &activationDesc);

                                if (status)
                                {
                                    FuseAdditionLayer<AdditionLayer>(optimizationViews,
                                                                     baseLayer,
                                                                     activationLayer,
                                                                     activationDesc,
                                                                     name);
                                    untouched.erase(baseLayer->GetGuid());
                                    untouched.erase(activationLayer->GetGuid());
                                }
                            }
                            else if (base.GetType() == LayerType::Division)
                            {
                                DivisionLayer* baseLayer = PolymorphicDowncast<DivisionLayer*>(&base);

                                arm_compute::Status status = NeonDivisionWorkloadValidate(
                                        baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                        baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
                                        activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                        &activationDesc);

                                if (status)
                                {
                                    FuseDivisionLayer<DivisionLayer>(optimizationViews,
                                                                     baseLayer,
                                                                     activationLayer,
                                                                     activationDesc,
                                                                     name);
                                    untouched.erase(baseLayer->GetGuid());
                                    untouched.erase(activationLayer->GetGuid());
                                }
                            }
                            else if (base.GetType() == LayerType::Multiplication)
                            {
                                MultiplicationLayer* baseLayer = PolymorphicDowncast<MultiplicationLayer*>(&base);

                                arm_compute::Status status = NeonMultiplicationWorkloadValidate(
                                        baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                        baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
                                        activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                        &activationDesc);

                                if (status)
                                {
                                    FuseMultiplicationLayer<MultiplicationLayer>(optimizationViews,
                                                                                 baseLayer,
                                                                                 activationLayer,
                                                                                 activationDesc,
                                                                                 name);
                                    untouched.erase(baseLayer->GetGuid());
                                    untouched.erase(activationLayer->GetGuid());
                                }
                            }
                            else if (base.GetType() == LayerType::Subtraction)
                            {
                                SubtractionLayer* baseLayer = PolymorphicDowncast<SubtractionLayer*>(&base);

                                arm_compute::Status status = NeonSubtractionWorkloadValidate(
                                        baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                        baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
                                        activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                        &activationDesc);

                                if (status)
                                {
                                    FuseSubtractionLayer<SubtractionLayer>(optimizationViews,
                                                                           baseLayer,
                                                                           activationLayer,
                                                                           activationDesc,
                                                                           name);
                                    untouched.erase(baseLayer->GetGuid());
                                    untouched.erase(activationLayer->GetGuid());
                                }
                            }
                            else if (base.GetType() == LayerType::ElementwiseBinary)
                            {
                                ElementwiseBinaryLayer* baseLayer = PolymorphicDowncast<ElementwiseBinaryLayer*>(&base);

                                // Dispatch on the binary operation; each case reuses the
                                // matching dedicated-layer validate function.
                                if (baseLayer->GetParameters().m_Operation == BinaryOperation::Add)
                                {
                                    arm_compute::Status status = NeonAdditionWorkloadValidate(
                                            baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                            baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
                                            activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                            &activationDesc);

                                    if (status)
                                    {
                                        FuseElementwiseBinaryLayer<ElementwiseBinaryLayer>(optimizationViews,
                                                                                           baseLayer,
                                                                                           activationLayer,
                                                                                           activationDesc,
                                                                                           BinaryOperation::Add,
                                                                                           name);
                                        untouched.erase(baseLayer->GetGuid());
                                        untouched.erase(activationLayer->GetGuid());
                                    }
                                }
                                else if (baseLayer->GetParameters().m_Operation == BinaryOperation::Div)
                                {
                                    arm_compute::Status status = NeonDivisionWorkloadValidate(
                                            baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                            baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
                                            activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                            &activationDesc);

                                    if (status)
                                    {
                                        FuseElementwiseBinaryLayer<ElementwiseBinaryLayer>(optimizationViews,
                                                                                           baseLayer,
                                                                                           activationLayer,
                                                                                           activationDesc,
                                                                                           BinaryOperation::Div,
                                                                                           name);
                                        untouched.erase(baseLayer->GetGuid());
                                        untouched.erase(activationLayer->GetGuid());
                                    }
                                }
                                else if (baseLayer->GetParameters().m_Operation == BinaryOperation::Mul)
                                {
                                    arm_compute::Status status = NeonMultiplicationWorkloadValidate(
                                            baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                            baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
                                            activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                            &activationDesc);

                                    if (status)
                                    {
                                        FuseElementwiseBinaryLayer<ElementwiseBinaryLayer>(optimizationViews,
                                                                                           baseLayer,
                                                                                           activationLayer,
                                                                                           activationDesc,
                                                                                           BinaryOperation::Mul,
                                                                                           name);
                                        untouched.erase(baseLayer->GetGuid());
                                        untouched.erase(activationLayer->GetGuid());
                                    }
                                }
                                else if (baseLayer->GetParameters().m_Operation == BinaryOperation::Sub)
                                {
                                    arm_compute::Status status = NeonSubtractionWorkloadValidate(
                                            baseLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                            baseLayer->GetInputSlot(1).GetConnectedOutputSlot()->GetTensorInfo(),
                                            activationLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo(),
                                            &activationDesc);

                                    if (status)
                                    {
                                        FuseElementwiseBinaryLayer<ElementwiseBinaryLayer>(optimizationViews,
                                                                                           baseLayer,
                                                                                           activationLayer,
                                                                                           activationDesc,
                                                                                           BinaryOperation::Sub,
                                                                                           name);
                                        untouched.erase(baseLayer->GetGuid());
                                        untouched.erase(activationLayer->GetGuid());
                                    }
                                }
                                // No fusion available for other BinaryOperations
                            }
                        }
                    }
                }
            }
        }

        // Separate reduce layer with multiple axes into multiple reduce layers with 1 axis.
        if (base.GetType() == LayerType::Reduce)
        {
            ReduceLayer* baseLayer = PolymorphicDowncast<ReduceLayer*>(&base);
            ReduceDescriptor reduceDescriptor = baseLayer->GetParameters();

            if (!reduceDescriptor.m_vAxis.empty() && reduceDescriptor.m_vAxis.size() > 1)
            {
                // Add new layers to the graph and connect them.
                std::vector<IConnectableLayer*> layers = ChainReduceLayers<ReduceLayer>(optimizationViews,
                                                                                        baseLayer,
                                                                                        reduceDescriptor);

                // Replace existing baselayer with new subgraph.
                ReplaceLayers<ReduceLayer>(optimizationViews, baseLayer, layers);
                untouched.erase(baseLayer->GetGuid());
            }
        }

        // Remove Reshape where possible
        if (base.GetType() == LayerType::Reshape)
        {
            ReshapeLayer* baseLayer = PolymorphicDowncast<ReshapeLayer*>(&base);

            // Cannot remove a Reshape if it's connected to any layer that has an NCHW layout
            if (ConnectedToLayerWithNCHW(baseLayer))
            {
                continue;
            }
            // Cannot remove a Reshape if it's connected to a SplitterLayer
            if (ConnectedToLayerType(baseLayer, LayerType::Splitter))
            {
                continue;
            }
            RemoveReshapeLayer(baseLayer, untouched, optimizationViews);
        }
    }

    // Nothing was substituted or deleted: hand the whole subgraph back unchanged.
    // Otherwise report the leftover layers so the optimizer keeps them as-is.
    if (optimizationViews.GetSubstitutions().empty() && optimizationViews.GetDeletedSubgraphs().empty())
    {
        optimizationViews.AddUntouchedSubgraph(SubgraphView(subgraph));
    }
    else
    {
        ReportUntouchedLayers(optimizationViews, untouched);
    }

    return optimizationViews;
}
540
Narumol Prangnawarat4e3e8182019-08-14 12:25:50 +0100541std::vector<ITensorHandleFactory::FactoryId> NeonBackend::GetHandleFactoryPreferences() const
542{
Narumol Prangnawarat265e53e2020-10-30 16:06:55 +0000543 return std::vector<ITensorHandleFactory::FactoryId>() = { NeonTensorHandleFactory::GetIdStatic() };
Narumol Prangnawarat4e3e8182019-08-14 12:25:50 +0100544}
545
546void NeonBackend::RegisterTensorHandleFactories(class TensorHandleFactoryRegistry& registry)
547{
548 auto memoryManager = std::make_shared<NeonMemoryManager>(std::make_unique<arm_compute::Allocator>(),
549 BaseMemoryManager::MemoryAffinity::Offset);
550
551 registry.RegisterMemoryManager(memoryManager);
Narumol Prangnawarat77400452022-01-13 17:43:41 +0000552
553 auto factory = std::make_unique<NeonTensorHandleFactory>(memoryManager);
554 // Register copy and import factory pair
555 registry.RegisterCopyAndImportFactoryPair(factory->GetId(), factory->GetId());
556 // Register the factory
557 registry.RegisterFactory(std::move(factory));
Narumol Prangnawarat4e3e8182019-08-14 12:25:50 +0100558}
559
Francis Murtaghe8d7ccb2021-10-14 17:30:24 +0100560std::unique_ptr<ICustomAllocator> NeonBackend::GetDefaultAllocator() const
561{
562 return std::make_unique<DefaultAllocator>();
563}
564
565
Matthew Bentham42bad952018-12-17 09:23:36 +0000566} // namespace armnn