//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//

#include "Network.hpp"
#include "Graph.hpp"
#include "Layer.hpp"
#include "DeviceSpec.hpp"
#include "Optimizer.hpp"
#include "SubgraphViewSelector.hpp"
#include "BackendSettings.hpp"
#include "optimizations/All.hpp"

#include <backendsCommon/CpuTensorHandle.hpp>
#include <backendsCommon/WorkloadFactory.hpp>
#include <armnn/backends/IBackendInternal.hpp>
#include <backendsCommon/TensorHandleFactoryRegistry.hpp>

#include <armnn/Exceptions.hpp>
#include <armnn/Utils.hpp>
#include <armnn/TypesUtils.hpp>
#include <armnn/BackendRegistry.hpp>
#include <armnn/Logging.hpp>
#include <armnn/utility/IgnoreUnused.hpp>

#include <ProfilingService.hpp>

#include <fcntl.h>
#include <algorithm>
#include <fstream>
#include <memory>
#include <vector>

#include <boost/assert.hpp>
#include <boost/format.hpp>
#include <boost/numeric/conversion/converter_policies.hpp>
#include <boost/cast.hpp>
namespace armnn
{

armnn::INetwork* INetwork::CreateRaw()
{
    return new Network();
}

armnn::INetworkPtr INetwork::Create()
{
    return INetworkPtr(CreateRaw(), &INetwork::Destroy);
}

void INetwork::Destroy(INetwork* network)
{
    delete boost::polymorphic_downcast<Network*>(network);
}
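
// Typical client usage (a minimal sketch; error handling omitted):
//     armnn::INetworkPtr network = armnn::INetwork::Create();
//     armnn::IConnectableLayer* input = network->AddInputLayer(0);
//     // ... add further layers, connect the slots, then hand the network to armnn::Optimize().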

void IOptimizedNetwork::Destroy(IOptimizedNetwork* network)
{
    delete boost::polymorphic_downcast<OptimizedNetwork*>(network);
}

Status OptimizedNetwork::PrintGraph()
{
    m_Graph->Print();
    return Status::Success;
}

Status OptimizedNetwork::SerializeToDot(std::ostream& stream) const
{
    return m_Graph->SerializeToDot(stream);
}

void ReportError(const std::string& errorMessage,
                 Optional<std::vector<std::string>&> errorMessages)
{
    std::stringstream fullErrorMessage;
    fullErrorMessage << "ERROR: " << errorMessage;
    ARMNN_LOG(warning) << fullErrorMessage.str();
    if (errorMessages)
    {
        errorMessages.value().push_back(fullErrorMessage.str());
    }
}

void ReportWarning(const std::string& warningMessage,
                   Optional<std::vector<std::string>&> warningMessages)
{
    std::stringstream fullWarningMessage;
    fullWarningMessage << "WARNING: " << warningMessage;
    ARMNN_LOG(warning) << fullWarningMessage.str();
    if (warningMessages)
    {
        warningMessages.value().push_back(fullWarningMessage.str());
    }
}
98
Derek Lamberti4a9e24b2020-01-03 16:53:38 +000099OptimizationResult ReturnWithError(OptimizationResult res,
100 const Layer* layer,
101 const BackendSettings& backendSettings,
102 Optional<std::vector<std::string>&> errMessages)
103{
104 std::stringstream failureMsg;
105 failureMsg << "Layer of type " << GetLayerTypeAsCString(layer->GetType())
106 << " is not supported on any preferred backend " << backendSettings.m_PreferredBackends;
107 ReportError(failureMsg.str(), errMessages);
108
109 res.m_Error = true;
110 return res;
111}
112
113
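// Verifies that every QAsymmU8 output of the layer has a quantization scale set.
// Returns false (reporting via errMessages) if any scale is missing. As a side effect,
// Softmax outputs with incorrect quantization parameters are reset to the required
// scale of 1/256 and offset of 0.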
bool CheckScaleSetOnQuantizedType(Layer* layer, Optional<std::vector<std::string>&> errMessages)
{
    bool noErrors = true;
    unsigned int numOutputs = layer->GetNumOutputSlots();
    for (unsigned int i = 0; i < numOutputs; i++)
    {
        OutputSlot& outputSlot = layer->GetOutputSlot(i);
        TensorInfo info = outputSlot.GetTensorInfo();
        if (DataType::QAsymmU8 == info.GetDataType())
        {
            if (0.f == info.GetQuantizationScale())
            {
                noErrors = false;
                std::stringstream ss;
                ss << "output " << i << " of layer " << GetLayerTypeAsCString(layer->GetType())
                   << " (" << layer->GetNameStr() << ") is of type"
                   << " Quantized 8 bit but its scale parameter has not been set";
                ReportError(ss.str(), errMessages);
            }
            // Softmax under QAsymmU8 must always use scale (1.0f / 256.0f) and offset 0
            if ((info.GetQuantizationScale() != (1.0f / 256.0f) ||
                 info.GetQuantizationOffset() != 0) &&
                 layer->GetType() == armnn::LayerType::Softmax)
            {
                std::stringstream ss;
                ss << "Quantization parameters for Softmax layer (Scale: " <<
                    info.GetQuantizationScale() << " and Offset: " << info.GetQuantizationOffset() <<
                    ") are incorrect and have been updated to Scale: 0.00390625 and Offset: 0";
                ARMNN_LOG(warning) << ss.str();
                info.SetQuantizationScale((1.0f / 256.0f));
                info.SetQuantizationOffset(0);
                outputSlot.SetTensorInfo(info);
            }
        }
    }
    return noErrors;
}

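// Attempts to assign the given backend to the layer. If the layer has Float16/BFloat16
// inputs or outputs that the backend cannot handle, but a Float32 equivalent is supported,
// conversion layers are inserted around the layer and assigned a supported backend themselves.
// Returns OK on success, a warning-only result when the caller should try the next backend,
// or an error if no assignment was possible.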
OptimizationResult AttemptBackendAssignment(BackendSettings& backendSettings,
                                            Graph& graph,
                                            Layer* layer,
                                            BackendId backend,
                                            DataType dataTypeIn,
                                            DataType dataTypeOut,
                                            const std::vector<BackendId>& availablePreferredBackends,
                                            std::string& reasonIfUnsupported,
                                            Optional<std::vector<std::string>&> errMessages)
{
    OptimizationResult result;

    // Helper lambda to compose meaningful error message before returning with error
    auto ReturnError = [&](const Layer* layer)
        {
            return ReturnWithError(result, layer, backendSettings, errMessages);
        };

    // Need to set the backend id on the layer
    // before we can check if it is supported
    layer->SetBackendId(backend);
    if (!IWorkloadFactory::IsLayerSupported(*layer, EmptyOptional(), reasonIfUnsupported))
    {
        if (dataTypeIn == DataType::Float16 || dataTypeOut == DataType::Float16)
        {
            if (IWorkloadFactory::IsLayerSupported(*layer, DataType::Float32, reasonIfUnsupported)
                && layer->GetType() != LayerType::ConvertFp32ToFp16
                && layer->GetType() != LayerType::ConvertFp16ToFp32)
            {
                // Insert FP16 -> FP32 conversion layer before current layer
                std::vector<ConvertFp16ToFp32Layer*> convertFp16ToFp32Layers;
                if (dataTypeIn == DataType::Float16)
                {
                    convertFp16ToFp32Layers =
                        InsertConvertFp16ToFp32LayersBefore(graph, *layer);
                }

                // Insert FP32 -> FP16 conversion layer after current layer
                std::vector<ConvertFp32ToFp16Layer*> convertFp32ToFp16Layers;
                if (dataTypeOut == DataType::Float16)
                {
                    convertFp32ToFp16Layers =
                        InsertConvertFp32ToFp16LayersAfter(graph, *layer);
                }

                // Assign a supported backend to the newly introduced conversion layers
                auto AssignFirstSupportedBackend = [&](Layer* layer, BackendId preferredBackend)
                    {
                        bool supportedBackendFound = false;
                        std::string reasonIfUnsupported;

                        // Try preferred backend first
                        layer->SetBackendId(preferredBackend);
                        if (IWorkloadFactory::IsLayerSupported(*layer,
                                                               EmptyOptional(),
                                                               reasonIfUnsupported))
                        {
                            supportedBackendFound = true;
                        }
                        else
                        {
                            for (const auto& backend : availablePreferredBackends)
                            {
                                // Skip preferred backend (we already determined that it is not supported)
                                if (backend == preferredBackend)
                                {
                                    continue;
                                }

                                layer->SetBackendId(backend);
                                if (IWorkloadFactory::IsLayerSupported(*layer,
                                                                       EmptyOptional(),
                                                                       reasonIfUnsupported))
                                {
                                    supportedBackendFound = true;
                                    break;
                                }
                            }
                        }

                        return supportedBackendFound;
                    };

                for (ConvertFp16ToFp32Layer* convertLayer : convertFp16ToFp32Layers)
                {
                    if (!AssignFirstSupportedBackend(convertLayer, backend))
                    {
                        return ReturnError(convertLayer);
                    }
                }

                for (ConvertFp32ToFp16Layer* convertLayer : convertFp32ToFp16Layers)
                {
                    if (!AssignFirstSupportedBackend(convertLayer, backend))
                    {
                        return ReturnError(convertLayer);
                    }
                }

                return result;
            }
        }
        else if (dataTypeIn == DataType::BFloat16 || dataTypeOut == DataType::BFloat16)
        {
            if (IWorkloadFactory::IsLayerSupported(*layer, DataType::Float32, reasonIfUnsupported)
                && layer->GetType() != LayerType::ConvertFp32ToBf16
                && layer->GetType() != LayerType::ConvertBf16ToFp32)
            {
                // Insert BF16 -> FP32 conversion layer before current layer
                std::vector<ConvertBf16ToFp32Layer*> convertBf16ToFp32Layers;
                if (dataTypeIn == DataType::BFloat16)
                {
                    convertBf16ToFp32Layers =
                        InsertConvertBf16ToFp32LayersBefore(graph, *layer);
                }

                // Insert FP32 -> BF16 conversion layer after current layer
                std::vector<ConvertFp32ToBf16Layer*> convertFp32ToBf16Layers;
                if (dataTypeOut == DataType::BFloat16)
                {
                    convertFp32ToBf16Layers =
                        InsertConvertFp32ToBf16LayersAfter(graph, *layer);
                }

                // Assign a supported backend to the newly introduced conversion layers
                auto AssignFirstSupportedBackend = [&](Layer* layer, BackendId preferredBackend)
                    {
                        bool supportedBackendFound = false;
                        std::string reasonIfUnsupported;

                        // Try preferred backend first
                        layer->SetBackendId(preferredBackend);
                        if (IWorkloadFactory::IsLayerSupported(*layer,
                                                               EmptyOptional(),
                                                               reasonIfUnsupported))
                        {
                            supportedBackendFound = true;
                        }
                        else
                        {
                            for (const auto& backend : availablePreferredBackends)
                            {
                                // Skip preferred backend (we already determined that it is not supported)
                                if (backend == preferredBackend)
                                {
                                    continue;
                                }

                                layer->SetBackendId(backend);
                                if (IWorkloadFactory::IsLayerSupported(*layer,
                                                                       EmptyOptional(),
                                                                       reasonIfUnsupported))
                                {
                                    supportedBackendFound = true;
                                    break;
                                }
                            }
                        }

                        return supportedBackendFound;
                    };

                for (ConvertBf16ToFp32Layer* convertLayer : convertBf16ToFp32Layers)
                {
                    if (!AssignFirstSupportedBackend(convertLayer, backend))
                    {
                        return ReturnError(convertLayer);
                    }
                }

                for (ConvertFp32ToBf16Layer* convertLayer : convertFp32ToBf16Layers)
                {
                    if (!AssignFirstSupportedBackend(convertLayer, backend))
                    {
                        return ReturnError(convertLayer);
                    }
                }

                return result;
            }
        }

        std::stringstream warningMsg;
        warningMsg << "Layer of type " << GetLayerTypeAsCString(layer->GetType())
                   << " is not supported on requested backend " << layer->GetBackendId().Get()
                   << " for input data type " << GetDataTypeName(dataTypeIn)
                   << " and output data type " << GetDataTypeName(dataTypeOut)
                   << " (reason: " << reasonIfUnsupported
                   << "), falling back to the next backend.";
        ReportWarning(warningMsg.str(), errMessages);

        return OptimizationResult(true, false);
    }
    else
    {
        return result;
    }
}

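// Assigns an available preferred backend to every layer in [firstLayer, lastLayer).
// A layer's backend hint is tried first, then each backend in preference order; layers
// that no backend supports fall back to CpuRef where that is valid (currently MemCopy,
// Constant and Permute), otherwise an error is returned.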
OptimizationResult AssignBackends(OptimizedNetwork* optNetObjPtr,
                                  BackendSettings& backendSettings,
                                  Graph::Iterator& firstLayer,
                                  Graph::Iterator& lastLayer,
                                  Optional<std::vector<std::string>&> errMessages)
{
    OptimizationResult result;

    // Helper lambda to compose meaningful error message before returning with error
    auto ReturnError = [&](const Layer* layer)
        {
            return ReturnWithError(result, layer, backendSettings, errMessages);
        };

    auto availablePreferredBackends = backendSettings.GetAvailablePreferredBackends();
    if (availablePreferredBackends.empty())
    {
        std::stringstream failureMsg;
        failureMsg << "No preferred backends are available";
        ReportError(failureMsg.str(), errMessages);

        result.m_Error = true;
        return result;
    }

    for (auto it = firstLayer; it != lastLayer; ++it)
    {
        auto layer = *it;

        DataType dataTypeIn = layer->GetNumInputSlots() == 0 ? DataType::Float32 :
            layer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo().GetDataType();
        DataType dataTypeOut = layer->GetNumOutputSlots() == 0 ? DataType::Float32 :
            layer->GetOutputSlot(0).GetTensorInfo().GetDataType();

        std::string reasonIfUnsupported;
        bool found = false;
        if (!CheckScaleSetOnQuantizedType(layer, errMessages))
        {
            // Don't bomb immediately, find all the quantized outputs
            // which haven't had a scale set and report them all back.
            result.m_Error = true;
        }

        // First try to assign the layer to its hinted backend
        if (layer->GetBackendHint().has_value() &&
            backendSettings.IsBackendSupported(layer->GetBackendHint().value()) &&
            AttemptBackendAssignment(backendSettings,
                                     optNetObjPtr->GetGraph(),
                                     layer,
                                     layer->GetBackendHint().value(),
                                     dataTypeIn,
                                     dataTypeOut,
                                     availablePreferredBackends,
                                     reasonIfUnsupported,
                                     errMessages).IsOk())
        {
            found = true;
            backendSettings.m_SelectedBackends.insert(layer->GetBackendHint().value());
        }
        else
        {
            // Try to assign the layer to the preferred list of backends
            for (const auto& backend : availablePreferredBackends)
            {
                if (layer->GetBackendHint().has_value() &&
                    layer->GetBackendHint().value() == backend)
                {
                    continue; // Don't re-test the backend hint
                }

                OptimizationResult res = AttemptBackendAssignment(backendSettings,
                                                                  optNetObjPtr->GetGraph(),
                                                                  layer,
                                                                  backend,
                                                                  dataTypeIn,
                                                                  dataTypeOut,
                                                                  availablePreferredBackends,
                                                                  reasonIfUnsupported,
                                                                  errMessages);

                if (res.IsOk())
                {
                    found = true;
                    backendSettings.m_SelectedBackends.insert(backend);
                    break;
                }
                else if (res.IsError())
                {
                    return res;  // Cannot continue.
                                 // Note: we don't need to log the error as it would already
                                 // be logged in AttemptBackendAssignment().
                }
                else
                {
                    BOOST_ASSERT_MSG(res.IsWarningOnly(), "OptimizationResult in unexpected state.");
                }
            }
        }

        // If the layer is unsupported by any devices, log and return a null network.
        if (!found)
        {
            // NOTE: if the layer is not an operation queue type AND we have not got CpuRef as a
            // fallback we should set the compute device on the layer to CpuRef (these are not
            // available as accelerated operations, or are only available under certain
            // conditions, currently they comprise MemCopy, Constant, Permute)
            armnn::LayerType layerType = layer->GetType();
            if (!backendSettings.IsCpuRefUsed() && (layerType == armnn::LayerType::MemCopy ||
                                                    layerType == armnn::LayerType::Constant ||
                                                    layerType == armnn::LayerType::Permute))
            {
                BackendId cpuBackendId(armnn::Compute::CpuRef);
                layer->SetBackendId(cpuBackendId);
                backendSettings.m_SelectedBackends.insert(cpuBackendId);
            }
            else
            {
                return ReturnError(layer);
            }
        }
    }

    return result;
}

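// Convenience overload that assigns backends to every layer of the given sub-graph.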
OptimizationResult AssignBackends(OptimizedNetwork* optNetObjPtr,
                                  BackendSettings& backendSettings,
                                  SubgraphView& subgraph,
                                  Optional<std::vector<std::string>&> errMessages)
{
    Graph::Iterator firstLayer = subgraph.begin();
    Graph::Iterator lastLayer = subgraph.end();
    return AssignBackends(optNetObjPtr,
                          backendSettings,
                          firstLayer,
                          lastLayer,
                          errMessages);
}

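// Instantiates a backend object for every supported backend, registering each backend's
// tensor handle factories with the supplied registry. The returned map owns the backends.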
BackendsMap CreateSupportedBackends(TensorHandleFactoryRegistry& handleFactoryRegistry,
                                    BackendSettings& backendSettings)
{
    BackendsMap backends;
    auto const& backendRegistry = BackendRegistryInstance();
    for (auto&& selectedBackend : backendSettings.m_SupportedBackends)
    {
        auto backendFactory = backendRegistry.GetFactory(selectedBackend);
        auto backendObjPtr = backendFactory();
        BOOST_ASSERT(backendObjPtr);

        backendObjPtr->RegisterTensorHandleFactories(handleFactoryRegistry);

        backends[backendObjPtr->GetId()] = std::move(backendObjPtr);
    }

    return backends;
}

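// Gives each selected backend the chance to optimize the sub-graphs assigned to it.
// Accepted substitutions are spliced into the main optimized graph; layers of failed
// sub-graphs are re-assigned to the remaining backends (the failing backend is ignored
// on the retry unless it is CpuRef).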
OptimizationResult ApplyBackendOptimizations(OptimizedNetwork* optNetObjPtr,
                                             BackendSettings& backendSettings,
                                             BackendsMap& backends,
                                             Optional<std::vector<std::string>&> errMessages)
{
    BOOST_ASSERT(optNetObjPtr);

    OptimizationResult result;

    // Get the optimized graph
    Graph& optGraph = optNetObjPtr->GetGraph();

    // Run backend specific optimizations
    for (auto&& selectedBackend : backendSettings.m_SelectedBackends)
    {
        auto backendObjPtr = backends.find(selectedBackend)->second.get();
        BOOST_ASSERT(backendObjPtr);

        // Select sub-graphs based on backend
        SubgraphViewSelector::Subgraphs subgraphs =
            SubgraphViewSelector::SelectSubgraphs(optGraph,
                                                  // Select layers assigned to the requested backend
                                                  [&backendObjPtr](const Layer& layer)
                                                  {
                                                      return layer.GetType() != LayerType::Input &&
                                                             layer.GetType() != LayerType::Output &&
                                                             layer.GetBackendId() == backendObjPtr->GetId();
                                                  });
        if (subgraphs.empty())
        {
            // No sub-graphs found, try with next selected backend
            continue;
        }

        // Try to optimize each sub-graph
        for (auto& subgraph : subgraphs)
        {
            // Try to optimize the current sub-graph
            OptimizationViews optimizationViews = backendObjPtr->OptimizeSubgraphView(*subgraph);
            BOOST_ASSERT(optimizationViews.Validate(*subgraph));

            // Optimization attempted, check the resulting optimized sub-graph
            for (auto& substitution : optimizationViews.GetSubstitutions())
            {
                // Sub-graph optimized, substitute the sub-graph with the new optimized one in the main optimized graph
                SubgraphView& replacementSubgraph = substitution.m_ReplacementSubgraph;
                SubgraphView& substitutableSubgraph = substitution.m_SubstitutableSubgraph;
                optGraph.SubstituteSubgraph(substitutableSubgraph, replacementSubgraph);

                // Assign the current backend to the optimized sub-graph
                std::for_each(replacementSubgraph.begin(), replacementSubgraph.end(), [&selectedBackend](Layer* l)
                    {
                        BOOST_ASSERT(l);
                        l->SetBackendId(selectedBackend);
                    });
            }

            if (!optimizationViews.GetFailedSubgraphs().empty())
            {
                std::stringstream warningMsg;
                warningMsg << "Some sub-graph(s) failed to optimize on " << backendObjPtr->GetId() << " backend.";
                ReportWarning(warningMsg.str(), errMessages);

                // Failed to optimize the given sub-graph, re-assign the sub-graph layers to other available backends
                BackendSettings settingsCopy(backendSettings);
                if (!backendObjPtr->GetId().IsCpuRef())
                {
                    // Add the current backend to the list of backends to ignore
                    settingsCopy.m_IgnoredBackends.insert(backendObjPtr->GetId());
                }

                int count = 0;
                for (auto& failedSubgraph : optimizationViews.GetFailedSubgraphs())
                {
                    // An error occurred: the optimization was attempted but not performed, try different backends
                    std::stringstream subgraphMsg;
                    subgraphMsg << "Re-assigning backends to " << failedSubgraph.GetLayers().size()
                                << " layers inside sub-graph " << count++;
                    ReportWarning(subgraphMsg.str(), errMessages);

                    OptimizationResult reassignmentResult = AssignBackends(optNetObjPtr,
                                                                           settingsCopy,
                                                                           *subgraph,
                                                                           errMessages);
                    if (reassignmentResult.m_Error)
                    {
                        // Failed to re-assign one of the remaining backends to each layer of the sub-graph
                        result.m_Error = true;
                        return result;
                    }
                }
            }
        }
    }

    return result;
}

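// A copy is needed between two tensor handle factories unless they are the same factory,
// or the destination can directly import what the source exports (their export and
// import memory-source flags intersect).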
bool RequiresCopy(ITensorHandleFactory::FactoryId src,
                  ITensorHandleFactory::FactoryId dst,
                  TensorHandleFactoryRegistry& registry)
{
    if (src != dst)
    {
        ITensorHandleFactory* srcFactory = registry.GetFactory(src);
        ITensorHandleFactory* dstFactory = registry.GetFactory(dst);

        if (srcFactory && dstFactory &&
            (srcFactory->GetExportFlags() & dstFactory->GetImportFlags()) != 0)
        {
            return false;
        }
        return true;
    }
    return false;
}

// Find the handle factory for the input layer which results in fewest required copies.
ITensorHandleFactory::FactoryId CalculateSlotOptionForInput(BackendsMap& backends,
                                                            OutputSlot& slot,
                                                            TensorHandleFactoryRegistry& registry)
{
    Layer& layer = slot.GetOwningLayer();
    BOOST_ASSERT(layer.GetType() == LayerType::Input);

    // Explicitly select the tensor handle factory for InputLayer because the rules for it are slightly different. It
    // doesn't matter which backend it is assigned to because they all use the same implementation, which
    // requires Map/Unmap support. This means that, so long as the handle type supports map/unmap semantics, we can
    // select a factory with maximum compatibility with the layers connected to the InputLayer.

    // First ensure the source backend supports the TensorHandle API
    auto frmBackend = backends.find(layer.GetBackendId());
    if (frmBackend == backends.end() ||
        !frmBackend->second->SupportsTensorAllocatorAPI())
    {
        return ITensorHandleFactory::LegacyFactoryId;
    }

    // Go through all connections to the output slot and determine the TensorHandleFactory which results in the
    // fewest copies.
    std::map<ITensorHandleFactory::FactoryId, int> factoryScores;
    int topScore = 0;
    ITensorHandleFactory::FactoryId topChoice = ITensorHandleFactory::LegacyFactoryId;

    for (auto&& connection : slot.GetConnections())
    {
        const Layer& connectedLayer = connection->GetOwningLayer();

        auto toBackend = backends.find(connectedLayer.GetBackendId());
        BOOST_ASSERT_MSG(toBackend != backends.end(), "Backend id not found for the connected layer");

        if (!toBackend->second.get()->SupportsTensorAllocatorAPI())
        {
            // The destination backend does not support the tensor allocator API, move to the next one
            continue;
        }

        auto dstPrefs = toBackend->second.get()->GetHandleFactoryPreferences();
        for (auto&& dst : dstPrefs)
        {
            // Input layers use the mem copy workload or import, so the selected factory must
            // support either the map/unmap API or Import API
            ITensorHandleFactory* factory = registry.GetFactory(dst);
            if (!factory->SupportsMapUnmap() &&
                !CheckFlag(factory->GetImportFlags(), MemorySource::Malloc)) // Just support cpu mem imports for now
            {
                // The current tensor handle factory does not support the map/unmap or import
                // strategy, move to the next one
                continue;
            }

            auto it = factoryScores.find(dst);
            if (it == factoryScores.end())
            {
                // Add new score to the table
                factoryScores[dst] = 0;
                if (topChoice == ITensorHandleFactory::LegacyFactoryId)
                {
                    topChoice = dst;
                }
            }
            else
            {
                // Increase the score
                factoryScores[dst]++;

                // Track the best option
                if (factoryScores[dst] > topScore)
                {
                    topScore = factoryScores[dst];
                    topChoice = dst;
                }
            }
        }
    }

    return topChoice;
}

// Find the handle factory for the output layer; the choice is currently always deferred
// to the DeferredFactoryId placeholder.
ITensorHandleFactory::FactoryId CalculateSlotOptionForOutput(BackendsMap& backends,
                                                             OutputSlot& slot,
                                                             TensorHandleFactoryRegistry& registry)
{
    IgnoreUnused(backends, slot, registry);
    return ITensorHandleFactory::DeferredFactoryId;
}

// For all handle factories supported on the source backend, we wish to find the one which requires the fewest copies
// when considering all connections.
ITensorHandleFactory::FactoryId CalculateSlotOption(BackendsMap& backends,
                                                    OutputSlot& outputSlot,
                                                    TensorHandleFactoryRegistry& registry)
{
    // First ensure the source backend supports the TensorHandle API
    Layer& layer = outputSlot.GetOwningLayer();
    auto frmBackend = backends.find(layer.GetBackendId());
    if (frmBackend == backends.end() ||
        !frmBackend->second->SupportsTensorAllocatorAPI())
    {
        return ITensorHandleFactory::LegacyFactoryId;
    }

    // Connections to Output layers require support for map/unmap on the TensorHandle.
    bool requiresMapUnmap = false;
    for (auto&& connection : outputSlot.GetConnections())
    {
        const Layer& connectedLayer = connection->GetOwningLayer();
        if (connectedLayer.GetType() == LayerType::Output)
        {
            requiresMapUnmap = true;
        }
    }

    IBackendInternal* srcBackend = frmBackend->second.get();
    auto srcPrefs = srcBackend->GetHandleFactoryPreferences();

    // Initialize the scores
    std::map<ITensorHandleFactory::FactoryId, int> factoryScores;
    for (auto&& pref : srcPrefs)
    {
        if (requiresMapUnmap) // Only consider factories that support map/unmap if required
        {
            ITensorHandleFactory* factory = registry.GetFactory(pref);
            if (!factory->SupportsMapUnmap())
            {
                // The current tensor handle factory does not support the map/unmap strategy, move to the next one
                continue;
            }
        }

        auto it = factoryScores.find(pref);
        if (it == factoryScores.end())
        {
            // Add new score to the table
            factoryScores[pref] = 0;
        }
    }

    // Score each handle factory based on how many times it requires copies on the slot connections
    for (auto&& connection : outputSlot.GetConnections())
    {
        const Layer& connectedLayer = connection->GetOwningLayer();

        auto toBackend = backends.find(connectedLayer.GetBackendId());
        BOOST_ASSERT_MSG(toBackend != backends.end(), "Backend id not found for the connected layer");

        auto dstPrefs = toBackend->second.get()->GetHandleFactoryPreferences();
        for (auto&& src : srcPrefs)
        {
            if (factoryScores.find(src) == factoryScores.end()) // Don't consider excluded factories
            {
                continue;
            }

            for (auto&& dst : dstPrefs)
            {
                if (RequiresCopy(src, dst, registry))
                {
                    // Copy required, increase the score
                    factoryScores[src]++;
                    break;
                }
            }
        }
    }

    // Find the lowest score
    int minScore = std::numeric_limits<int>::max();
    for (auto it : factoryScores)
    {
        minScore = std::min(minScore, it.second);
    }

    // Collect factories matching the best (lowest) score
    std::vector<ITensorHandleFactory::FactoryId> optimalFactories;
    for (auto it : factoryScores)
    {
        if (it.second == minScore)
        {
            optimalFactories.push_back(it.first);
        }
    }

    // For all compatible factories matching the best score, find the preferred one for the current layer.
    for (auto&& srcPref : srcPrefs)
    {
        for (auto&& comp : optimalFactories)
        {
            if (comp == srcPref)
            {
                return comp;
            }
        }
    }

    return ITensorHandleFactory::LegacyFactoryId;
}

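// Chooses how tensor data crosses the given edge. After a legacy-API fallback check,
// the preference order is: DirectCompatibility (edge feeds an Output layer, or the
// destination accepts the source factory), ExportToTarget (export/import flags
// intersect), CopyToTarget (both sides support map/unmap), otherwise Undefined.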
EdgeStrategy CalculateEdgeStrategy(BackendsMap& backends,
                                   ITensorHandleFactory::FactoryId srcFactoryId,
                                   const Layer& layer,
                                   const Layer& connectedLayer,
                                   TensorHandleFactoryRegistry& registry)
{
    auto toBackend = backends.find(connectedLayer.GetBackendId());
    BOOST_ASSERT_MSG(toBackend != backends.end(), "Backend id not found for the connected layer");

    auto dstPrefs = toBackend->second.get()->GetHandleFactoryPreferences();

    // Legacy API check for backward compatibility
    if (srcFactoryId == ITensorHandleFactory::LegacyFactoryId || dstPrefs.empty())
    {
        if (layer.GetBackendId() != connectedLayer.GetBackendId())
        {
            return EdgeStrategy::CopyToTarget;
        }
        else
        {
            return EdgeStrategy::DirectCompatibility;
        }
    }

    // TensorHandleFactory API present, so perform more sophisticated strategies.
    // Dst Output layers don't require copy because they use import or map/unmap
    if (connectedLayer.GetType() == LayerType::Output)
    {
        return EdgeStrategy::DirectCompatibility;
    }

    // Search for direct match in prefs
    for (auto&& pref : dstPrefs)
    {
        if (pref == srcFactoryId)
        {
            return EdgeStrategy::DirectCompatibility;
        }
    }

    // Search for export/import options
    ITensorHandleFactory* srcFactory = registry.GetFactory(srcFactoryId);
    if (srcFactory->GetExportFlags() != 0)
    {
        for (auto&& pref : dstPrefs)
        {
            ITensorHandleFactory* dstFactory = registry.GetFactory(pref);

            // Handles cases when a destPref is not listed in TensorHandleFactoryRegistry
            if (!dstFactory)
            {
                continue;
            }

            if ((dstFactory->GetImportFlags() & srcFactory->GetExportFlags()) != 0)
            {
                return EdgeStrategy::ExportToTarget;
            }
        }
    }

    // Search for copy options via map/unmap
    if (srcFactory->SupportsMapUnmap())
    {
        for (auto&& pref : dstPrefs)
        {
            ITensorHandleFactory* dstFactory = registry.GetFactory(pref);
            if (dstFactory && dstFactory->SupportsMapUnmap())
            {
                return EdgeStrategy::CopyToTarget;
            }
        }
    }

    return EdgeStrategy::Undefined;
}

// Select the TensorHandleFactories and the corresponding memory strategy
OptimizationResult SelectTensorHandleStrategy(Graph& optGraph,
                                              BackendsMap& backends,
                                              TensorHandleFactoryRegistry& registry,
                                              Optional<std::vector<std::string>&> errMessages)
{
    OptimizationResult result;

    optGraph.ForEachLayer([&backends, &registry, &result, &errMessages](Layer* layer)
    {
        BOOST_ASSERT(layer);

        // Let's make sure the backend is in our list of supported backends. Something went wrong during backend
        // assignment if this check fails
        BOOST_ASSERT(backends.find(layer->GetBackendId()) != backends.end());

        // Check each output separately
        for (unsigned int slotIdx = 0; slotIdx < layer->GetNumOutputSlots(); slotIdx++)
        {
            OutputSlot& outputSlot = layer->GetOutputSlot(slotIdx);

            ITensorHandleFactory::FactoryId slotOption = ITensorHandleFactory::LegacyFactoryId;

            // Calculate the factory to use which results in the fewest copies being made.
            switch(layer->GetType())
            {
                case LayerType::Input:
                    slotOption = CalculateSlotOptionForInput(backends, outputSlot, registry);
                    break;
                case LayerType::Output:
                    slotOption = CalculateSlotOptionForOutput(backends, outputSlot, registry);
                    break;
                default:
                    slotOption = CalculateSlotOption(backends, outputSlot, registry);
                    break;
            }
            outputSlot.SetTensorHandleFactory(slotOption);

            // Now determine the "best" edge strategy for each connection given the slotOption.
            unsigned int connectionIdx = 0;
            for (auto&& connection : outputSlot.GetConnections())
            {
                const Layer& connectedLayer = connection->GetOwningLayer();

                EdgeStrategy strategy = CalculateEdgeStrategy(backends, slotOption, *layer, connectedLayer, registry);

                if (strategy == EdgeStrategy::Undefined)
                {
                    result.m_Error = true;
                    if (errMessages)
                    {
                        errMessages.value().emplace_back("Could not find valid strategy required for compatibility"
                                                         " between backends.");
                    }
                    return;
                }

                outputSlot.SetEdgeStrategy(connectionIdx, strategy);

                connectionIdx++;
            }
        }
    });

    return result;
}

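// Optimizes the given network for the preferred backends. The main stages are: graph-level
// optimization passes, optional FP32->FP16/BF16 reduction, backend assignment per layer,
// backend-specific sub-graph optimization, tensor handle strategy selection, and insertion
// of compatibility (copy/import) layers.
//
// A minimal call might look as follows (a sketch; assumes an IRuntime created elsewhere):
//     std::vector<armnn::BackendId> preferences = { armnn::Compute::CpuAcc, armnn::Compute::CpuRef };
//     armnn::IOptimizedNetworkPtr optNet =
//         armnn::Optimize(*network, preferences, runtime->GetDeviceSpec(), armnn::OptimizerOptions());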
IOptimizedNetworkPtr Optimize(const INetwork& inNetwork,
                              const std::vector<BackendId>& backendPreferences,
                              const IDeviceSpec& deviceSpec,
                              const OptimizerOptions& options,
                              Optional<std::vector<std::string>&> messages)
{
    if (backendPreferences.empty())
    {
        throw armnn::InvalidArgumentException("Invoked Optimize with no backends specified");
    }

    if (options.m_ReduceFp32ToFp16 && options.m_ReduceFp32ToBf16)
    {
        throw InvalidArgumentException("BFloat16 and Float16 optimization cannot be enabled at the same time.");
    }

    const Network& network = *boost::polymorphic_downcast<const Network*>(&inNetwork);
    std::unique_ptr<Graph> graph = std::make_unique<Graph>(network.GetGraph());

    auto optNet = IOptimizedNetworkPtr(new OptimizedNetwork(std::move(graph)), &IOptimizedNetwork::Destroy);

    OptimizedNetwork* optNetObjPtr = boost::polymorphic_downcast<OptimizedNetwork*>(optNet.get());

    // Get the optimized graph
    Graph& optGraph = optNetObjPtr->GetGraph();

    // Perform optimisation passes
    using namespace optimizations;
    Optimizer::Pass(optGraph, MakeOptimizations(SquashEqualPermuteSiblings(),
                                                SquashEqualTransposeSiblings(),
                                                SquashEqualReshapeSiblings(),
                                                OptimizeInversePermutes(),
                                                OptimizeInverseTransposes(),
                                                MovePermuteUp(),
                                                MoveTransposeUp(),
                                                PermuteAsReshape(),
                                                TransposeAsReshape(),
                                                OptimizeConsecutiveReshapes(),
                                                FoldPadIntoConvolution2d(),
                                                PermuteAndBatchToSpaceAsDepthToSpace(),
                                                TransposeAndBatchToSpaceAsDepthToSpace()));

    // Infer the tensor infos for all output slots. Throws an exception on failure
    optGraph.InferTensorInfos();

    // If Fp32 to Fp16 optimization is set convert Fp32 network to Fp16
    if (options.m_ReduceFp32ToFp16)
    {
        Optimizer::Pass(optGraph, MakeOptimizations(Fp32NetworkToFp16Converter()));
        Optimizer::Pass(optGraph, MakeOptimizations(ConvertConstantsFloatToHalf()));
    }

    // If Fp32 to Bf16 optimization is set convert Fp32 network to Bf16
    // Convert input of Convolution2d and FullyConnected from Fp32 to Bf16
    // Only Constant weight of Convolution2d and FullyConnected are converted from Fp32 to Bf16
    if (options.m_ReduceFp32ToBf16)
    {
        Optimizer::Pass(optGraph, MakeOptimizations(Fp32NetworkToBf16Converter()));
    }

    // Initialize backend settings
    BackendSettings backendSettings(backendPreferences, deviceSpec);
    if (backendSettings.GetAvailablePreferredBackends().empty())
    {
        std::stringstream failureMsg;
        failureMsg << "None of the preferred backends " << backendPreferences
                   << " are supported. Current platform provides " << backendSettings.m_SupportedBackends;
        ReportError(failureMsg.str(), messages);
        return IOptimizedNetworkPtr(nullptr, &IOptimizedNetwork::Destroy);
    }

    // Create a map to temporarily hold initialized backend objects
    TensorHandleFactoryRegistry tensorHandleFactoryRegistry;
    BackendsMap backends = CreateSupportedBackends(tensorHandleFactoryRegistry, backendSettings);

    // Assign an available backend to each layer
    Graph::Iterator firstLayer = optGraph.begin();
    Graph::Iterator lastLayer = optGraph.end();
    OptimizationResult assignBackendsResult = AssignBackends(optNetObjPtr,
                                                             backendSettings,
                                                             firstLayer,
                                                             lastLayer,
                                                             messages);
    if (assignBackendsResult.m_Error)
    {
        // Failed to assign a backend to each layer
        return IOptimizedNetworkPtr(nullptr, &IOptimizedNetwork::Destroy);
    }

    Optimizer::Pass(optGraph, MakeOptimizations(OptimizeInverseConversionsFp16(),
                                                OptimizeInverseConversionsFp32()));

    // Apply the backend-specific optimizations
    OptimizationResult backendOptimizationResult = ApplyBackendOptimizations(optNetObjPtr,
                                                                             backendSettings,
                                                                             backends,
                                                                             messages);
    if (backendOptimizationResult.m_Error)
    {
        // Failed to apply the backend-specific optimizations
        return IOptimizedNetworkPtr(nullptr, &IOptimizedNetwork::Destroy);
    }

    // If the debug flag is set, then insert a DebugLayer after each layer
    // Doing this after applying the backend optimizations as they might have changed some layers
    if (options.m_Debug)
    {
        Optimizer::Pass(optGraph, MakeOptimizations(InsertDebugLayer()));
    }

    // Calculate the compatibility strategies for tensor handles
    OptimizationResult strategyResult = SelectTensorHandleStrategy(optGraph,
                                                                   backends,
                                                                   tensorHandleFactoryRegistry,
                                                                   messages);
    if (strategyResult.m_Error)
    {
        // Failed to select the tensor handle strategies
        return IOptimizedNetworkPtr(nullptr, &IOptimizedNetwork::Destroy);
    }

    // Based on the tensor handle strategy determined above, insert copy layers where required.
    optGraph.AddCompatibilityLayers(backends, tensorHandleFactoryRegistry);

    // Convert constants
    Optimizer::Pass(optGraph, MakeOptimizations(ConvertConstantsFloatToHalf()));
    Optimizer::Pass(optGraph, MakeOptimizations(ConvertConstantsHalfToFloat()));

    // Run backend specific optimizations (deprecated)
    for (auto&& chosenBackend : backendSettings.m_SelectedBackends)
    {
        auto factoryFun = BackendRegistryInstance().GetFactory(chosenBackend);
        auto backendPtr = factoryFun();
        BOOST_ASSERT(backendPtr.get() != nullptr);

        ARMNN_NO_DEPRECATE_WARN_BEGIN
        auto backendSpecificOptimizations = backendPtr->GetOptimizations();
        ARMNN_NO_DEPRECATE_WARN_END

        if (!backendSpecificOptimizations.empty())
        {
            Optimizer::Pass(optNetObjPtr->GetGraph(), backendSpecificOptimizations);
        }
    }

    return optNet;
}

Network::Network()
    : m_Graph(std::make_unique<Graph>())
{
}

Network::~Network()
{
}

Status Network::PrintGraph()
{
    m_Graph->Print();
    return Status::Success;
}

IConnectableLayer* Network::AddInputLayer(LayerBindingId id, const char* name)
{
    return m_Graph->AddLayer<InputLayer>(id, name);
}

IConnectableLayer* Network::AddBatchToSpaceNdLayer(const BatchToSpaceNdDescriptor& batchToSpaceNdDescriptor,
                                                   const char* name)
{
    return m_Graph->AddLayer<BatchToSpaceNdLayer>(batchToSpaceNdDescriptor, name);
}

IConnectableLayer* Network::AddComparisonLayer(const ComparisonDescriptor& comparisonDescriptor,
                                               const char* name)
{
    return m_Graph->AddLayer<ComparisonLayer>(comparisonDescriptor, name);
}

IConnectableLayer* Network::AddElementwiseUnaryLayer(const ElementwiseUnaryDescriptor& elementwiseUnaryDescriptor,
                                                     const char* name)
{
    return m_Graph->AddLayer<ElementwiseUnaryLayer>(elementwiseUnaryDescriptor, name);
}

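// Shared implementation for the AddFullyConnectedLayer overloads: validates that biases are
// present when the descriptor enables them, then stores the weights (and biases) on the layer.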
telsoa014fcda012018-03-09 14:13:49 +00001156IConnectableLayer* Network::AddFullyConnectedLayerImpl(const FullyConnectedDescriptor& fullyConnectedDescriptor,
telsoa01c577f2c2018-08-31 09:22:23 +01001157 const ConstTensor& weights,
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001158 const Optional<ConstTensor>& biases,
telsoa01c577f2c2018-08-31 09:22:23 +01001159 const char* name)
telsoa014fcda012018-03-09 14:13:49 +00001160{
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001161 if (fullyConnectedDescriptor.m_BiasEnabled && !biases.has_value())
telsoa014fcda012018-03-09 14:13:49 +00001162 {
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001163 throw InvalidArgumentException("AddFullyConnectedLayer: biases cannot be empty");
telsoa014fcda012018-03-09 14:13:49 +00001164 }
1165
1166 const auto layer = m_Graph->AddLayer<FullyConnectedLayer>(fullyConnectedDescriptor, name);
1167
1168 layer->m_Weight = std::make_unique<ScopedCpuTensorHandle>(weights);
1169
1170 if (fullyConnectedDescriptor.m_BiasEnabled)
1171 {
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001172 layer->m_Bias = std::make_unique<ScopedCpuTensorHandle>(biases.value());
telsoa014fcda012018-03-09 14:13:49 +00001173 }
1174
1175 return layer;
1176}
1177
1178IConnectableLayer* Network::AddFullyConnectedLayer(const FullyConnectedDescriptor& fullyConnectedDescriptor,
telsoa01c577f2c2018-08-31 09:22:23 +01001179 const ConstTensor& weights,
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001180 const Optional<ConstTensor>& biases,
telsoa01c577f2c2018-08-31 09:22:23 +01001181 const char* name)
telsoa014fcda012018-03-09 14:13:49 +00001182{
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001183 return AddFullyConnectedLayerImpl(fullyConnectedDescriptor, weights, biases, name);
telsoa014fcda012018-03-09 14:13:49 +00001184}
1185
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001186IConnectableLayer* Network::AddFullyConnectedLayer(const FullyConnectedDescriptor& fullyConnectedDescriptor,
1187 const ConstTensor& weights,
1188 const char* name)
1189{
Matteo Martincighfc598e12019-05-14 10:36:13 +01001190 Optional<ConstTensor> biases;
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001191 return AddFullyConnectedLayerImpl(fullyConnectedDescriptor, weights, biases, name);
1192}
1193
telsoa014fcda012018-03-09 14:13:49 +00001194IConnectableLayer* Network::AddFullyConnectedLayer(const FullyConnectedDescriptor& fullyConnectedDescriptor,
telsoa01c577f2c2018-08-31 09:22:23 +01001195 const ConstTensor& weights,
1196 const ConstTensor& biases,
1197 const char* name)
telsoa014fcda012018-03-09 14:13:49 +00001198{
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001199 Optional<ConstTensor> optionalBiases(biases);
1200 return AddFullyConnectedLayerImpl(fullyConnectedDescriptor, weights, optionalBiases, name);
telsoa014fcda012018-03-09 14:13:49 +00001201}
1202
Jim Flynne242f2d2019-05-22 14:24:13 +01001203IConnectableLayer* Network::AddConcatLayer(const ConcatDescriptor& concatDescriptor,
Jim Flynn906f9462019-05-10 13:55:21 +01001204 const char* name)
1205{
Jim Flynne242f2d2019-05-22 14:24:13 +01001206 return m_Graph->AddLayer<ConcatLayer>(concatDescriptor, name);
Jim Flynn906f9462019-05-10 13:55:21 +01001207}
1208
telsoa014fcda012018-03-09 14:13:49 +00001209IConnectableLayer* Network::AddConvolution2dLayerImpl(const Convolution2dDescriptor& convolution2dDescriptor,
telsoa01c577f2c2018-08-31 09:22:23 +01001210 const ConstTensor& weights,
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001211 const Optional<ConstTensor>& biases,
telsoa01c577f2c2018-08-31 09:22:23 +01001212 const char* name)
telsoa014fcda012018-03-09 14:13:49 +00001213{
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001214 if (convolution2dDescriptor.m_BiasEnabled && !biases.has_value())
telsoa014fcda012018-03-09 14:13:49 +00001215 {
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001216 throw InvalidArgumentException("AddConvolution2dLayer: biases cannot be empty");
telsoa014fcda012018-03-09 14:13:49 +00001217 }
1218
1219 const auto layer = m_Graph->AddLayer<Convolution2dLayer>(convolution2dDescriptor, name);
1220
1221 layer->m_Weight = std::make_unique<ScopedCpuTensorHandle>(weights);
1222
1223 if (convolution2dDescriptor.m_BiasEnabled)
1224 {
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001225 layer->m_Bias = std::make_unique<ScopedCpuTensorHandle>(biases.value());
telsoa014fcda012018-03-09 14:13:49 +00001226 }
1227
1228 return layer;
1229}
1230
1231IConnectableLayer* Network::AddConvolution2dLayer(const Convolution2dDescriptor& convolution2dDescriptor,
telsoa01c577f2c2018-08-31 09:22:23 +01001232 const ConstTensor& weights,
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001233 const Optional<ConstTensor>& biases,
telsoa01c577f2c2018-08-31 09:22:23 +01001234 const char* name)
telsoa014fcda012018-03-09 14:13:49 +00001235{
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001236 return AddConvolution2dLayerImpl(convolution2dDescriptor, weights, biases, name);
telsoa014fcda012018-03-09 14:13:49 +00001237}
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001238
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001239IConnectableLayer* Network::AddConvolution2dLayer(const Convolution2dDescriptor& convolution2dDescriptor,
1240 const ConstTensor& weights,
1241 const char* name)
1242{
Matteo Martincighfc598e12019-05-14 10:36:13 +01001243 Optional<ConstTensor> biases;
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001244 return AddConvolution2dLayerImpl(convolution2dDescriptor, weights, biases, name);
1245}
1246
telsoa014fcda012018-03-09 14:13:49 +00001247IConnectableLayer* Network::AddConvolution2dLayer(const Convolution2dDescriptor& convolution2dDescriptor,
telsoa01c577f2c2018-08-31 09:22:23 +01001248 const ConstTensor& weights,
1249 const ConstTensor& biases,
1250 const char* name)
telsoa014fcda012018-03-09 14:13:49 +00001251{
Aron Virginas-Tarad402702019-02-22 17:03:44 +00001252 Optional<ConstTensor> optionalBiases(biases);
1253 return AddConvolution2dLayerImpl(convolution2dDescriptor, weights, optionalBiases, name);
telsoa014fcda012018-03-09 14:13:49 +00001254}

IConnectableLayer* Network::AddDepthwiseConvolution2dLayerImpl(
    const DepthwiseConvolution2dDescriptor& convolution2dDescriptor,
    const ConstTensor& weights,
    const Optional<ConstTensor>& biases,
    const char* name)
{
    if (convolution2dDescriptor.m_BiasEnabled && !biases.has_value())
    {
        throw InvalidArgumentException("AddDepthwiseConvolution2dLayer: biases cannot be empty");
    }

    const auto layer = m_Graph->AddLayer<DepthwiseConvolution2dLayer>(convolution2dDescriptor, name);

    layer->m_Weight = std::make_unique<ScopedCpuTensorHandle>(weights);

    if (convolution2dDescriptor.m_BiasEnabled)
    {
        layer->m_Bias = std::make_unique<ScopedCpuTensorHandle>(biases.value());
    }

    return layer;
}

IConnectableLayer* Network::AddDepthToSpaceLayer(const DepthToSpaceDescriptor& depthToSpaceDescriptor,
                                                 const char* name)
{
    return m_Graph->AddLayer<DepthToSpaceLayer>(depthToSpaceDescriptor, name);
}

IConnectableLayer* Network::AddDepthwiseConvolution2dLayer(
    const DepthwiseConvolution2dDescriptor& convolution2dDescriptor,
    const ConstTensor& weights,
    const Optional<ConstTensor>& biases,
    const char* name)
{
    return AddDepthwiseConvolution2dLayerImpl(convolution2dDescriptor, weights, biases, name);
}

IConnectableLayer* Network::AddDepthwiseConvolution2dLayer(
    const DepthwiseConvolution2dDescriptor& convolution2dDescriptor,
    const ConstTensor& weights,
    const char* name)
{
    Optional<ConstTensor> biases;
    return AddDepthwiseConvolution2dLayerImpl(convolution2dDescriptor, weights, biases, name);
}

IConnectableLayer* Network::AddDepthwiseConvolution2dLayer(
    const DepthwiseConvolution2dDescriptor& convolution2dDescriptor,
    const ConstTensor& weights,
    const ConstTensor& biases,
    const char* name)
{
    Optional<ConstTensor> optionalBiases(biases);
    return AddDepthwiseConvolution2dLayerImpl(convolution2dDescriptor, weights, optionalBiases, name);
}
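
// Note: the depthwise overloads mirror the Convolution2d ones above. All three
// public entry points funnel into AddDepthwiseConvolution2dLayerImpl, which
// takes ownership of copies of the weight/bias tensors via
// ScopedCpuTensorHandle and rejects a bias-enabled descriptor that arrives
// without bias data.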

IConnectableLayer* Network::AddDetectionPostProcessLayer(const armnn::DetectionPostProcessDescriptor& descriptor,
                                                         const ConstTensor& anchors, const char* name)
{
    const auto layer = m_Graph->AddLayer<DetectionPostProcessLayer>(descriptor, name);

    layer->m_Anchors = std::make_unique<ScopedCpuTensorHandle>(anchors);

    return layer;
}
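
// Usage sketch (illustrative): the anchors tensor is copied into the layer as
// a constant, so the caller's buffer does not need to outlive this call. The
// descriptor fields and values shown are assumptions picked for the example.
//
//     DetectionPostProcessDescriptor dppDesc;
//     dppDesc.m_MaxDetections     = 10;
//     dppDesc.m_NumClasses        = 90;
//     dppDesc.m_NmsScoreThreshold = 0.5f;
//     dppDesc.m_NmsIouThreshold   = 0.6f;
//
//     ConstTensor anchors(anchorsInfo, anchorsData); // hypothetical buffers
//     network->AddDetectionPostProcessLayer(dppDesc, anchors, "postprocess");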

IConnectableLayer* Network::AddPermuteLayer(const PermuteDescriptor& permuteDescriptor,
                                            const char* name)
{
    return m_Graph->AddLayer<PermuteLayer>(permuteDescriptor, name);
}

IConnectableLayer* Network::AddPooling2dLayer(const Pooling2dDescriptor& pooling2dDescriptor,
                                              const char* name)
{
    return m_Graph->AddLayer<Pooling2dLayer>(pooling2dDescriptor, name);
}

IConnectableLayer* Network::AddActivationLayer(const ActivationDescriptor& activationDescriptor,
                                               const char* name)
{
    return m_Graph->AddLayer<ActivationLayer>(activationDescriptor, name);
}

IConnectableLayer* Network::AddArgMinMaxLayer(const ArgMinMaxDescriptor& argMinMaxDescriptor,
                                              const char* name)
{
    return m_Graph->AddLayer<ArgMinMaxLayer>(argMinMaxDescriptor, name);
}

IConnectableLayer* Network::AddNormalizationLayer(const NormalizationDescriptor& normalizationDescriptor,
                                                  const char* name)
{
    return m_Graph->AddLayer<NormalizationLayer>(normalizationDescriptor, name);
}

IConnectableLayer* Network::AddSliceLayer(const SliceDescriptor& sliceDescriptor, const char* name)
{
    return m_Graph->AddLayer<SliceLayer>(sliceDescriptor, name);
}

IConnectableLayer* Network::AddSoftmaxLayer(const SoftmaxDescriptor& softmaxDescriptor,
                                            const char* name)
{
    return m_Graph->AddLayer<SoftmaxLayer>(softmaxDescriptor, name);
}

IConnectableLayer* Network::AddSplitterLayer(const ViewsDescriptor& splitterDescriptor,
                                             const char* name)
{
    return m_Graph->AddLayer<SplitterLayer>(splitterDescriptor, name);
}

IConnectableLayer* Network::AddMaximumLayer(const char* name)
{
    return m_Graph->AddLayer<MaximumLayer>(name);
}

IConnectableLayer* Network::AddMinimumLayer(const char* name)
{
    return m_Graph->AddLayer<MinimumLayer>(name);
}

IConnectableLayer* Network::AddMergerLayer(const MergerDescriptor& mergerDescriptor,
                                           const char* name)
{
    return AddConcatLayer(mergerDescriptor, name);
}
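
// Note: AddMergerLayer is kept only as a backwards-compatible alias and simply
// forwards to AddConcatLayer (MergerDescriptor is a typedef of the concat
// origins descriptor), so new code should call AddConcatLayer directly.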

IConnectableLayer* Network::AddAbsLayer(const char* name)
{
    return AddElementwiseUnaryLayer(ElementwiseUnaryDescriptor(UnaryOperation::Abs), name);
}

IConnectableLayer* Network::AddAdditionLayer(const char* name)
{
    return m_Graph->AddLayer<AdditionLayer>(name);
}

IConnectableLayer* Network::AddMultiplicationLayer(const char* name)
{
    return m_Graph->AddLayer<MultiplicationLayer>(name);
}

IConnectableLayer* Network::AddOutputLayer(LayerBindingId id, const char* name)
{
    return m_Graph->AddLayer<OutputLayer>(id, name);
}

IConnectableLayer* Network::AddBatchNormalizationLayer(const BatchNormalizationDescriptor& desc,
                                                       const ConstTensor& mean,
                                                       const ConstTensor& variance,
                                                       const ConstTensor& beta,
                                                       const ConstTensor& gamma,
                                                       const char* name)
{
    const auto layer = m_Graph->AddLayer<BatchNormalizationLayer>(desc, name);

    layer->m_Mean = std::make_unique<ScopedCpuTensorHandle>(mean);
    layer->m_Variance = std::make_unique<ScopedCpuTensorHandle>(variance);
    layer->m_Beta = std::make_unique<ScopedCpuTensorHandle>(beta);
    layer->m_Gamma = std::make_unique<ScopedCpuTensorHandle>(gamma);

    return layer;
}
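
// Usage sketch (illustrative): batch normalization takes its four statistics
// as constant tensors, each copied into the layer. The shapes and buffers
// below are assumptions; in practice each statistic is a 1-D tensor whose
// length matches the normalized channel dimension.
//
//     BatchNormalizationDescriptor bnDesc;
//     bnDesc.m_Eps = 0.0001f;
//
//     // meanData/varData/betaData/gammaData are hypothetical host buffers.
//     ConstTensor mean(statsInfo, meanData);
//     ConstTensor variance(statsInfo, varData);
//     ConstTensor beta(statsInfo, betaData);
//     ConstTensor gamma(statsInfo, gammaData);
//
//     network->AddBatchNormalizationLayer(bnDesc, mean, variance, beta, gamma, "bn1");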

IConnectableLayer* Network::AddResizeBilinearLayer(const ResizeBilinearDescriptor& descriptor,
                                                   const char* name)
{
    ResizeDescriptor resizeDescriptor;
    resizeDescriptor.m_Method       = ResizeMethod::Bilinear;
    resizeDescriptor.m_DataLayout   = descriptor.m_DataLayout;
    resizeDescriptor.m_TargetWidth  = descriptor.m_TargetWidth;
    resizeDescriptor.m_TargetHeight = descriptor.m_TargetHeight;

    return m_Graph->AddLayer<ResizeLayer>(resizeDescriptor, name);
}

IConnectableLayer* Network::AddResizeLayer(const ResizeDescriptor& resizeDescriptor, const char* name)
{
    return m_Graph->AddLayer<ResizeLayer>(resizeDescriptor, name);
}
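
// Note: AddResizeBilinearLayer is a compatibility shim; it rewrites the legacy
// ResizeBilinearDescriptor into a ResizeDescriptor with m_Method set to
// ResizeMethod::Bilinear, so both entry points create the same ResizeLayer.
// New code can build a ResizeDescriptor directly (illustrative values):
//
//     ResizeDescriptor resizeDesc;
//     resizeDesc.m_Method       = ResizeMethod::Bilinear;
//     resizeDesc.m_TargetWidth  = 224;
//     resizeDesc.m_TargetHeight = 224;
//     network->AddResizeLayer(resizeDesc, "resize");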

IConnectableLayer* Network::AddInstanceNormalizationLayer(const InstanceNormalizationDescriptor& desc,
                                                          const char* name)
{
    return m_Graph->AddLayer<InstanceNormalizationLayer>(desc, name);
}

IConnectableLayer* Network::AddL2NormalizationLayer(const L2NormalizationDescriptor& desc,
                                                    const char* name)
{
    return m_Graph->AddLayer<L2NormalizationLayer>(desc, name);
}

IConnectableLayer* Network::AddLogSoftmaxLayer(const LogSoftmaxDescriptor& desc,
                                               const char* name)
{
    return m_Graph->AddLayer<LogSoftmaxLayer>(desc, name);
}

IConnectableLayer* Network::AddConstantLayer(const ConstTensor& input, const char* name)
{
    auto layer = m_Graph->AddLayer<ConstantLayer>(name);

    layer->m_LayerOutput = std::make_unique<ScopedCpuTensorHandle>(input);

    return layer;
}
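
// Usage sketch (illustrative): a ConstantLayer has no inputs and exposes its
// tensor on output slot 0, so it is typically connected straight into the
// consuming layer. Names and buffers below are assumptions for the example.
//
//     ConstTensor constData(constInfo, hostBuffer); // hypothetical buffer
//     IConnectableLayer* constant = network->AddConstantLayer(constData, "const0");
//     constant->GetOutputSlot(0).Connect(addLayer->GetInputSlot(1));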

IConnectableLayer* Network::AddReshapeLayer(const ReshapeDescriptor& reshapeDescriptor,
                                            const char* name)
{
    return m_Graph->AddLayer<ReshapeLayer>(reshapeDescriptor, name);
}

IConnectableLayer* Network::AddSpaceToBatchNdLayer(const SpaceToBatchNdDescriptor& spaceToBatchNdDescriptor,
                                                   const char* name)
{
    return m_Graph->AddLayer<SpaceToBatchNdLayer>(spaceToBatchNdDescriptor, name);
}

IConnectableLayer* Network::AddSpaceToDepthLayer(const SpaceToDepthDescriptor& spaceToDepthDescriptor,
                                                 const char* name)
{
    return m_Graph->AddLayer<SpaceToDepthLayer>(spaceToDepthDescriptor, name);
}

IConnectableLayer* Network::AddFloorLayer(const char* name)
{
    return m_Graph->AddLayer<FloorLayer>(name);
}

IConnectableLayer* Network::AddLstmLayer(const LstmDescriptor& descriptor,
                                         const LstmInputParams& params,
                                         const char* name)
{
    const auto layer = m_Graph->AddLayer<LstmLayer>(descriptor, name);

    // Lstm Basic Parameters
    layer->m_BasicParameters.m_InputToForgetWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputToForgetWeights));
    layer->m_BasicParameters.m_InputToCellWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputToCellWeights));
    layer->m_BasicParameters.m_InputToOutputWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputToOutputWeights));
    layer->m_BasicParameters.m_RecurrentToForgetWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_RecurrentToForgetWeights));
    layer->m_BasicParameters.m_RecurrentToCellWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_RecurrentToCellWeights));
    layer->m_BasicParameters.m_RecurrentToOutputWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_RecurrentToOutputWeights));
    layer->m_BasicParameters.m_ForgetGateBias =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_ForgetGateBias));
    layer->m_BasicParameters.m_CellBias =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellBias));
    layer->m_BasicParameters.m_OutputGateBias =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_OutputGateBias));

    // Lstm Cifg parameters
    if (!descriptor.m_CifgEnabled)
    {
        if (params.m_InputToInputWeights == nullptr)
        {
            throw InvalidArgumentException("AddLstmLayer: Input To Input Weights cannot be NULL "
                                           "when CIFG is disabled.");
        }
        if (params.m_RecurrentToInputWeights == nullptr)
        {
            throw InvalidArgumentException(
                "AddLstmLayer: Recurrent To Input Weights cannot be NULL "
                "when CIFG is disabled.");
        }
        if (params.m_InputGateBias == nullptr)
        {
            throw InvalidArgumentException("AddLstmLayer: Input Gate Bias cannot be NULL "
                                           "when CIFG is disabled.");
        }
        layer->m_CifgParameters.m_InputToInputWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputToInputWeights));
        layer->m_CifgParameters.m_RecurrentToInputWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_RecurrentToInputWeights));
        layer->m_CifgParameters.m_InputGateBias =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputGateBias));
    }

    // Lstm projection parameters
    if (descriptor.m_ProjectionEnabled)
    {
        if (params.m_ProjectionWeights == nullptr)
        {
            throw InvalidArgumentException("AddLstmLayer: Projection Weights cannot be NULL "
                                           "when projection is enabled.");
        }
        layer->m_ProjectionParameters.m_ProjectionWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_ProjectionWeights));
        if (params.m_ProjectionBias != nullptr)
        {
            layer->m_ProjectionParameters.m_ProjectionBias =
                std::make_unique<ScopedCpuTensorHandle>(*(params.m_ProjectionBias));
        }
    }

    // Lstm Peephole params
    if (descriptor.m_PeepholeEnabled)
    {
        if (!descriptor.m_CifgEnabled)
        {
            if (params.m_CellToInputWeights == nullptr)
            {
                throw InvalidArgumentException("AddLstmLayer: Cell To Input Weights cannot be NULL "
                                               "when Peephole is enabled and CIFG disabled.");
            }

            layer->m_PeepholeParameters.m_CellToInputWeights =
                std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellToInputWeights));
        }

        if (params.m_CellToForgetWeights == nullptr)
        {
            throw InvalidArgumentException("AddLstmLayer: Cell To Forget Weights cannot be NULL "
                                           "when Peephole is enabled.");
        }
        if (params.m_CellToOutputWeights == nullptr)
        {
            throw InvalidArgumentException("AddLstmLayer: Cell To Output Weights cannot be NULL "
                                           "when Peephole is enabled.");
        }

        layer->m_PeepholeParameters.m_CellToForgetWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellToForgetWeights));
        layer->m_PeepholeParameters.m_CellToOutputWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellToOutputWeights));
    }

    // Lstm Layer Normalization params
    if (descriptor.m_LayerNormEnabled)
    {
        if (!descriptor.m_CifgEnabled)
        {
            if (params.m_InputLayerNormWeights == nullptr)
            {
                throw InvalidArgumentException("AddLstmLayer: Input layer normalization weights cannot be NULL "
                                               "when layer normalization is enabled and CIFG disabled.");
            }
            layer->m_LayerNormParameters.m_InputLayerNormWeights =
                std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputLayerNormWeights));
        }

        if (params.m_ForgetLayerNormWeights == nullptr)
        {
            throw InvalidArgumentException("AddLstmLayer: Forget layer normalization weights cannot be NULL "
                                           "when layer normalization is enabled.");
        }
        if (params.m_CellLayerNormWeights == nullptr)
        {
            throw InvalidArgumentException("AddLstmLayer: Cell layer normalization weights cannot be NULL "
                                           "when layer normalization is enabled.");
        }
        if (params.m_OutputLayerNormWeights == nullptr)
        {
            throw InvalidArgumentException("AddLstmLayer: Output layer normalization weights cannot be NULL "
                                           "when layer normalization is enabled.");
        }
        layer->m_LayerNormParameters.m_ForgetLayerNormWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_ForgetLayerNormWeights));
        layer->m_LayerNormParameters.m_CellLayerNormWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellLayerNormWeights));
        layer->m_LayerNormParameters.m_OutputLayerNormWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_OutputLayerNormWeights));
    }

    return layer;
}
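
// Summary of the optional-parameter rules enforced above (descriptive note,
// mirroring the checks in AddLstmLayer rather than adding new behaviour):
//  - CIFG disabled      -> input-to-input weights, recurrent-to-input weights
//                          and the input gate bias must all be supplied.
//  - Projection enabled -> projection weights are required; the projection
//                          bias stays optional.
//  - Peephole enabled   -> cell-to-forget and cell-to-output weights are
//                          required; cell-to-input weights only when CIFG is
//                          also disabled.
//  - Layer norm enabled -> forget/cell/output norm weights are required;
//                          input norm weights only when CIFG is also disabled.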

IConnectableLayer* Network::AddDivisionLayer(const char* name)
{
    return m_Graph->AddLayer<DivisionLayer>(name);
}

IConnectableLayer* Network::AddSubtractionLayer(const char* name)
{
    return m_Graph->AddLayer<SubtractionLayer>(name);
}

IConnectableLayer* Network::AddMeanLayer(const MeanDescriptor& meanDescriptor, const char* name)
{
    return m_Graph->AddLayer<MeanLayer>(meanDescriptor, name);
}

IConnectableLayer* Network::AddPadLayer(const PadDescriptor& padDescriptor, const char* name)
{
    return m_Graph->AddLayer<PadLayer>(padDescriptor, name);
}

IConnectableLayer* Network::AddQuantizeLayer(const char* name)
{
    return m_Graph->AddLayer<QuantizeLayer>(name);
}

IConnectableLayer* Network::AddDequantizeLayer(const char* name)
{
    return m_Graph->AddLayer<DequantizeLayer>(name);
}

IConnectableLayer* Network::AddStridedSliceLayer(const StridedSliceDescriptor& stridedSliceDescriptor,
                                                 const char* name)
{
    return m_Graph->AddLayer<StridedSliceLayer>(stridedSliceDescriptor, name);
}

IConnectableLayer* Network::AddGreaterLayer(const char* name)
{
    return AddComparisonLayer(ComparisonDescriptor(ComparisonOperation::Greater), name);
}

IConnectableLayer* Network::AddEqualLayer(const char* name)
{
    return AddComparisonLayer(ComparisonDescriptor(ComparisonOperation::Equal), name);
}

IConnectableLayer* Network::AddRsqrtLayer(const char* name)
{
    return AddElementwiseUnaryLayer(ElementwiseUnaryDescriptor(UnaryOperation::Rsqrt), name);
}
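
// Note: AddGreaterLayer, AddEqualLayer, AddAbsLayer and AddRsqrtLayer survive
// only for API compatibility; each forwards to the generic comparison or
// elementwise-unary entry point with the matching operation, e.g.
//
//     network->AddComparisonLayer(ComparisonDescriptor(ComparisonOperation::Greater), "gt");
//
// creates the same layer as the deprecated AddGreaterLayer("gt").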

IConnectableLayer* Network::AddGatherLayer(const char* name)
{
    return m_Graph->AddLayer<GatherLayer>(name);
}

IConnectableLayer* Network::AddMergeLayer(const char* name)
{
    return m_Graph->AddLayer<MergeLayer>(name);
}

IConnectableLayer* Network::AddSwitchLayer(const char* name)
{
    return m_Graph->AddLayer<SwitchLayer>(name);
}

IConnectableLayer* Network::AddPreluLayer(const char* name)
{
    return m_Graph->AddLayer<PreluLayer>(name);
}

IConnectableLayer* Network::AddTransposeConvolution2dLayer(const TransposeConvolution2dDescriptor& descriptor,
                                                           const ConstTensor& weights,
                                                           const Optional<ConstTensor>& biases,
                                                           const char* name)
{
    if (descriptor.m_BiasEnabled && !biases.has_value())
    {
        throw InvalidArgumentException("AddTransposeConvolution2dLayer: Biases cannot be empty");
    }

    const auto layer = m_Graph->AddLayer<TransposeConvolution2dLayer>(descriptor, name);

    layer->m_Weight = std::make_unique<ScopedCpuTensorHandle>(weights);

    if (descriptor.m_BiasEnabled)
    {
        layer->m_Bias = std::make_unique<ScopedCpuTensorHandle>(biases.value());
    }

    return layer;
}
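
// Usage sketch (illustrative): transpose convolution follows the same pattern
// as AddConvolution2dLayer; an empty Optional is rejected only when the
// descriptor claims a bias. Buffers and values below are assumptions.
//
//     TransposeConvolution2dDescriptor deconvDesc;
//     deconvDesc.m_StrideX     = 2;
//     deconvDesc.m_StrideY     = 2;
//     deconvDesc.m_BiasEnabled = false;
//
//     ConstTensor deconvWeights(weightsInfo, weightsData); // hypothetical
//     network->AddTransposeConvolution2dLayer(deconvDesc, deconvWeights,
//                                             EmptyOptional(), "deconv1");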

IConnectableLayer* Network::AddTransposeLayer(const TransposeDescriptor& transposeDescriptor,
                                              const char* name)
{
    return m_Graph->AddLayer<TransposeLayer>(transposeDescriptor, name);
}

IConnectableLayer* Network::AddStackLayer(const StackDescriptor& stackDescriptor,
                                          const char* name)
{
    return m_Graph->AddLayer<StackLayer>(stackDescriptor, name);
}

IConnectableLayer* Network::AddStandInLayer(const StandInDescriptor& desc,
                                            const char* name)
{
    return m_Graph->AddLayer<StandInLayer>(desc, name);
}
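
// Note: a StandInLayer is a placeholder for an operation ArmNN itself cannot
// execute; the descriptor only records the number of inputs and outputs, and
// the expectation is that a backend recognises the layer and substitutes its
// own implementation during optimization.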

IConnectableLayer* Network::AddQuantizedLstmLayer(const QuantizedLstmInputParams& params,
                                                  const char* name)
{
    const auto layer = m_Graph->AddLayer<QuantizedLstmLayer>(name);

    // InputToX weights
    layer->m_QuantizedLstmParameters.m_InputToInputWeights =
        std::make_unique<ScopedCpuTensorHandle>(params.GetInputToInputWeights());
    layer->m_QuantizedLstmParameters.m_InputToForgetWeights =
        std::make_unique<ScopedCpuTensorHandle>(params.GetInputToForgetWeights());
    layer->m_QuantizedLstmParameters.m_InputToCellWeights =
        std::make_unique<ScopedCpuTensorHandle>(params.GetInputToCellWeights());
    layer->m_QuantizedLstmParameters.m_InputToOutputWeights =
        std::make_unique<ScopedCpuTensorHandle>(params.GetInputToOutputWeights());

    // RecurrentToX weights
    layer->m_QuantizedLstmParameters.m_RecurrentToInputWeights =
        std::make_unique<ScopedCpuTensorHandle>(params.GetRecurrentToInputWeights());
    layer->m_QuantizedLstmParameters.m_RecurrentToForgetWeights =
        std::make_unique<ScopedCpuTensorHandle>(params.GetRecurrentToForgetWeights());
    layer->m_QuantizedLstmParameters.m_RecurrentToCellWeights =
        std::make_unique<ScopedCpuTensorHandle>(params.GetRecurrentToCellWeights());
    layer->m_QuantizedLstmParameters.m_RecurrentToOutputWeights =
        std::make_unique<ScopedCpuTensorHandle>(params.GetRecurrentToOutputWeights());

    // Bias
    layer->m_QuantizedLstmParameters.m_InputGateBias =
        std::make_unique<ScopedCpuTensorHandle>(params.GetInputGateBias());
    layer->m_QuantizedLstmParameters.m_ForgetGateBias =
        std::make_unique<ScopedCpuTensorHandle>(params.GetForgetGateBias());
    layer->m_QuantizedLstmParameters.m_CellBias =
        std::make_unique<ScopedCpuTensorHandle>(params.GetCellBias());
    layer->m_QuantizedLstmParameters.m_OutputGateBias =
        std::make_unique<ScopedCpuTensorHandle>(params.GetOutputGateBias());

    return layer;
}
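
// Note: unlike the pointer-based LstmInputParams, QuantizedLstmInputParams is
// accessed through getters here, so no explicit null checks appear in this
// function; the getters themselves are expected to reject missing tensors
// (in current headers they throw InvalidArgumentException when a parameter
// was never set).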

IConnectableLayer* Network::AddQLstmLayer(const QLstmDescriptor& descriptor,
                                          const LstmInputParams& params,
                                          const char* name)
{
    const auto layer = m_Graph->AddLayer<QLstmLayer>(descriptor, name);

    // QLstm Basic Parameters
    layer->m_BasicParameters.m_InputToForgetWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputToForgetWeights));
    layer->m_BasicParameters.m_InputToCellWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputToCellWeights));
    layer->m_BasicParameters.m_InputToOutputWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputToOutputWeights));
    layer->m_BasicParameters.m_RecurrentToForgetWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_RecurrentToForgetWeights));
    layer->m_BasicParameters.m_RecurrentToCellWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_RecurrentToCellWeights));
    layer->m_BasicParameters.m_RecurrentToOutputWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_RecurrentToOutputWeights));
    layer->m_BasicParameters.m_ForgetGateBias =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_ForgetGateBias));
    layer->m_BasicParameters.m_CellBias =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellBias));
    layer->m_BasicParameters.m_OutputGateBias =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_OutputGateBias));

    // QLstm Cifg parameters
    if (!descriptor.m_CifgEnabled)
    {
        if (params.m_InputToInputWeights == nullptr)
        {
            throw InvalidArgumentException("AddQLstmLayer: Input To Input Weights cannot be NULL");
        }

        if (params.m_RecurrentToInputWeights == nullptr)
        {
            throw InvalidArgumentException(
                "AddQLstmLayer: Recurrent To Input Weights cannot be NULL");
        }

        if (params.m_InputGateBias == nullptr)
        {
            throw InvalidArgumentException("AddQLstmLayer: Input Gate Bias cannot be NULL");
        }

        layer->m_CifgParameters.m_InputToInputWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputToInputWeights));
        layer->m_CifgParameters.m_RecurrentToInputWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_RecurrentToInputWeights));
        layer->m_CifgParameters.m_InputGateBias =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputGateBias));
    }

    // QLstm Projection parameters
    if (descriptor.m_ProjectionEnabled)
    {
        if (params.m_ProjectionWeights == nullptr)
        {
            throw InvalidArgumentException("AddQLstmLayer: Projection Weights cannot be NULL");
        }

        if (params.m_ProjectionBias == nullptr)
        {
            throw InvalidArgumentException("AddQLstmLayer: Projection Biases cannot be NULL");
        }

        layer->m_ProjectionParameters.m_ProjectionWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_ProjectionWeights));
        layer->m_ProjectionParameters.m_ProjectionBias =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_ProjectionBias));
    }

    // QLstm Peephole params
    if (descriptor.m_PeepholeEnabled)
    {
        if (params.m_CellToForgetWeights == nullptr)
        {
            throw InvalidArgumentException("AddQLstmLayer: Cell To Forget Weights cannot be NULL");
        }

        if (params.m_CellToOutputWeights == nullptr)
        {
            throw InvalidArgumentException("AddQLstmLayer: Cell To Output Weights cannot be NULL");
        }

        if (!descriptor.m_CifgEnabled)
        {
            if (params.m_CellToInputWeights == nullptr)
            {
                throw InvalidArgumentException("AddQLstmLayer: Cell To Input Weights cannot be NULL");
            }

            layer->m_PeepholeParameters.m_CellToInputWeights =
                std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellToInputWeights));
        }

        layer->m_PeepholeParameters.m_CellToForgetWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellToForgetWeights));
        layer->m_PeepholeParameters.m_CellToOutputWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellToOutputWeights));
    }

    // QLstm Layer Normalization params
    if (descriptor.m_LayerNormEnabled)
    {
        if (params.m_ForgetLayerNormWeights == nullptr)
        {
            throw InvalidArgumentException("AddQLstmLayer: Forget layer normalization weights cannot be NULL");
        }

        if (params.m_CellLayerNormWeights == nullptr)
        {
            throw InvalidArgumentException("AddQLstmLayer: Cell layer normalization weights cannot be NULL");
        }

        if (params.m_OutputLayerNormWeights == nullptr)
        {
            throw InvalidArgumentException("AddQLstmLayer: Output layer normalization weights cannot be NULL");
        }

        if (!descriptor.m_CifgEnabled)
        {
            if (params.m_InputLayerNormWeights == nullptr)
            {
                throw InvalidArgumentException("AddQLstmLayer: Input layer normalization weights cannot be NULL");
            }

            layer->m_LayerNormParameters.m_InputLayerNormWeights =
                std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputLayerNormWeights));
        }

        layer->m_LayerNormParameters.m_ForgetLayerNormWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_ForgetLayerNormWeights));
        layer->m_LayerNormParameters.m_CellLayerNormWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellLayerNormWeights));
        layer->m_LayerNormParameters.m_OutputLayerNormWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_OutputLayerNormWeights));
    }

    return layer;
}
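
// Note: AddQLstmLayer shares the LstmInputParams validation style of
// AddLstmLayer, with one behavioural difference worth flagging: when
// projection is enabled the projection bias is mandatory here, whereas the
// float LSTM above treats it as optional.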

void Network::Accept(ILayerVisitor& visitor) const
{
    for (auto layer : GetGraph())
    {
        layer->Accept(visitor);
    }
}
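
// Usage sketch (illustrative): any ILayerVisitor implementation can walk the
// graph through Accept. The visitor type below is hypothetical.
//
//     class ConvCounter : public LayerVisitorBase<VisitorNoThrowPolicy>
//     {
//     public:
//         void VisitConvolution2dLayer(const IConnectableLayer*,
//                                      const Convolution2dDescriptor&,
//                                      const ConstTensor&,
//                                      const Optional<ConstTensor>&,
//                                      const char*) override { ++m_ConvCount; }
//         unsigned int m_ConvCount = 0;
//     };
//
//     ConvCounter counter;
//     network->Accept(counter);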

OptimizedNetwork::OptimizedNetwork(std::unique_ptr<Graph> graph)
    : m_Graph(std::move(graph)), m_Guid(profiling::ProfilingService::GetNextGuid())
{
}

OptimizedNetwork::~OptimizedNetwork()
{
}

} // namespace armnn