Blame - src/armnnCaffeParser/CaffeParser.cpp - ml/armnn

2018-03-09 14:13:49 +0000

[diff] [blame]

2

David Beck

ecb56cd

2018-09-05 12:52:57 +0100

[diff] [blame]

3

// SPDX-License-Identifier: MIT

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

4

//

5

#include "CaffeParser.hpp"

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

6

#include "RecordByRecordCaffeParser.hpp"

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

7

Matthew Sloyan

ac001ee

2021-02-03 10:43:04 +0000

[diff] [blame]

8

#include "armnnCaffeParser/Version.hpp"

9

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

10

#include "armnn/Descriptors.hpp"

11

#include "armnn/INetwork.hpp"

12

#include "armnn/Utils.hpp"

13

#include "armnn/Exceptions.hpp"

14

15

#include "GraphTopologicalSort.hpp"

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

16

#include "VerificationHelpers.hpp"

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

17

Narumol Prangnawarat

2020-04-01 16:51:23 +0100

[diff] [blame]

18

#include <armnn/utility/Assert.hpp>

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

19

#include <armnn/utility/NumericCast.hpp>

Narumol Prangnawarat

2020-04-01 16:51:23 +0100

[diff] [blame]

20

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

21

#include <fmt/format.h>

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

22

23

// Caffe

24

#include "caffe/proto/caffe.pb.h"

25

26

// ProtoBuf

27

#include <google/protobuf/io/coded_stream.h>

28

#include <google/protobuf/io/zero_copy_stream.h>

29

#include <google/protobuf/io/zero_copy_stream_impl.h>

30

#include <google/protobuf/text_format.h>

31

#include <google/protobuf/stubs/common.h>

32

#include <google/protobuf/stubs/once.h>

33

#include <google/protobuf/io/coded_stream.h>

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

34

#include <google/protobuf/descriptor.h>

35

#include <google/protobuf/generated_message_reflection.h>

36

#include <google/protobuf/reflection_ops.h>

37

#include <google/protobuf/wire_format.h>

38

39

#include <cmath>

Matthew Sloyan

ac001ee

2021-02-03 10:43:04 +0000

[diff] [blame]

40

#include <iostream>

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

#include <sstream>

#include <queue>

#include <fcntl.h>

/// Caffe networks are loaded from protobuf files (binary or text) using the protobuf library and the generated

46

/// code from caffe.pb.h. This gives us a caffe::NetParameter which is an in-memory version of the file.

47

/// This contains a flat list of Caffe 'layers' (e.g. convolution, pooling etc.).

48

/// Each layer has inputs (called "bottoms") and outputs (called "tops"). Data flows from bottom to top.

49

/// The bottoms of a layer refer to the tops of other layers, not their names.

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

50

/// The names of layers seem to be arbitrary (you could rename a layer and the network wouldn't

51

/// need any other changes).

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

52

///

53

/// Some layers (e.g. Relu) can be configured so that their top and bottom are both the same. This is called an

54

/// "in-place" layer and is a Caffe runtime feature used to reduce memory usage by modifying tensors in-place.

55

/// This isn't relevant to the parser and so we preprocess these layers to convert them to regular layers, to result

56

/// in a consistent graph structure.

57

58

namespace armnnCaffeParser

59

{

60

61

using namespace armnn;

62

using namespace caffe;

63

using namespace std;

64

using namespace google::protobuf::io;

65

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

66

ICaffeParser::ICaffeParser() : pCaffeParserImpl(new RecordByRecordCaffeParser()) {}

67

68

ICaffeParser::~ICaffeParser() = default;

69

70

ICaffeParser* ICaffeParser::CreateRaw()

71

{

72

return new ICaffeParser();

73

}

74

75

ICaffeParserPtr ICaffeParser::Create()

76

{

77

return ICaffeParserPtr(CreateRaw(), &ICaffeParser::Destroy);

78

}

79

80

void ICaffeParser::Destroy(ICaffeParser* parser)

{

delete parser;

}

armnn::INetworkPtr ICaffeParser::CreateNetworkFromTextFile(

86

const char* graphFile,

87

const std::map<std::string, armnn::TensorShape>& inputShapes,

88

const std::vector<std::string>& requestedOutputs)

89

{

90

return pCaffeParserImpl->CreateNetworkFromTextFile(graphFile, inputShapes, requestedOutputs);

91

}

92

93

armnn::INetworkPtr ICaffeParser::CreateNetworkFromBinaryFile(

94

const char* graphFile,

95

const std::map<std::string, armnn::TensorShape>& inputShapes,

96

const std::vector<std::string>& requestedOutputs)

97

{

98

return pCaffeParserImpl->CreateNetworkFromBinaryFile(graphFile, inputShapes,requestedOutputs);

99

}

100

101

armnn::INetworkPtr ICaffeParser::CreateNetworkFromString(

102

const char* protoText,

103

const std::map<std::string, armnn::TensorShape>& inputShapes,

104

const std::vector<std::string>& requestedOutputs)

105

{

106

return pCaffeParserImpl->CreateNetworkFromString(protoText, inputShapes, requestedOutputs);

107

}

108

109

BindingPointInfo ICaffeParser::GetNetworkInputBindingInfo(const std::string& name) const

110

{

111

return pCaffeParserImpl->GetNetworkInputBindingInfo(name);

112

}

113

114

BindingPointInfo ICaffeParser::GetNetworkOutputBindingInfo(const std::string& name) const

115

{

116

return pCaffeParserImpl->GetNetworkOutputBindingInfo(name);

117

}

118

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

119

namespace

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

120

{

121

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

122

const float* GetArrayPtrFromBlob(const LayerParameter& layerParam, unsigned int blobIndex)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

123

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

124

auto nBlobs = layerParam.blobs_size();

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

125

if (blobIndex >= armnn::numeric_cast<unsigned int>(nBlobs))

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

126

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

127

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

128

fmt::format("Expected data blob at index {} in layer {} not found. nBlobs={}. {}",

blobIndex,

layerParam.name(),

nBlobs,

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

133

}

134

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

135

const BlobProto& blob = layerParam.blobs(armnn::numeric_cast<int>(blobIndex));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

136

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

137

const float* arrayPtr = blob.data().data();

return arrayPtr;

}

void GetDataFromBlob(const LayerParameter& layerParam, vector<float>& outData, unsigned int blobIndex)

142

{

143

auto nBlobs = layerParam.blobs_size();

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

144

if (blobIndex >= armnn::numeric_cast<unsigned int>(nBlobs))

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

145

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

146

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

147

fmt::format("Expected data blob at index {} in layer {} not found. {}",

148

blobIndex,

149

layerParam.name(),

150

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

151

}

152

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

153

const BlobProto& blob = layerParam.blobs(armnn::numeric_cast<int>(blobIndex));

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

154

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

155

size_t blobSize = armnn::numeric_cast<size_t>(blob.data_size());

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

156

if (blobSize != outData.size())

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

157

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

158

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

159

fmt::format("Data blob at index {} in layer {} has an unexpected size. "

160

"Expected {} elements but got {} elements. {}",

blobIndex,

layerParam.name(),

outData.size(),

blobSize,

CHECK_LOCATION().AsString()));

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

166

}

167

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

168

int outSizeInt = armnn::numeric_cast<int>(outData.size());

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

169

for (int i = 0; i < outSizeInt; ++i)

170

{

171

outData[static_cast<size_t>(i)] = blob.data(i);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

}

}

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

175

template <typename T>

176

size_t SizeOfVectorData(const vector<T>& vec)

177

{

178

return vec.size() * sizeof(T);

179

}

180

181

void ValidateNumInputsOutputs(const caffe::LayerParameter& layerParameter,

182

unsigned int numInputs,

183

unsigned int numOutputs)

184

{

185

int numInputsActual = layerParameter.bottom_size();

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

186

if (numInputs != armnn::numeric_cast<unsigned int>(numInputsActual))

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

187

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

188

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

189

fmt::format("Invalid number of inputs requested {} for layer {} "

190

"while only {} present. {}",

191

numInputs,

192

layerParameter.name(),

193

numInputsActual,

194

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

195

}

196

197

int numOutputsActual = layerParameter.top_size();

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

198

if (numOutputs != armnn::numeric_cast<unsigned int>(numOutputsActual))

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

199

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

200

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

201

fmt::format("Invalid number of outputs requested {} for layer {} "

202

"while only {} present. {}",

203

numOutputs,

204

layerParameter.name(),

205

numOutputsActual,

206

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

}

}

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

210

template <typename ParamType, typename ExtractOptional, typename ExtractFallback, typename ValueType>

211

ValueType GetOptionalWithFallback(const ParamType& param,

212

ExtractOptional extractOptional,

213

ExtractFallback extractFallback,

214

ValueType defaultValue)

215

{

216

auto optValue = extractOptional(param, defaultValue);

217

if (optValue.first)

218

{

219

return optValue.second;

220

}

221

auto fallbackValue = extractFallback(param, defaultValue);

222

return fallbackValue.second;

223

}

224

225

#define GET_OPTIONAL_WITH_VECTOR_FALLBACK(PARAM, \

PARAM_TYPE, \

OPTIONAL_VALUE, \

FALLBACK_VECTOR, \

VALUE_TYPE, \

DEFAULT_VALUE) \

GetOptionalWithFallback( \

232

PARAM, \

233

[](const PARAM_TYPE & param, VALUE_TYPE defaultValue) \

234

{ \

235

if (param.has_##OPTIONAL_VALUE ()) \

236

{ \

237

return std::make_pair(true, param.OPTIONAL_VALUE ()); \

} \

else \

{ \

return std::make_pair(false, defaultValue); \

242

} \

243

}, \

244

[](const PARAM_TYPE & param, VALUE_TYPE defaultValue) \

245

{ \

246

if (param.FALLBACK_VECTOR##_size() > 0) \

247

{ \

248

return std::make_pair(true, (param.FALLBACK_VECTOR ()).Get(0)); \

} \

else \

{ \

return std::make_pair(false, defaultValue); \

} \

}, \

DEFAULT_VALUE)

#define GET_OPTIONAL_WITH_FALLBACK(PARAM, \

PARAM_TYPE, \

OPTIONAL_VALUE, \

FALLBACK_VALUE, \

VALUE_TYPE, \

DEFAULT_VALUE) \

GetOptionalWithFallback( \

264

PARAM, \

265

[](const PARAM_TYPE & param, VALUE_TYPE defaultValue) \

266

{ \

267

if (param.has_##OPTIONAL_VALUE ()) \

268

{ \

269

return std::make_pair(true, param.OPTIONAL_VALUE ()); \

} \

else \

{ \

return std::make_pair(false, defaultValue); \

274

} \

275

}, \

276

[](const PARAM_TYPE & param, VALUE_TYPE defaultValue) \

277

{ \

278

if (param.has_##FALLBACK_VALUE ()) \

279

{ \

280

return std::make_pair(true, param.FALLBACK_VALUE ()); \

} \

else \

{ \

return std::make_pair(false, defaultValue); \

} \

}, \

DEFAULT_VALUE)

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

289

} // namespace <anonymous>

290

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

291

const std::map<std::string, ICaffeParser::CaffeParserImpl::OperationParsingFunction>

292

ICaffeParser::CaffeParserImpl::ms_CaffeLayerNameToParsingFunctions = {

293

{ "Input", &CaffeParserImpl::ParseInputLayer },

294

{ "Convolution", &CaffeParserImpl::ParseConvLayer },

295

{ "Deconvolution",&CaffeParserImpl::ParseDeconvLayer },

296

{ "Pooling", &CaffeParserImpl::ParsePoolingLayer },

297

{ "ReLU", &CaffeParserImpl::ParseReluLayer },

298

{ "LRN", &CaffeParserImpl::ParseLRNLayer },

299

{ "InnerProduct", &CaffeParserImpl::ParseInnerProductLayer },

300

{ "Softmax", &CaffeParserImpl::ParseSoftmaxLayer },

301

{ "Eltwise", &CaffeParserImpl::ParseEltwiseLayer },

302

{ "Concat", &CaffeParserImpl::ParseConcatLayer },

303

{ "BatchNorm", &CaffeParserImpl::ParseBatchNormLayer },

304

{ "Scale", &CaffeParserImpl::ParseScaleLayer },

305

{ "Split", &CaffeParserImpl::ParseSplitLayer },

306

{ "Dropout", &CaffeParserImpl::ParseDropoutLayer},

307

{ "ArgMax", &CaffeParserImpl::ParseArgmaxLayer},

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

308

};

309

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

310

ICaffeParser::CaffeParserImpl::CaffeParserImpl()

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

311

: m_Network(nullptr, nullptr)

{

}

CaffeParser::CaffeParser()

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

317

: CaffeParserImpl()

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

{

}

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

322

BindingPointInfo ICaffeParser::CaffeParserImpl::GetNetworkInputBindingInfo(const std::string& name) const

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

323

{

324

return GetBindingInfo(name, "input", m_NetworkInputsBindingInfo);

325

}

326

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

327

BindingPointInfo ICaffeParser::CaffeParserImpl::GetNetworkOutputBindingInfo(const std::string& name) const

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

328

{

329

return GetBindingInfo(name, "output", m_NetworkOutputsBindingInfo);

330

}

331

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

332

std::pair<armnn::LayerBindingId, armnn::TensorInfo> ICaffeParser::CaffeParserImpl::GetBindingInfo(

333

const std::string& layerName,

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

334

const char* bindingPointDesc,

335

const std::unordered_map<std::string, BindingPointInfo>& nameToBindingInfo)

336

{

337

auto it = nameToBindingInfo.find(layerName);

338

if (it == nameToBindingInfo.end())

339

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

340

throw InvalidArgumentException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

341

fmt::format("Unknown binding {} for layer '{}'. {}",

342

bindingPointDesc,

343

layerName,

344

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

}

return it->second;

}

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

349

TensorInfo ICaffeParser::CaffeParserImpl::BlobShapeToTensorInfo(const caffe::BlobShape& blobShape) const

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

350

{

351

std::vector<unsigned int> shape;

352

for (int j = 0; j < blobShape.dim_size(); ++j)

353

{

354

shape.push_back(static_cast<unsigned int>(blobShape.dim(j)));

355

}

356

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

357

return TensorInfo(armnn::numeric_cast<unsigned int>(shape.size()), shape.data(), DataType::Float32);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

358

}

359

360

BlobShape TensorDescToBlobShape(const TensorInfo& desc)

361

{

362

BlobShape ret;

363

for (unsigned int i = 0; i < desc.GetNumDimensions(); ++i)

364

{

365

ret.add_dim(i);

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

366

ret.set_dim(armnn::numeric_cast<int>(i), desc.GetShape()[i]);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

}

return ret;

}

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

372

// Note: can move to CaffeParser when/if we optimise the text/string format

373

// to load on a layer by layer basis

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

374

vector<const LayerParameter*> ICaffeParser::CaffeParserImpl::GetInputs(const LayerParameter& layerParam)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

375

{

376

std::vector<const caffe::LayerParameter*> ret;

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

377

ret.reserve(armnn::numeric_cast<size_t>(layerParam.bottom_size()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

378

for (int j = 0; j < layerParam.bottom_size(); ++j)

379

{

380

std::string inputName = layerParam.bottom(j);

381

auto inputIt = m_CaffeLayersByTopName.find(inputName);

382

if (inputIt == m_CaffeLayersByTopName.end())

383

{

384

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

385

fmt::format("Can't find Caffe layer with top called '{}', "

386

"which is listed as an input of '{}'. {}",

387

inputName,

388

layerParam.name(),

389

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

390

}

391

ret.push_back(inputIt->second);

}

return ret;

}

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

397

void ICaffeParser::CaffeParserImpl::ParseInputLayer(const LayerParameter& layerParam)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

398

{

Narumol Prangnawarat

2020-04-01 16:51:23 +0100

[diff] [blame]

399

ARMNN_ASSERT(layerParam.type() == "Input");

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

400

ValidateNumInputsOutputs(layerParam, 0, 1);

401

402

const InputParameter& param = layerParam.input_param();

403

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

404

const armnn::LayerBindingId inputId = armnn::numeric_cast<armnn::LayerBindingId>(

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

405

m_NetworkInputsBindingInfo.size());

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

406

armnn::IConnectableLayer* const inputLayer = m_Network->AddInputLayer(inputId, layerParam.name().c_str());

407

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

408

// Decides the tensor info for this input. This can be specified in the Caffe network but can also

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

409

// be overriden by user input (m_inputShapes).

410

armnn::TensorInfo inputTensorInfo;

411

412

const BlobShape* originalShape = param.shape_size() > 0 && param.shape(0).dim_size() > 0 ?

413

&param.shape(0) : nullptr;

414

if (originalShape)

415

{

416

inputTensorInfo = BlobShapeToTensorInfo(*originalShape);

417

}

418

419

auto overrideIt = m_InputShapes.find(layerParam.name());

420

if (overrideIt != m_InputShapes.end())

421

{

422

const TensorShape& overrideShape = overrideIt->second;

423

if (originalShape &&

424

( originalShape->dim(1) != overrideShape[1]

425

|| originalShape->dim(2) != overrideShape[2]

426

|| originalShape->dim(3) != overrideShape[3]))

427

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

428

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

429

fmt::format("Parsed input shape for '{}' is incompatible with the override provided. {}",

430

layerParam.name(),

431

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

432

}

433

inputTensorInfo.SetShape(overrideShape);

434

}

435

else if (!originalShape)

436

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

437

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

438

fmt::format("No input descriptor given for '{}' and no input shape found in caffe model. {}",

439

layerParam.name(),

440

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

441

}

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

442

TrackInputBinding(inputLayer, inputId, inputTensorInfo);

443

inputLayer->GetOutputSlot(0).SetTensorInfo(inputTensorInfo);

444

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), inputLayer->GetOutputSlot(0));

445

}

446

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

447

void ICaffeParser::CaffeParserImpl::AddConvLayerWithSplits(const caffe::LayerParameter& layerParam,

448

const armnn::Convolution2dDescriptor& desc,

449

unsigned int kernelW,

450

unsigned int kernelH)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

451

{

Narumol Prangnawarat

2020-04-01 16:51:23 +0100

[diff] [blame]

452

ARMNN_ASSERT(layerParam.type() == "Convolution");

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

453

ValidateNumInputsOutputs(layerParam, 1, 1);

454

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

455

ConvolutionParameter convParam = layerParam.convolution_param();

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

456

BlobShape inputShape = TensorDescToBlobShape(GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).GetTensorInfo());

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

457

const unsigned int numGroups = convParam.has_group() ? convParam.group() : 1;

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

458

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

459

// asusme these were already verified by the caller ParseConvLayer() function

Narumol Prangnawarat

2020-04-01 16:51:23 +0100

[diff] [blame]

460

ARMNN_ASSERT(numGroups < inputShape.dim(1));

461

ARMNN_ASSERT(numGroups > 1);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

462

463

// Handle grouping

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

464

armnn::IOutputSlot& inputConnection = GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0));

465

466

vector<string> convLayerNames(numGroups);

467

vector<armnn::IConnectableLayer*> convLayers(numGroups);

468

convLayerNames[0] = layerParam.name();

469

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

470

// This convolution is to be applied to chunks of the input data so add a splitter layer

471

472

// Redirect the convolution input to the splitter

473

unsigned int splitterDimSizes[4] = {static_cast<unsigned int>(inputShape.dim(0)),

474

static_cast<unsigned int>(inputShape.dim(1)),

475

static_cast<unsigned int>(inputShape.dim(2)),

476

static_cast<unsigned int>(inputShape.dim(3))};

477

478

// Split dimension 1 of the splitter output shape and conv input shapes

479

// according to the number of groups

480

481

splitterDimSizes[1] /= numGroups;

482

inputShape.set_dim(1, splitterDimSizes[1]);

483

484

// This is used to describe how the input is to be split

485

ViewsDescriptor splitterDesc(numGroups);

486

487

// Create an output node for each group, giving each a unique name

488

for (unsigned int g = 0; g < numGroups; ++g)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

489

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

490

// Work out the names of the splitter layers child convolutions

491

stringstream ss;

492

ss << layerParam.name() << "_" << g;

493

convLayerNames[g] = ss.str();

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

494

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

495

splitterDesc.SetViewOriginCoord(g, 1, splitterDimSizes[1] * g);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

496

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

497

// Set the size of the views.

498

for (unsigned int dimIdx=0; dimIdx < 4; dimIdx++)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

499

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

500

splitterDesc.SetViewSize(g, dimIdx, splitterDimSizes[dimIdx]);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

}

}

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

504

const std::string splitterLayerName = std::string("splitter_") + layerParam.bottom(0);

505

armnn::IConnectableLayer* splitterLayer = m_Network->AddSplitterLayer(splitterDesc, splitterLayerName.c_str());

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

506

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

507

inputConnection.Connect(splitterLayer->GetInputSlot(0));

508

for (unsigned int i = 0; i < splitterLayer->GetNumOutputSlots(); i++)

509

{

510

splitterLayer->GetOutputSlot(i).SetTensorInfo(BlobShapeToTensorInfo(inputShape));

511

}

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

512

513

unsigned int numFilters = convParam.num_output();

514

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

515

// Populates convolution output tensor descriptor dimensions.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

516

BlobShape outputShape;

517

outputShape.add_dim(0);

518

outputShape.set_dim(0, inputShape.dim(0));

519

outputShape.add_dim(1);

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

520

// Ensures that dimension 1 of the convolution output is split according to the number of groups.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

521

outputShape.set_dim(1, numFilters / numGroups);

522

outputShape.add_dim(2);

523

outputShape.set_dim(

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

524

2, (static_cast<int>(

Keith Mok

2020-12-20 13:45:51 -0800

[diff] [blame]

525

static_cast<float>(inputShape.dim(2) + 2 * desc.m_PadBottom - (desc.m_DilationX * (kernelH - 1) + 1)) /

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

526

static_cast<float>(desc.m_StrideY)) + 1));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

527

outputShape.add_dim(3);

528

outputShape.set_dim(

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

529

3, (static_cast<int>(

Keith Mok

2020-12-20 13:45:51 -0800

[diff] [blame]

530

static_cast<float>(inputShape.dim(3) + 2 * desc.m_PadRight - (desc.m_DilationY * (kernelW - 1) + 1)) /

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

531

static_cast<float>(desc.m_StrideX)) + 1));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

532

533

// Load the weight data for ALL groups

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

534

vector<float> weightData(armnn::numeric_cast<size_t>(numGroups *

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

535

inputShape.dim(1) * // number of input channels

536

outputShape.dim(1) * // number of output channels

537

kernelH *

538

kernelW));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

539

GetDataFromBlob(layerParam, weightData, 0);

540

541

const unsigned int weightDimSizes[4] = {

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

542

static_cast<unsigned int>(outputShape.dim(1)),

543

static_cast<unsigned int>(inputShape.dim(1)),

544

kernelH,

545

kernelW};

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

546

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

547

TensorInfo biasInfo;

548

vector<float> biasData;

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

549

550

if (desc.m_BiasEnabled)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

551

{

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

552

biasData.resize(armnn::numeric_cast<size_t>(numGroups * outputShape.dim(1)), 1.f);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

553

GetDataFromBlob(layerParam, biasData, 1);

554

555

const unsigned int biasDimSizes[1] = {static_cast<unsigned int>(outputShape.dim(1))};

556

biasInfo = TensorInfo(1, biasDimSizes, DataType::Float32);

557

}

558

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

559

const unsigned int numWeightsPerGroup = armnn::numeric_cast<unsigned int>(weightData.size()) / numGroups;

560

const unsigned int numBiasesPerGroup = armnn::numeric_cast<unsigned int>(biasData.size()) / numGroups;

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

561

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

562

for (unsigned int g = 0; g < numGroups; ++g)

563

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

564

// Sets the slot index, group 0 should be connected to the 0th output of the splitter

565

// group 1 should be connected to the 1st output of the splitter.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

566

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

567

// Pulls out the weights for this group from that loaded from the model file earlier.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

568

ConstTensor weights(TensorInfo(4, weightDimSizes, DataType::Float32),

569

weightData.data() + numWeightsPerGroup * g);

570

571

IConnectableLayer* convLayer = nullptr;

Matteo Martincigh

2019-05-14 10:36:13 +0100

[diff] [blame]

572

Optional<ConstTensor> optionalBiases;

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

573

if (desc.m_BiasEnabled)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

574

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

575

// Pulls out the biases for this group from that loaded from the model file earlier.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

576

ConstTensor biases(biasInfo, biasData.data() + numBiasesPerGroup * g);

Matteo Martincigh

2019-05-14 10:36:13 +0100

[diff] [blame]

577

optionalBiases = Optional<ConstTensor>(biases);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

578

}

Matteo Martincigh

2019-05-14 10:36:13 +0100

[diff] [blame]

579

convLayer = m_Network->AddConvolution2dLayer(desc,

580

weights,

581

optionalBiases,

582

convLayerNames[g].c_str());

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

583

convLayers[g] = convLayer;

584

585

// If we have more than one group then the input to the nth convolution the splitter layer's nth output,

586

// otherwise it's the regular input to this layer.

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

587

armnn::IOutputSlot& splitterInputConnection =

588

splitterLayer ? splitterLayer->GetOutputSlot(g) : inputConnection;

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

589

splitterInputConnection.Connect(convLayer->GetInputSlot(0));

590

convLayer->GetOutputSlot(0).SetTensorInfo(BlobShapeToTensorInfo(outputShape));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

591

}

592

Jim Flynn

2019-05-22 14:24:13 +0100

[diff] [blame]

593

// If the convolution was performed in chunks, add a layer to concatenate the results

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

594

595

// The merge input shape matches that of the convolution output

Jim Flynn

2019-05-22 14:24:13 +0100

[diff] [blame]

596

unsigned int concatDimSizes[4] = {static_cast<unsigned int>(outputShape.dim(0)),

597

static_cast<unsigned int>(outputShape.dim(1)),

598

static_cast<unsigned int>(outputShape.dim(2)),

599

static_cast<unsigned int>(outputShape.dim(3))};

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

600

Jim Flynn

2019-05-22 14:24:13 +0100

[diff] [blame]

601

// This is used to describe how the input is to be concatenated

602

OriginsDescriptor concatDesc(numGroups);

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

603

604

// Now create an input node for each group, using the name from

605

// the output of the corresponding convolution

606

for (unsigned int g = 0; g < numGroups; ++g)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

607

{

Jim Flynn

2019-05-22 14:24:13 +0100

[diff] [blame]

608

concatDesc.SetViewOriginCoord(g, 1, concatDimSizes[1] * g);

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

609

}

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

610

Jim Flynn

2019-05-22 14:24:13 +0100

[diff] [blame]

611

// Make sure the output from the concat is the correct size to hold the data for all groups

612

concatDimSizes[1] *= numGroups;

613

outputShape.set_dim(1, concatDimSizes[1]);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

614

Jim Flynn

2019-05-22 14:24:13 +0100

[diff] [blame]

615

// Finally add the concat layer

616

IConnectableLayer* concatLayer = m_Network->AddConcatLayer(concatDesc, layerParam.name().c_str());

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

617

Jim Flynn

2019-05-22 14:24:13 +0100

[diff] [blame]

618

if (!concatLayer)

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

619

{

620

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

621

fmt::format("Failed to create final concat layer for Split+Convolution+Concat. "

622

"Layer={} #groups={} #filters={} {}",

layerParam.name(),

numGroups,

numFilters,

CHECK_LOCATION().AsString()));

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

627

}

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

628

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

629

for (unsigned int g = 0; g < numGroups; ++g)

630

{

Jim Flynn

2019-05-22 14:24:13 +0100

[diff] [blame]

631

convLayers[g]->GetOutputSlot(0).Connect(concatLayer->GetInputSlot(g));

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

632

}

Jim Flynn

2019-05-22 14:24:13 +0100

[diff] [blame]

633

concatLayer->GetOutputSlot(0).SetTensorInfo(armnn::TensorInfo(4, concatDimSizes, DataType::Float32));

634

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), concatLayer->GetOutputSlot(0));

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

635

}

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

636

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

637

void ICaffeParser::CaffeParserImpl::AddDeconvLayerWithSplits(const caffe::LayerParameter& layerParam,

638

const armnn::TransposeConvolution2dDescriptor& desc,

639

unsigned int kernelW,

640

unsigned int kernelH)

Keith Mok

9801b17

2020-12-20 19:47:25 -0800

[diff] [blame]

641

{

642

ARMNN_ASSERT(layerParam.type() == "Deconvolution");

643

ValidateNumInputsOutputs(layerParam, 1, 1);

644

645

ConvolutionParameter convParam = layerParam.convolution_param();

646

BlobShape inputShape = TensorDescToBlobShape(GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).GetTensorInfo());

647

const unsigned int numGroups = convParam.has_group() ? convParam.group() : 1;

648

649

// asusme these were already verified by the caller ParseDeconvLayer() function

650

ARMNN_ASSERT(numGroups <= inputShape.dim(1));

651

ARMNN_ASSERT(numGroups > 1);

652

653

// Handle grouping

654

armnn::IOutputSlot& inputConnection = GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0));

655

656

vector<string> convLayerNames(numGroups);

657

vector<armnn::IConnectableLayer*> convLayers(numGroups);

658

convLayerNames[0] = layerParam.name();

659

660

// This deconvolution is to be applied to chunks of the input data so add a splitter layer

661

662

// Redirect the deconvolution input to the splitter

663

unsigned int splitterDimSizes[4] = {static_cast<unsigned int>(inputShape.dim(0)),

664

static_cast<unsigned int>(inputShape.dim(1)),

665

static_cast<unsigned int>(inputShape.dim(2)),

666

static_cast<unsigned int>(inputShape.dim(3))};

667

668

// Split dimension 1 of the splitter output shape and deconv input shapes

669

// according to the number of groups

670

671

splitterDimSizes[1] /= numGroups;

672

inputShape.set_dim(1, splitterDimSizes[1]);

673

674

// This is used to describe how the input is to be split

675

ViewsDescriptor splitterDesc(numGroups);

676

677

// Create an output node for each group, giving each a unique name

678

for (unsigned int g = 0; g < numGroups; ++g)

679

{

680

// Work out the names of the splitter layers child deconvolutions

681

stringstream ss;

682

ss << layerParam.name() << "_" << g;

683

convLayerNames[g] = ss.str();

684

685

splitterDesc.SetViewOriginCoord(g, 1, splitterDimSizes[1] * g);

686

687

// Set the size of the views.

688

for (unsigned int dimIdx=0; dimIdx < 4; dimIdx++)

689

{

690

splitterDesc.SetViewSize(g, dimIdx, splitterDimSizes[dimIdx]);

}

}

const std::string splitterLayerName = std::string("splitter_") + layerParam.bottom(0);

695

armnn::IConnectableLayer* splitterLayer = m_Network->AddSplitterLayer(splitterDesc, splitterLayerName.c_str());

696

697

inputConnection.Connect(splitterLayer->GetInputSlot(0));

698

for (unsigned int i = 0; i < splitterLayer->GetNumOutputSlots(); i++)

699

{

700

splitterLayer->GetOutputSlot(i).SetTensorInfo(BlobShapeToTensorInfo(inputShape));

701

}

702

703

unsigned int numFilters = convParam.num_output();

704

705

// Populates deconvolution output tensor descriptor dimensions.

706

BlobShape outputShape;

707

outputShape.add_dim(0);

708

outputShape.set_dim(0, inputShape.dim(0));

709

outputShape.add_dim(1);

710

// Ensures that dimension 1 of the deconvolution output is split according to the number of groups.

711

outputShape.set_dim(1, numFilters / numGroups);

712

outputShape.add_dim(2);

713

outputShape.set_dim(

714

2, (static_cast<int>(

715

desc.m_StrideY * (inputShape.dim(2) - 1) - 2 * desc.m_PadBottom + kernelH)));

716

outputShape.add_dim(3);

717

outputShape.set_dim(

718

3, (static_cast<int>(

719

desc.m_StrideX * (inputShape.dim(3) - 1) - 2 * desc.m_PadRight + kernelW)));

720

721

// Load the weight data for ALL groups

722

vector<float> weightData(armnn::numeric_cast<size_t>(numGroups *

723

inputShape.dim(1) * // number of input channels

724

outputShape.dim(1) * // number of output channels

725

kernelH *

726

kernelW));

727

GetDataFromBlob(layerParam, weightData, 0);

728

729

const unsigned int weightDimSizes[4] = {

730

static_cast<unsigned int>(outputShape.dim(1)),

731

static_cast<unsigned int>(inputShape.dim(1)),

kernelH,

kernelW};

TensorInfo biasInfo;

vector<float> biasData;

737

738

if (desc.m_BiasEnabled)

739

{

740

biasData.resize(armnn::numeric_cast<size_t>(numGroups * outputShape.dim(1)), 1.f);

741

GetDataFromBlob(layerParam, biasData, 1);

742

743

const unsigned int biasDimSizes[1] = {static_cast<unsigned int>(outputShape.dim(1))};

744

biasInfo = TensorInfo(1, biasDimSizes, DataType::Float32);

745

}

746

747

const unsigned int numWeightsPerGroup = armnn::numeric_cast<unsigned int>(weightData.size()) / numGroups;

748

const unsigned int numBiasesPerGroup = armnn::numeric_cast<unsigned int>(biasData.size()) / numGroups;

749

750

for (unsigned int g = 0; g < numGroups; ++g)

751

{

752

// Sets the slot index, group 0 should be connected to the 0th output of the splitter

753

// group 1 should be connected to the 1st output of the splitter.

754

755

// Pulls out the weights for this group from that loaded from the model file earlier.

756

ConstTensor weights(TensorInfo(4, weightDimSizes, DataType::Float32),

757

weightData.data() + numWeightsPerGroup * g);

758

759

IConnectableLayer* deconvLayer = nullptr;

760

Optional<ConstTensor> optionalBiases;

761

if (desc.m_BiasEnabled)

762

{

763

// Pulls out the biases for this group from that loaded from the model file earlier.

764

ConstTensor biases(biasInfo, biasData.data() + numBiasesPerGroup * g);

765

optionalBiases = Optional<ConstTensor>(biases);

766

}

767

deconvLayer = m_Network->AddTransposeConvolution2dLayer(desc,

768

weights,

769

optionalBiases,

770

convLayerNames[g].c_str());

771

convLayers[g] = deconvLayer;

772

773

// If we have more than one group then the input to the nth deconvolution the splitter layer's nth output,

774

// otherwise it's the regular input to this layer.

775

armnn::IOutputSlot& splitterInputConnection =

776

splitterLayer ? splitterLayer->GetOutputSlot(g) : inputConnection;

777

splitterInputConnection.Connect(deconvLayer->GetInputSlot(0));

778

deconvLayer->GetOutputSlot(0).SetTensorInfo(BlobShapeToTensorInfo(outputShape));

779

}

780

781

// If the deconvolution was performed in chunks, add a layer to concatenate the results

782

783

// The merge input shape matches that of the deconvolution output

784

unsigned int concatDimSizes[4] = {static_cast<unsigned int>(outputShape.dim(0)),

785

static_cast<unsigned int>(outputShape.dim(1)),

786

static_cast<unsigned int>(outputShape.dim(2)),

787

static_cast<unsigned int>(outputShape.dim(3))};

788

789

// This is used to describe how the input is to be concatenated

790

OriginsDescriptor concatDesc(numGroups);

791

792

// Now create an input node for each group, using the name from

793

// the output of the corresponding deconvolution

794

for (unsigned int g = 0; g < numGroups; ++g)

795

{

796

concatDesc.SetViewOriginCoord(g, 1, concatDimSizes[1] * g);

797

}

798

799

// Make sure the output from the concat is the correct size to hold the data for all groups

800

concatDimSizes[1] *= numGroups;

801

outputShape.set_dim(1, concatDimSizes[1]);

802

803

// Finally add the concat layer

804

IConnectableLayer* concatLayer = m_Network->AddConcatLayer(concatDesc, layerParam.name().c_str());

if (!concatLayer)

{

throw ParseException(

809

fmt::format("Failed to create final concat layer for Split+Deconvolution+Concat. "

810

"Layer={} #groups={} #filters={} {}",

layerParam.name(),

numGroups,

numFilters,

CHECK_LOCATION().AsString()));

815

}

816

817

for (unsigned int g = 0; g < numGroups; ++g)

818

{

819

convLayers[g]->GetOutputSlot(0).Connect(concatLayer->GetInputSlot(g));

820

}

821

concatLayer->GetOutputSlot(0).SetTensorInfo(armnn::TensorInfo(4, concatDimSizes, DataType::Float32));

822

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), concatLayer->GetOutputSlot(0));

823

}

824

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

825

void ICaffeParser::CaffeParserImpl::AddConvLayerWithDepthwiseConv(const caffe::LayerParameter& layerParam,

826

const armnn::Convolution2dDescriptor& convDesc,

827

unsigned int kernelW,

828

unsigned int kernelH)

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

829

{

Narumol Prangnawarat

2020-04-01 16:51:23 +0100

[diff] [blame]

830

ARMNN_ASSERT(layerParam.type() == "Convolution");

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

831

ValidateNumInputsOutputs(layerParam, 1, 1);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

832

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

833

ConvolutionParameter convParam = layerParam.convolution_param();

834

BlobShape inputShape = TensorDescToBlobShape(GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).GetTensorInfo());

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

835

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

836

DepthwiseConvolution2dDescriptor desc;

837

desc.m_PadLeft = convDesc.m_PadLeft;

838

desc.m_PadRight = convDesc.m_PadRight;

839

desc.m_PadTop = convDesc.m_PadTop;

840

desc.m_PadBottom = convDesc.m_PadBottom;

841

desc.m_StrideX = convDesc.m_StrideX;

842

desc.m_StrideY = convDesc.m_StrideY;

Keith Mok

2020-12-20 13:45:51 -0800

[diff] [blame]

843

desc.m_DilationX = convDesc.m_DilationX;

844

desc.m_DilationY = convDesc.m_DilationY;

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

845

desc.m_BiasEnabled = convDesc.m_BiasEnabled;

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

846

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

847

unsigned int numFilters = convParam.num_output();

848

849

BlobShape outputShape;

850

outputShape.add_dim(0);

851

outputShape.set_dim(0, inputShape.dim(0));

852

outputShape.add_dim(1);

853

outputShape.set_dim(1, numFilters);

854

outputShape.add_dim(2);

855

outputShape.set_dim(

856

2, (static_cast<int>(

Keith Mok

2020-12-20 13:45:51 -0800

[diff] [blame]

857

static_cast<float>(inputShape.dim(2) + 2 * desc.m_PadBottom - (desc.m_DilationX * (kernelH - 1) + 1)) /

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

858

static_cast<float>(desc.m_StrideY)) + 1));

859

outputShape.add_dim(3);

860

outputShape.set_dim(

861

3, (static_cast<int>(

Keith Mok

2020-12-20 13:45:51 -0800

[diff] [blame]

862

static_cast<float>(inputShape.dim(3) + 2 * desc.m_PadRight - (desc.m_DilationY * (kernelW - 1) + 1)) /

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

863

static_cast<float>(desc.m_StrideX)) + 1));

864

865

// Load the weight data

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

866

size_t allWeightsSize = armnn::numeric_cast<size_t>(inputShape.dim(1) * kernelH * kernelW);

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

867

vector<float> weightData(allWeightsSize);

868

869

GetDataFromBlob(layerParam, weightData, 0);

870

871

// depth multiplier will be 1 for the depthwise convolution

872

const unsigned int weightDimSizes[4] = {

873

static_cast<unsigned int>(1), // depth multiplier

874

static_cast<unsigned int>(inputShape.dim(1)), // #channels

kernelH,

kernelW};

armnn::IConnectableLayer* returnLayer = nullptr;

879

ConstTensor weights(TensorInfo(4, weightDimSizes, DataType::Float32), weightData.data());

Matteo Martincigh

2019-05-14 10:36:13 +0100

[diff] [blame]

880

Optional<ConstTensor> optionalBiases;

881

vector<float> biasData;

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

882

if (desc.m_BiasEnabled)

883

{

884

TensorInfo biasInfo;

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

885

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

886

biasData.resize(armnn::numeric_cast<size_t>(outputShape.dim(1)), 1.f);

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

887

GetDataFromBlob(layerParam, biasData, 1);

888

889

const unsigned int biasDimSizes[1] = {static_cast<unsigned int>(outputShape.dim(1))};

890

biasInfo = TensorInfo(1, biasDimSizes, DataType::Float32);

891

892

ConstTensor biases(biasInfo, biasData.data());

Matteo Martincigh

2019-05-14 10:36:13 +0100

[diff] [blame]

893

optionalBiases = Optional<ConstTensor>(biases);

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

894

}

Matteo Martincigh

2019-05-14 10:36:13 +0100

[diff] [blame]

895

returnLayer = m_Network->AddDepthwiseConvolution2dLayer(desc,

896

weights,

897

optionalBiases,

898

layerParam.name().c_str());

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

899

surmeh01

3537c2c

2018-05-18 16:31:43 +0100

[diff] [blame]

900

if (!returnLayer)

901

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

902

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

903

fmt::format("Failed to create depthwise convolution layer. "

904

"Layer={} #filters={} {}",

905

layerParam.name(),

906

numFilters,

907

CHECK_LOCATION().AsString()));

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

908

}

909

armnn::IOutputSlot& inputConnection = GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0));

910

inputConnection.Connect(returnLayer->GetInputSlot(0));

911

returnLayer->GetOutputSlot(0).SetTensorInfo(BlobShapeToTensorInfo(outputShape));

912

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), returnLayer->GetOutputSlot(0));

913

}

914

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

915

void ICaffeParser::CaffeParserImpl::ParseConvLayer(const LayerParameter& layerParam)

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

916

{

917

// Ignored Caffe Parameters

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

// * Weight Filler

// * Bias Filler

// * Engine

// * Force nd_im2col

// * Axis

// Not Available ArmNN Interface Parameters

925

// * Rounding policy;

926

Narumol Prangnawarat

2020-04-01 16:51:23 +0100

[diff] [blame]

927

ARMNN_ASSERT(layerParam.type() == "Convolution");

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

928

ValidateNumInputsOutputs(layerParam, 1, 1);

929

930

ConvolutionParameter convParam = layerParam.convolution_param();

931

BlobShape inputShape = TensorDescToBlobShape(GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).GetTensorInfo());

932

const unsigned int numGroups = convParam.has_group() ? convParam.group() : 1;

933

unsigned int numFilters = convParam.num_output();

934

935

const auto notFound = std::numeric_limits<unsigned int>::max();

936

937

unsigned int kernelH = GET_OPTIONAL_WITH_VECTOR_FALLBACK(convParam, ConvolutionParameter,

938

kernel_h, kernel_size, unsigned int, notFound);

939

unsigned int kernelW = GET_OPTIONAL_WITH_VECTOR_FALLBACK(convParam, ConvolutionParameter,

940

kernel_w, kernel_size, unsigned int, notFound);

941

942

unsigned int strideH = GET_OPTIONAL_WITH_VECTOR_FALLBACK(convParam, ConvolutionParameter,

943

stride_h, stride, unsigned int, 1u);

944

unsigned int strideW = GET_OPTIONAL_WITH_VECTOR_FALLBACK(convParam, ConvolutionParameter,

945

stride_w, stride, unsigned int, 1u);

946

947

unsigned int padH = GET_OPTIONAL_WITH_VECTOR_FALLBACK(convParam, ConvolutionParameter,

948

pad_h, pad, unsigned int, 0u);

949

unsigned int padW = GET_OPTIONAL_WITH_VECTOR_FALLBACK(convParam, ConvolutionParameter,

950

pad_w, pad, unsigned int, 0u);

951

Keith Mok

2020-12-20 13:45:51 -0800

[diff] [blame]

952

unsigned int dilationH = convParam.dilation_size() > 0 ? convParam.dilation(0) : 1;

953

unsigned int dilationW = convParam.dilation_size() > 1 ? convParam.dilation(1) :

954

convParam.dilation_size() > 0 ? convParam.dilation(0) : 1;

955

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

956

Convolution2dDescriptor convolution2dDescriptor;

957

convolution2dDescriptor.m_PadLeft = padW;

958

convolution2dDescriptor.m_PadRight = padW;

959

convolution2dDescriptor.m_PadTop = padH;

960

convolution2dDescriptor.m_PadBottom = padH;

961

convolution2dDescriptor.m_StrideX = strideW;

962

convolution2dDescriptor.m_StrideY = strideH;

Keith Mok

2020-12-20 13:45:51 -0800

[diff] [blame]

963

convolution2dDescriptor.m_DilationX = dilationW;

964

convolution2dDescriptor.m_DilationY = dilationH;

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

965

convolution2dDescriptor.m_BiasEnabled = convParam.has_bias_term() ? convParam.bias_term() : true;

966

967

if (numGroups > numFilters)

968

{

969

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

970

fmt::format("Error parsing Convolution: {}. "

971

"The 'group'={} parameter cannot be larger than the "

972

"number of filters supplied ='{}'. {}",

layerParam.name(),

numGroups,

numFilters,

CHECK_LOCATION().AsString()));

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

977

}

978

979

if (inputShape.dim_size() != 4)

980

{

981

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

982

fmt::format("Convolution input shape is expected to have 4 dimensions. "

983

"{}'s input has only {}. {}",

984

layerParam.name(),

985

inputShape.dim_size(),

986

CHECK_LOCATION().AsString()));

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

}

if (numGroups > 1)

{

if (numGroups > inputShape.dim(1))

992

{

993

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

994

fmt::format("Error parsing Convolution: {}. "

995

"The 'group'={} parameter cannot be larger than the "

996

"channel of the input shape={} (in NCHW format). {}",

layerParam.name(),

numGroups,

inputShape.dim(1),

CHECK_LOCATION().AsString()));

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1001

}

1002

else if (numGroups == inputShape.dim(1))

1003

{

1004

// we use a depthwise convolution here, because the number of groups equals to the

1005

// input channels

1006

AddConvLayerWithDepthwiseConv(layerParam, convolution2dDescriptor, kernelW, kernelH);

return;

}

else

{

// we split the input by channels into channels/groups separate convolutions

Jim Flynn

2019-05-22 14:24:13 +0100

[diff] [blame]

1012

// and concatenate the results afterwards

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1013

AddConvLayerWithSplits(layerParam, convolution2dDescriptor, kernelW, kernelH);

return;

}

}

// NOTE: at this point we only need to handle #group=1 case, all other cases should be

1019

// handled by the AddConvLayer* helpers

1020

1021

// Populate convolution output tensor descriptor dimensions

1022

BlobShape outputShape;

1023

outputShape.add_dim(0);

1024

outputShape.set_dim(0, inputShape.dim(0));

1025

outputShape.add_dim(1);

1026

outputShape.set_dim(1, numFilters);

1027

outputShape.add_dim(2);

1028

outputShape.set_dim(

1029

2, (static_cast<int>(

Keith Mok

2020-12-20 13:45:51 -0800

[diff] [blame]

1030

static_cast<float>(inputShape.dim(2) + 2 * padH - (dilationH * (kernelH - 1) + 1)) /

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1031

static_cast<float>(strideH)) + 1));

1032

outputShape.add_dim(3);

1033

outputShape.set_dim(

1034

3, (static_cast<int>(

Keith Mok

2020-12-20 13:45:51 -0800

[diff] [blame]

1035

static_cast<float>(inputShape.dim(3) + 2 * padW - (dilationW * (kernelW - 1) + 1)) /

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1036

static_cast<float>(strideW)) + 1));

1037

1038

// Load the weight data for ALL groups

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

1039

vector<float> weightData(armnn::numeric_cast<size_t>(inputShape.dim(1) *

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

outputShape.dim(1) *

kernelH *

kernelW));

GetDataFromBlob(layerParam, weightData, 0);

1044

1045

const unsigned int weightDimSizes[4] = {

1046

static_cast<unsigned int>(outputShape.dim(1)), // output channels

1047

static_cast<unsigned int>(inputShape.dim(1)), // input channels

kernelH,

kernelW};

armnn::IConnectableLayer* returnLayer = nullptr;

1052

1053

// Pull out the weights for this group from that loaded from the model file earlier

1054

ConstTensor weights(TensorInfo(4, weightDimSizes, DataType::Float32), weightData.data());

Matteo Martincigh

2019-05-14 10:36:13 +0100

[diff] [blame]

1055

Optional<ConstTensor> optionalBiases;

1056

vector<float> biasData;

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1057

if (convolution2dDescriptor.m_BiasEnabled)

1058

{

1059

TensorInfo biasInfo;

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1060

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

1061

biasData.resize(armnn::numeric_cast<size_t>(outputShape.dim(1)), 1.f);

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1062

GetDataFromBlob(layerParam, biasData, 1);

1063

1064

const unsigned int biasDimSizes[1] = {static_cast<unsigned int>(outputShape.dim(1))};

1065

biasInfo = TensorInfo(1, biasDimSizes, DataType::Float32);

1066

1067

// Pull out the biases for this group from that loaded from the model file earlier

1068

ConstTensor biases(biasInfo, biasData.data());

Matteo Martincigh

2019-05-14 10:36:13 +0100

[diff] [blame]

1069

optionalBiases = Optional<ConstTensor>(biases);

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1070

}

Matteo Martincigh

2019-05-14 10:36:13 +0100

[diff] [blame]

1071

returnLayer = m_Network->AddConvolution2dLayer(convolution2dDescriptor,

1072

weights,

1073

optionalBiases,

1074

layerParam.name().c_str());

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1075

1076

armnn::IOutputSlot& inputConnection = GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0));

1077

inputConnection.Connect(returnLayer->GetInputSlot(0));

1078

returnLayer->GetOutputSlot(0).SetTensorInfo(BlobShapeToTensorInfo(outputShape));

if (!returnLayer)

{

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1083

fmt::format("Failed to create Convolution layer. "

1084

"Layer={} #groups={} #filters={} {}",

layerParam.name(),

numGroups,

numFilters,

CHECK_LOCATION().AsString()));

surmeh01

3537c2c

2018-05-18 16:31:43 +0100

[diff] [blame]

1089

}

1090

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1091

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), returnLayer->GetOutputSlot(0));

1092

}

1093

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1094

void ICaffeParser::CaffeParserImpl::ParseDeconvLayer(const LayerParameter& layerParam)

Keith Mok

9801b17

2020-12-20 19:47:25 -0800

[diff] [blame]

1095

{

1096

// Ignored Caffe Parameters

// * Weight Filler

// * Bias Filler

// * Engine

// * Force nd_im2col

// * Axis

// Not Available ArmNN Interface Parameters

1104

// * Rounding policy;

1105

1106

ARMNN_ASSERT(layerParam.type() == "Deconvolution");

1107

ValidateNumInputsOutputs(layerParam, 1, 1);

1108

1109

ConvolutionParameter convParam = layerParam.convolution_param();

1110

BlobShape inputShape = TensorDescToBlobShape(GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).GetTensorInfo());

1111

const unsigned int numGroups = convParam.has_group() ? convParam.group() : 1;

1112

unsigned int numFilters = convParam.num_output();

1113

1114

const auto notFound = std::numeric_limits<unsigned int>::max();

1115

1116

unsigned int kernelH = GET_OPTIONAL_WITH_VECTOR_FALLBACK(convParam, ConvolutionParameter,

1117

kernel_h, kernel_size, unsigned int, notFound);

1118

unsigned int kernelW = GET_OPTIONAL_WITH_VECTOR_FALLBACK(convParam, ConvolutionParameter,

1119

kernel_w, kernel_size, unsigned int, notFound);

1120

1121

unsigned int strideH = GET_OPTIONAL_WITH_VECTOR_FALLBACK(convParam, ConvolutionParameter,

1122

stride_h, stride, unsigned int, 1u);

1123

unsigned int strideW = GET_OPTIONAL_WITH_VECTOR_FALLBACK(convParam, ConvolutionParameter,

1124

stride_w, stride, unsigned int, 1u);

1125

1126

unsigned int padH = GET_OPTIONAL_WITH_VECTOR_FALLBACK(convParam, ConvolutionParameter,

1127

pad_h, pad, unsigned int, 0u);

1128

unsigned int padW = GET_OPTIONAL_WITH_VECTOR_FALLBACK(convParam, ConvolutionParameter,

1129

pad_w, pad, unsigned int, 0u);

1130

1131

unsigned int dilationH = convParam.dilation_size() > 0 ? convParam.dilation(0) : 1;

1132

unsigned int dilationW = convParam.dilation_size() > 1 ? convParam.dilation(1) :

1133

convParam.dilation_size() > 0 ? convParam.dilation(0) : 1;

1134

1135

if (dilationH != 1 || dilationW != 1) {

1136

fmt::format("Dilated decnvolution is not supported. "

1137

"{}'s input has dilation {} {}. {}",

1138

layerParam.name(),

1139

dilationW, dilationH,

1140

CHECK_LOCATION().AsString());

1141

}

1142

1143

TransposeConvolution2dDescriptor deconvolution2dDescriptor;

1144

deconvolution2dDescriptor.m_PadLeft = padW;

1145

deconvolution2dDescriptor.m_PadRight = padW;

1146

deconvolution2dDescriptor.m_PadTop = padH;

1147

deconvolution2dDescriptor.m_PadBottom = padH;

1148

deconvolution2dDescriptor.m_StrideX = strideW;

1149

deconvolution2dDescriptor.m_StrideY = strideH;

1150

deconvolution2dDescriptor.m_BiasEnabled = convParam.has_bias_term() ? convParam.bias_term() : true;

1151

1152

if (numGroups > numFilters)

1153

{

1154

throw ParseException(

1155

fmt::format("Error parsing Deconvolution: {}. "

1156

"The 'group'={} parameter cannot be larger than the "

1157

"number of filters supplied ='{}'. {}",

layerParam.name(),

numGroups,

numFilters,

CHECK_LOCATION().AsString()));

1162

}

1163

1164

if (inputShape.dim_size() != 4)

1165

{

1166

throw ParseException(

1167

fmt::format("Deconvolution input shape is expected to have 4 dimensions. "

1168

"{}'s input has only {}. {}",

1169

layerParam.name(),

1170

inputShape.dim_size(),

1171

CHECK_LOCATION().AsString()));

}

if (numGroups > 1)

{

if (numGroups > inputShape.dim(1))

1177

{

1178

throw ParseException(

1179

fmt::format("Error parsing Deconvolution: {}. "

1180

"The 'group'={} parameter cannot be larger than the "

1181

"channel of the input shape={} (in NCHW format). {}",

layerParam.name(),

numGroups,

inputShape.dim(1),

CHECK_LOCATION().AsString()));

}

else

{

// we split the input by channels into channels/groups separate convolutions

1190

// and concatenate the results afterwards

1191

AddDeconvLayerWithSplits(layerParam, deconvolution2dDescriptor, kernelW, kernelH);

return;

}

}

// NOTE: at this point we only need to handle #group=1 case, all other cases should be

1197

// handled by the AddDeconvLayer* helpers

1198

1199

// Populate deconvolution output tensor descriptor dimensions

1200

BlobShape outputShape;

1201

outputShape.add_dim(0);

1202

outputShape.set_dim(0, inputShape.dim(0));

1203

outputShape.add_dim(1);

1204

outputShape.set_dim(1, numFilters);

1205

outputShape.add_dim(2);

1206

outputShape.set_dim(

1207

2, (static_cast<int>(

1208

strideH * (inputShape.dim(2) - 1) - 2 * padH + (dilationH * (kernelH - 1) + 1))));

1209

outputShape.add_dim(3);

1210

outputShape.set_dim(

1211

3, (static_cast<int>(

1212

strideW * (inputShape.dim(3) - 1) - 2 * padW + (dilationW * (kernelW - 1) + 1))));

1213

1214

// Load the weight data for ALL groups

1215

vector<float> weightData(armnn::numeric_cast<size_t>(inputShape.dim(1) *

outputShape.dim(1) *

kernelH *

kernelW));

GetDataFromBlob(layerParam, weightData, 0);

1220

1221

const unsigned int weightDimSizes[4] = {

1222

static_cast<unsigned int>(outputShape.dim(1)), // output channels

1223

static_cast<unsigned int>(inputShape.dim(1)), // input channels

kernelH,

kernelW};

armnn::IConnectableLayer* returnLayer = nullptr;

1228

1229

// Pull out the weights for this group from that loaded from the model file earlier

1230

ConstTensor weights(TensorInfo(4, weightDimSizes, DataType::Float32), weightData.data());

1231

Optional<ConstTensor> optionalBiases;

1232

vector<float> biasData;

1233

if (deconvolution2dDescriptor.m_BiasEnabled)

{

TensorInfo biasInfo;

biasData.resize(armnn::numeric_cast<size_t>(outputShape.dim(1)), 1.f);

1238

GetDataFromBlob(layerParam, biasData, 1);

1239

1240

const unsigned int biasDimSizes[1] = {static_cast<unsigned int>(outputShape.dim(1))};

1241

biasInfo = TensorInfo(1, biasDimSizes, DataType::Float32);

1242

1243

// Pull out the biases for this group from that loaded from the model file earlier

1244

ConstTensor biases(biasInfo, biasData.data());

1245

optionalBiases = Optional<ConstTensor>(biases);

1246

}

1247

returnLayer = m_Network->AddTransposeConvolution2dLayer(deconvolution2dDescriptor,

1248

weights,

1249

optionalBiases,

1250

layerParam.name().c_str());

1251

1252

armnn::IOutputSlot& inputConnection = GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0));

1253

inputConnection.Connect(returnLayer->GetInputSlot(0));

1254

returnLayer->GetOutputSlot(0).SetTensorInfo(BlobShapeToTensorInfo(outputShape));

if (!returnLayer)

{

throw ParseException(

1259

fmt::format("Failed to create Deconvolution layer. "

1260

"Layer={} #groups={} #filters={} {}",

layerParam.name(),

numGroups,

numFilters,

CHECK_LOCATION().AsString()));

1265

}

1266

1267

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), returnLayer->GetOutputSlot(0));

1268

}

1269

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1270

void ICaffeParser::CaffeParserImpl::ParsePoolingLayer(const LayerParameter& layerParam)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1271

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1272

// Ignored Caffe Parameters

1273

// Stochastic Pooling

1274

// Engine

1275

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1276

ValidateNumInputsOutputs(layerParam, 1, 1);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1277

PoolingParameter param = layerParam.pooling_param();

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1278

const TensorInfo& inputInfo = GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).GetTensorInfo();

1279

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1280

const auto notFound = std::numeric_limits<unsigned int>::max();

1281

1282

unsigned int kernel_h = GET_OPTIONAL_WITH_FALLBACK(param, PoolingParameter,

1283

kernel_h, kernel_size, unsigned int, notFound);

1284

unsigned int kernel_w = GET_OPTIONAL_WITH_FALLBACK(param, PoolingParameter,

1285

kernel_w, kernel_size, unsigned int, notFound);

1286

1287

if ((kernel_h == notFound || kernel_w == notFound) && param.has_global_pooling())

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1288

{

1289

kernel_h = inputInfo.GetShape()[2];

1290

kernel_w = inputInfo.GetShape()[3];

1291

}

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1292

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1293

unsigned int stride_h = GET_OPTIONAL_WITH_FALLBACK(param, PoolingParameter,

1294

stride_h, stride, unsigned int, notFound);

1295

unsigned int stride_w = GET_OPTIONAL_WITH_FALLBACK(param, PoolingParameter,

1296

stride_h, stride, unsigned int, notFound);

1297

1298

if ((stride_h == notFound || stride_w == notFound) && param.has_global_pooling())

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1299

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1300

stride_h = 1;

1301

stride_w = 1;

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1302

}

1303

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1304

unsigned int pad_h = GET_OPTIONAL_WITH_FALLBACK(param, PoolingParameter,

1305

pad_h, pad, unsigned int, 0u);

1306

unsigned int pad_w = GET_OPTIONAL_WITH_FALLBACK(param, PoolingParameter,

1307

pad_w, pad, unsigned int, 0u);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1308

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1309

// Populate Weight and Bias Filter Descriptor

1310

Pooling2dDescriptor pooling2dDescriptor;

1311

if (param.has_pool())

1312

{

1313

PoolingParameter_PoolMethod p = param.pool();

1314

switch (p)

1315

{

1316

case PoolingParameter_PoolMethod_MAX:

1317

{

1318

pooling2dDescriptor.m_PoolType = PoolingAlgorithm::Max;

1319

break;

1320

}

1321

case PoolingParameter_PoolMethod_AVE:

1322

{

1323

pooling2dDescriptor.m_PoolType = PoolingAlgorithm::Average;

1324

break;

1325

}

1326

case PoolingParameter_PoolMethod_STOCHASTIC:

1327

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1328

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1329

fmt::format("Pooling Layer: Stochastic Pooling Not Supported. Layer={} {}",

1330

layerParam.name(),

1331

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1332

}

1333

default:

1334

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1335

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1336

fmt::format("Pooling Layer: unknown pooling method: {} for layer: {} {}",

1337

p,

1338

layerParam.name(),

1339

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

}

}

}

else

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1345

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1346

fmt::format("No Pooling Method Defined for {} {}",

1347

layerParam.name(),

1348

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1349

}

1350

1351

pooling2dDescriptor.m_PadLeft = pad_w;

1352

pooling2dDescriptor.m_PadRight = pad_w;

1353

pooling2dDescriptor.m_PadTop = pad_h;

1354

pooling2dDescriptor.m_PadBottom = pad_h;

1355

pooling2dDescriptor.m_StrideX = stride_w;

1356

pooling2dDescriptor.m_StrideY = stride_h;

1357

pooling2dDescriptor.m_PoolWidth = kernel_w;

1358

pooling2dDescriptor.m_PoolHeight = kernel_h;

1359

1360

pooling2dDescriptor.m_OutputShapeRounding = OutputShapeRounding::Ceiling;

1361

pooling2dDescriptor.m_PaddingMethod = PaddingMethod::IgnoreValue;

1362

1363

armnn::IConnectableLayer* poolingLayer = m_Network->AddPooling2dLayer(pooling2dDescriptor,

1364

layerParam.name().c_str());

1365

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1366

TensorInfo outputInfo(

1367

{ inputInfo.GetShape()[0],

1368

inputInfo.GetShape()[1],

1369

static_cast<unsigned int>(ceil(

1370

static_cast<float>(inputInfo.GetShape()[2] + 2 * pad_h - kernel_h) /

Matthew Sloyan

24ac859

2020-09-23 16:57:23 +0100

[diff] [blame]

1371

armnn::numeric_cast<float>(stride_h))) + 1,

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1372

static_cast<unsigned int>(ceil(

1373

static_cast<float>(inputInfo.GetShape()[3] + 2 * pad_w - kernel_w) /

Matthew Sloyan

24ac859

2020-09-23 16:57:23 +0100

[diff] [blame]

1374

armnn::numeric_cast<float>(stride_w))) + 1 },

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1375

DataType::Float32);

1376

1377

GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).Connect(poolingLayer->GetInputSlot(0));

1378

poolingLayer->GetOutputSlot(0).SetTensorInfo(outputInfo);

1379

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), poolingLayer->GetOutputSlot(0));

1380

}

1381

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1382

void ICaffeParser::CaffeParserImpl::ParseArgmaxLayer(const LayerParameter& layerParam)

Keith Mok

9801b17

2020-12-20 19:47:25 -0800

[diff] [blame]

1383

{

1384

ValidateNumInputsOutputs(layerParam, 1, 1);

1385

ArgMaxParameter param = layerParam.argmax_param();

1386

1387

BlobShape inputShape = TensorDescToBlobShape(GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).GetTensorInfo());

1388

1389

const unsigned int topK = param.has_top_k() ? param.top_k() : 1;

1390

if (topK != 1) {

1391

throw ParseException(

1392

fmt::format("ArgMaxLayer: Only support top_k equals to 1. Layer={} {}",

1393

layerParam.name(),

1394

CHECK_LOCATION().AsString()));

1395

}

1396

1397

const unsigned int outMaxVal = param.has_out_max_val() ? param.out_max_val() : false;

1398

if (outMaxVal) {

1399

throw ParseException(

1400

fmt::format("ArgMaxLayer: Does not support out_max_val. Layer={} {}",

1401

layerParam.name(),

1402

CHECK_LOCATION().AsString()));

1403

}

1404

1405

int axis = param.has_axis() ? param.axis() : 1;

1406

if (axis < 0) {

1407

axis = inputShape.dim_size() - axis;

1408

}

1409

if ((axis < 0) || (axis >= inputShape.dim_size())) {

1410

throw ParseException(

1411

fmt::format("ArgMaxLayer: Invalid axis value which outside range of input dims. "

1412

"{}'s input has input dim_size {}, requested axis: {}. {}",

1413

layerParam.name(),

1414

inputShape.dim_size(),

1415

axis,

1416

CHECK_LOCATION().AsString()));

1417

}

1418

1419

ArgMinMaxDescriptor desc;

1420

desc.m_Axis = axis;

1421

desc.m_Output_Type = armnn::DataType::Signed32;

1422

desc.m_Function = ArgMinMaxFunction::Max;

1423

1424

armnn::IConnectableLayer* argmaxLayer = m_Network->AddArgMinMaxLayer(desc,

1425

layerParam.name().c_str());

1426

1427

TensorShape outputShape(static_cast<unsigned int>(inputShape.dim_size() - 1));

1428

int j = 0;

1429

// remove the flatten axis

1430

for (int i = 0; i < inputShape.dim_size(); ++i)

1431

{

1432

if (i == axis) continue;

1433

outputShape[static_cast<unsigned int>(j++)] = static_cast<unsigned int>(inputShape.dim(i));

1434

}

1435

TensorInfo outputInfo(outputShape, DataType::Signed32);

1436

1437

GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).Connect(argmaxLayer->GetInputSlot(0));

1438

argmaxLayer->GetOutputSlot(0).SetTensorInfo(outputInfo);

1439

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), argmaxLayer->GetOutputSlot(0));

1440

}

1441

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1442

void ICaffeParser::CaffeParserImpl::ParseReluLayer(const LayerParameter& layerParam)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1443

{

1444

ValidateNumInputsOutputs(layerParam, 1, 1);

1445

1446

const string& name = layerParam.name();

1447

const ReLUParameter& param = layerParam.relu_param();

1448

1449

ActivationDescriptor activationDescriptor;

1450

const float negativeSlope = param.negative_slope();

1451

if (negativeSlope == 0.0f)

1452

{

1453

activationDescriptor.m_Function = ActivationFunction::ReLu;

}

else

{

activationDescriptor.m_Function = ActivationFunction::LeakyReLu;

1458

activationDescriptor.m_A = negativeSlope;

1459

}

1460

1461

const TensorInfo& inputInfo = GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).GetTensorInfo();

1462

IConnectableLayer* const activationLayer = m_Network->AddActivationLayer(activationDescriptor, name.c_str());

1463

GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).Connect(activationLayer->GetInputSlot(0));

1464

activationLayer->GetOutputSlot(0).SetTensorInfo(inputInfo);

1465

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), activationLayer->GetOutputSlot(0));

1466

}

1467

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1468

void ICaffeParser::CaffeParserImpl::ParseLRNLayer(const LayerParameter& layerParam)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1469

{

1470

ValidateNumInputsOutputs(layerParam, 1, 1);

1471

1472

LRNParameter param = layerParam.lrn_param();

1473

1474

const TensorInfo& inputInfo = GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).GetTensorInfo();

1475

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1476

// Ignored BATCH NORMALIZATION Caffe Parameters.

1477

// Ignored MVN Caffe Parameters.

1478

// Ignored LRN Caffe Parameters.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1479

// Engine

1480

1481

NormalizationDescriptor normalizationDescriptor;

1482

if (param.has_norm_region())

1483

{

1484

LRNParameter_NormRegion n = param.norm_region();

1485

switch (n)

1486

{

1487

case LRNParameter_NormRegion_ACROSS_CHANNELS:

1488

{

1489

normalizationDescriptor.m_NormChannelType = NormalizationAlgorithmChannel::Across;

1490

break;

1491

}

1492

case LRNParameter_NormRegion_WITHIN_CHANNEL:

1493

{

1494

normalizationDescriptor.m_NormChannelType = NormalizationAlgorithmChannel::Within;

1495

break;

1496

}

1497

default:

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1498

{

1499

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1500

fmt::format("Unknown region {} for LRN layer {} {}",

1501

n,

1502

layerParam.name(),

1503

CHECK_LOCATION().AsString()));

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1504

}

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

}

}

else

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1509

// Caffe defaults to normalization across channels.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1510

normalizationDescriptor.m_NormChannelType = NormalizationAlgorithmChannel::Across;

1511

}

1512

1513

normalizationDescriptor.m_NormMethodType = NormalizationAlgorithmMethod::LocalBrightness;

1514

if (param.has_local_size())

1515

{

1516

normalizationDescriptor.m_NormSize = param.local_size();

1517

}

1518

else

1519

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1520

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1521

fmt::format("local_size not defined for LRN layer {} {}",

1522

layerParam.name(),

1523

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1524

}

1525

1526

if (param.has_alpha())

1527

{

1528

normalizationDescriptor.m_Alpha = param.alpha();

Matthew Sloyan

24ac859

2020-09-23 16:57:23 +0100

[diff] [blame]

1529

normalizationDescriptor.m_Alpha /= armnn::numeric_cast<float>(param.local_size());

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1530

}

1531

else

1532

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1533

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1534

fmt::format("Alpha not defined for LRN layer {} {}",

1535

layerParam.name(),

1536

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1537

}

1538

if (param.has_beta())

1539

{

1540

normalizationDescriptor.m_Beta = param.beta();

1541

}

1542

else

1543

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1544

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1545

fmt::format("Beta not defined for LRN layer {} {}",

1546

layerParam.name(),

1547

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1548

}

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1549

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1550

if (param.has_k())

1551

{

1552

normalizationDescriptor.m_K = param.k();

1553

}

1554

else

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1555

{

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1556

normalizationDescriptor.m_K = 1;

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1557

}

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1558

1559

IConnectableLayer* const normLayer = m_Network->AddNormalizationLayer(normalizationDescriptor,

1560

layerParam.name().c_str());

1561

GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).Connect(normLayer->GetInputSlot(0));

1562

normLayer->GetOutputSlot(0).SetTensorInfo(inputInfo);

1563

1564

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), normLayer->GetOutputSlot(0));

1565

}

1566

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1567

void ICaffeParser::CaffeParserImpl::ParseInnerProductLayer(const LayerParameter& layerParam)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1568

{

1569

InnerProductParameter param = layerParam.inner_product_param();

1570

1571

ValidateNumInputsOutputs(layerParam, 1, 1);

1572

1573

unsigned int outputSize = param.num_output();

1574

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1575

// Ignored Caffe Parameters:

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

// Weight Filler

// Bias Filler

// Engine

// Axis

FullyConnectedDescriptor tensorFullyConnectedDescriptor;

1582

1583

if (param.has_transpose())

1584

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1585

// If true, assumes transposed weights.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1586

tensorFullyConnectedDescriptor.m_TransposeWeightMatrix = param.transpose();

1587

}

1588

else

1589

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1590

// Caffe defaults to transposed.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1591

tensorFullyConnectedDescriptor.m_TransposeWeightMatrix = true;

1592

}

1593

1594

const TensorInfo& inputInfo = GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).GetTensorInfo();

1595

1596

TensorInfo weightInfo;

1597

TensorInfo biasInfo;

1598

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1599

// Allows implicit flattening of extra dimensions.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1600

unsigned int inputSize = inputInfo.GetShape()[1];

1601

for (unsigned int i = 2; i < inputInfo.GetNumDimensions(); ++i)

1602

{

1603

inputSize *= inputInfo.GetShape()[i];

1604

}

1605

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1606

const float* weightDataPtr = GetArrayPtrFromBlob(layerParam, 0);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1607

const unsigned int swTD[2] = { outputSize, inputSize };

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1608

ConstTensor weights(TensorInfo(2, swTD, DataType::Float32), weightDataPtr);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1609

1610

tensorFullyConnectedDescriptor.m_BiasEnabled = true;

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1611

// Todo: check whether bias enabled.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1612

armnn::IConnectableLayer* fullyConnectedLayer = nullptr;

1613

if (tensorFullyConnectedDescriptor.m_BiasEnabled)

1614

{

1615

// BIAS VALUE

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1616

const float* biasDataPtr = GetArrayPtrFromBlob(layerParam, 1);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1617

1618

const unsigned int sbTD[1] = { outputSize };

1619

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1620

ConstTensor biases(TensorInfo(1, sbTD, DataType::Float32), biasDataPtr);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1621

Matteo Martincigh

2019-05-14 10:36:13 +0100

[diff] [blame]

1622

fullyConnectedLayer = m_Network->AddFullyConnectedLayer(tensorFullyConnectedDescriptor,

1623

weights,

1624

Optional<ConstTensor>(biases),

1625

layerParam.name().c_str());

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1626

}

1627

else

1628

{

Matteo Martincigh

2019-05-14 10:36:13 +0100

[diff] [blame]

1629

fullyConnectedLayer = m_Network->AddFullyConnectedLayer(tensorFullyConnectedDescriptor,

1630

weights,

1631

EmptyOptional(),

1632

layerParam.name().c_str());

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1633

}

1634

1635

TensorInfo outputInfo({ inputInfo.GetShape()[0], outputSize }, DataType::Float32);

1636

GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).Connect(fullyConnectedLayer->GetInputSlot(0));

1637

fullyConnectedLayer->GetOutputSlot(0).SetTensorInfo(outputInfo);

1638

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), fullyConnectedLayer->GetOutputSlot(0));

1639

}

1640

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1641

void ICaffeParser::CaffeParserImpl::ParseSoftmaxLayer(const LayerParameter& layerParam)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1642

{

1643

ValidateNumInputsOutputs(layerParam, 1, 1);

1644

1645

SoftmaxParameter param = layerParam.softmax_param();

1646

1647

const TensorInfo& inputInfo = GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).GetTensorInfo();

1648

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1649

// Ignored Caffe Parameters:

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

// axis

// Engine

armnn::SoftmaxDescriptor softmaxDescriptor;

Teresa Charlin

4320c92

2020-08-12 16:04:41 +0100

[diff] [blame]

1654

softmaxDescriptor.m_Axis = 1;

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1655

armnn::IConnectableLayer* const softmaxLayer = m_Network->AddSoftmaxLayer(

1656

softmaxDescriptor,

1657

layerParam.name().c_str());

1658

GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).Connect(softmaxLayer->GetInputSlot(0));

1659

softmaxLayer->GetOutputSlot(0).SetTensorInfo(inputInfo);

1660

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), softmaxLayer->GetOutputSlot(0));

1661

}

1662

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1663

void ICaffeParser::CaffeParserImpl::ParseEltwiseLayer(const LayerParameter& layerParam)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1664

{

1665

ValidateNumInputsOutputs(layerParam, 2, 1);

1666

1667

const TensorInfo& inputInfo = GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).GetTensorInfo();

1668

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1669

// Ignored Caffe Parameters:

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1670

// coeff

1671

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1672

EltwiseParameter_EltwiseOp operation = EltwiseParameter_EltwiseOp_SUM; // Defaults to sum as per caffe.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1673

1674

if (layerParam.has_eltwise_param() && layerParam.eltwise_param().has_operation())

1675

{

1676

operation = layerParam.eltwise_param().operation();

1677

}

1678

1679

armnn::IConnectableLayer* newLayer = nullptr;

1680

switch (operation)

1681

{

1682

case EltwiseParameter_EltwiseOp_SUM:

1683

{

1684

newLayer = m_Network->AddAdditionLayer(layerParam.name().c_str());

1685

break;

1686

}

1687

case EltwiseParameter_EltwiseOp_PROD:

1688

{

1689

newLayer = m_Network->AddMultiplicationLayer(layerParam.name().c_str());

break;

}

default:

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1694

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1695

fmt::format("Unsupported operation {} in Eltwise layer {} {}",

1696

operation,

1697

layerParam.name(),

1698

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

}

}

GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).Connect(newLayer->GetInputSlot(0));

1703

GetArmnnOutputSlotForCaffeTop(layerParam.bottom(1)).Connect(newLayer->GetInputSlot(1));

1704

newLayer->GetOutputSlot(0).SetTensorInfo(inputInfo);

1705

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), newLayer->GetOutputSlot(0));

1706

}

1707

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1708

void ICaffeParser::CaffeParserImpl::ParseConcatLayer(const LayerParameter& layerParam)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1709

{

1710

unsigned int numInputs = static_cast<unsigned int>(layerParam.bottom_size());

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1711

// We assume concat happens along the channel dimension, which is 1 in (0, 1, 2, 3).

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1712

unsigned int concatDim = 1;

1713

unsigned int numOfDims = 4;

1714

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1715

// we only consider 4-D tensor here

1716

OriginsDescriptor concatDescriptor(static_cast<uint32_t>(numInputs), numOfDims);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1717

std::vector<unsigned int>mergeDimSizes(numOfDims, 0u);

1718

1719

unsigned int mergeDim = 0;

1720

for (unsigned int viewIndex = 0; viewIndex < numInputs; ++viewIndex)

1721

{

1722

const TensorInfo& inputInfo = GetArmnnOutputSlotForCaffeTop(

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

1723

layerParam.bottom(armnn::numeric_cast<int>(viewIndex))).GetTensorInfo();

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1724

// Checks whether the dimensions of the input tensors are actually 4.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1725

if (inputInfo.GetNumDimensions()!=4)

1726

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1727

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1728

fmt::format("The number of dimensions for input tensors of "

1729

"the concatenation op should be 4. Inputs of {} has "

1730

"{} dimensions. {}",

1731

layerParam.name(),

1732

inputInfo.GetNumDimensions(),

1733

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1734

}

1735

1736

mergeDimSizes[0] = inputInfo.GetShape()[0];

1737

mergeDimSizes[1] = inputInfo.GetShape()[1];

1738

mergeDimSizes[2] = inputInfo.GetShape()[2];

1739

mergeDimSizes[3] = inputInfo.GetShape()[3];

1740

1741

for (unsigned int j = 0; j < concatDim; ++j)

1742

{

1743

concatDescriptor.SetViewOriginCoord(viewIndex, j, 0);

1744

}

1745

1746

concatDescriptor.SetViewOriginCoord(viewIndex, concatDim, mergeDim);

1747

mergeDim += mergeDimSizes[concatDim];

1748

1749

for (unsigned int j = concatDim+1; j < numOfDims; ++j)

1750

{

1751

concatDescriptor.SetViewOriginCoord(viewIndex, j, 0);

1752

}

1753

}

1754

mergeDimSizes[concatDim] = mergeDim;

1755

Jim Flynn

906f946

2019-05-10 13:55:21 +0100

[diff] [blame]

1756

armnn::IConnectableLayer* concatlayer = m_Network->AddConcatLayer(concatDescriptor, layerParam.name().c_str());

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1757

for (unsigned int i = 0; i < numInputs; ++i)

1758

{

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

1759

armnn::IOutputSlot& outputSlot = GetArmnnOutputSlotForCaffeTop(layerParam.bottom(armnn::numeric_cast<int>(i)));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1760

outputSlot.Connect(concatlayer->GetInputSlot(i));

1761

}

1762

1763

concatlayer->GetOutputSlot(0).SetTensorInfo(armnn::TensorInfo(numOfDims, mergeDimSizes.data(), DataType::Float32));

1764

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), concatlayer->GetOutputSlot(0));

1765

}

1766

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1767

void ICaffeParser::CaffeParserImpl::ParseBatchNormLayer(const LayerParameter& layerParam)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1768

{

1769

ValidateNumInputsOutputs(layerParam, 1, 1);

1770

1771

const TensorInfo& inputInfo = GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).GetTensorInfo();

1772

1773

string name = layerParam.name();

1774

1775

BatchNormParameter param = layerParam.batch_norm_param();

1776

// If use_global_stats is not explicitly set in the model, assume it to be true (its default value

1777

// when the network is in the testing phase).

1778

if (param.has_use_global_stats())

1779

{

1780

if (!param.use_global_stats())

1781

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1782

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1783

fmt::format("Error parsing Batch Norm layer '{}': "

1784

"Parameter 'use_global_stats' is set to false, which is "

1785

"unsupported (value used for training). {}",

1786

name,

1787

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

}

}

BatchNormalizationDescriptor desc;

1792

desc.m_Eps = param.eps();

1793

1794

unsigned int channels = inputInfo.GetShape()[1];

1795

unsigned int shape[] = {channels};

1796

1797

vector<float> meanData(channels);

1798

GetDataFromBlob(layerParam, meanData, 0);

1799

1800

vector<float> varianceData(channels);

1801

GetDataFromBlob(layerParam, varianceData, 1);

1802

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1803

// Reads moving average factor and applies scaling (if required).

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

1804

const BlobProto& blob = layerParam.blobs(armnn::numeric_cast<int>(2));

1805

const float movingAverageFactor = blob.data(armnn::numeric_cast<int>(0));

surmeh01

3537c2c

2018-05-18 16:31:43 +0100

[diff] [blame]

1806

if(movingAverageFactor != 0.0f)

1807

{

1808

const float scaleFactor = 1.0f / movingAverageFactor;

1809

auto scaleFunction = [scaleFactor](float f) -> float { return f * scaleFactor; };

1810

1811

std::transform(varianceData.begin(), varianceData.end(), varianceData.begin(), scaleFunction);

1812

std::transform(meanData.begin(), meanData.end(), meanData.begin(), scaleFunction);

1813

}

1814

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1815

// Identifies scale operation.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1816

vector<float> betaData(channels, 0.0f);

1817

vector<float> gammaData(channels, 1.0f);

1818

1819

ConstTensor mean(TensorInfo(1, shape, armnn::DataType::Float32), meanData);

1820

ConstTensor variance(TensorInfo(1, shape, armnn::DataType::Float32), varianceData);

1821

ConstTensor beta(TensorInfo(1, shape, armnn::DataType::Float32), betaData);

1822

ConstTensor gamma(TensorInfo(1, shape, armnn::DataType::Float32), gammaData);

1823

1824

armnn::IConnectableLayer* const batchNormLayer = m_Network->AddBatchNormalizationLayer(desc,

1825

mean, variance, beta, gamma, name.c_str());

1826

GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).Connect(batchNormLayer->GetInputSlot(0));

1827

batchNormLayer->GetOutputSlot(0).SetTensorInfo(inputInfo);

1828

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), batchNormLayer->GetOutputSlot(0));

1829

}

1830

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1831

void ICaffeParser::CaffeParserImpl::ParseScaleLayer(const LayerParameter& layerParam)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1832

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1833

// Current unoptimal solution: add a batchnormalization layer with 0 mean and 1 variance.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1834

ValidateNumInputsOutputs(layerParam, 1, 1);

1835

1836

const TensorInfo& inputInfo = GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).GetTensorInfo();

1837

1838

string name = layerParam.name();

1839

1840

ScaleParameter param = layerParam.scale_param();

1841

if (param.axis() != 1)

1842

{

1843

// Would have to use something other than BatchNormalizationLayer in this case

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1844

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1845

fmt::format("Loading Scale Layer: Only axis 1 is supported currently. "

1846

"Layer={} Axis={} {}",

1847

layerParam.name(),

1848

param.axis(),

1849

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1850

}

1851

1852

unsigned int channels = inputInfo.GetShape()[1];

1853

unsigned int shape[] = {channels};

1854

1855

BatchNormalizationDescriptor desc;

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1856

desc.m_Eps = 0.0f; // Don't need epsilon if variance is 1.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1857

vector<float> meanData(channels, 0.0f);

1858

vector<float> varianceData(channels, 1.0f);

1859

vector<float> betaData(channels, 0.0f);

1860

vector<float> gammaData(channels);

1861

1862

GetDataFromBlob(layerParam, gammaData, 0);

1863

1864

if(param.has_bias_term())

1865

{

1866

GetDataFromBlob(layerParam, betaData, 1);

1867

}

1868

1869

ConstTensor mean(TensorInfo(1, shape, armnn::DataType::Float32), meanData);

1870

ConstTensor variance(TensorInfo(1, shape, armnn::DataType::Float32), varianceData);

1871

ConstTensor beta(TensorInfo(1, shape, armnn::DataType::Float32), betaData);

1872

ConstTensor gamma(TensorInfo(1, shape, armnn::DataType::Float32), gammaData);

1873

1874

armnn::IConnectableLayer* const batchNormLayer = m_Network->AddBatchNormalizationLayer(desc,

1875

mean, variance, beta, gamma, name.c_str());

1876

GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)).Connect(batchNormLayer->GetInputSlot(0));

1877

batchNormLayer->GetOutputSlot(0).SetTensorInfo(inputInfo);

1878

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), batchNormLayer->GetOutputSlot(0));

1879

}

1880

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1881

void ICaffeParser::CaffeParserImpl::ParseSplitLayer(const caffe::LayerParameter& layerParam)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1882

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1883

// Used in caffe to duplicate memory - not necessary in armnn.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1884

if (layerParam.bottom_size() != 1)

1885

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1886

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1887

fmt::format("Split layer '{}' should have exactly 1 bottom. "

1888

"#bottoms={} {}",

1889

layerParam.name(),

1890

layerParam.bottom_size(),

1891

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1892

}

1893

armnn::IOutputSlot& outputSlot = GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0));

1894

for (int i = 0; i < layerParam.top_size(); i++)

1895

{

1896

SetArmnnOutputSlotForCaffeTop(layerParam.top(i), outputSlot);

}

}

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1900

void ICaffeParser::CaffeParserImpl::ParseDropoutLayer(const caffe::LayerParameter& layerParam)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1901

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1902

// Ignored for inference, so patch the single input to its single output.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1903

if (layerParam.bottom_size() != 1 || layerParam.top_size() != 1)

1904

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1905

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1906

fmt::format("Dropout layer '{}' should have exactly 1 bottom and 1 top. "

1907

"#bottoms={} #tops={} {}",

1908

layerParam.name(),

1909

layerParam.bottom_size(),

1910

layerParam.top_size(),

1911

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1912

}

1913

SetArmnnOutputSlotForCaffeTop(layerParam.top(0), GetArmnnOutputSlotForCaffeTop(layerParam.bottom(0)));

1914

}

1915

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1916

void ICaffeParser::CaffeParserImpl::TrackInputBinding(armnn::IConnectableLayer* layer,

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1917

armnn::LayerBindingId id,

1918

const armnn::TensorInfo& tensorInfo)

1919

{

1920

return TrackBindingPoint(layer, id, tensorInfo, layer->GetName(), m_NetworkInputsBindingInfo);

1921

}

1922

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1923

void ICaffeParser::CaffeParserImpl::TrackOutputBinding(armnn::IConnectableLayer* layer,

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1924

armnn::LayerBindingId id,

1925

const armnn::TensorInfo& tensorInfo)

1926

{

1927

return TrackBindingPoint(layer, id, tensorInfo, layer->GetName(), m_NetworkOutputsBindingInfo);

1928

}

1929

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1930

void ICaffeParser::CaffeParserImpl::TrackBindingPoint(armnn::IConnectableLayer* layer,

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1931

armnn::LayerBindingId id,

1932

const armnn::TensorInfo& tensorInfo,

1933

const char* bindingPointDesc,

1934

std::unordered_map<std::string, BindingPointInfo>& nameToBindingInfo)

1935

{

1936

const std::string layerName = layer->GetName();

1937

auto it = nameToBindingInfo.find(layerName);

1938

if (it == nameToBindingInfo.end())

1939

{

1940

nameToBindingInfo[layerName] = std::make_pair(id, tensorInfo);

1941

}

1942

else

1943

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1944

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1945

fmt::format("Id {} used by more than one {} layer {}",

1946

id,

1947

bindingPointDesc,

1948

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

}

}

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1952

armnn::IOutputSlot& ICaffeParser::CaffeParserImpl::GetArmnnOutputSlotForCaffeTop(const std::string& caffeTopName) const

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1953

{

1954

auto it = m_ArmnnOutputSlotForCaffeTop.find(caffeTopName);

1955

if (it != m_ArmnnOutputSlotForCaffeTop.end())

{

return *it->second;

}

else

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1961

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1962

fmt::format("Could not find armnn output slot for Caffe top '{}' {}",

1963

caffeTopName,

1964

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

}

}

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1968

void ICaffeParser::CaffeParserImpl::SetArmnnOutputSlotForCaffeTop(

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1969

const std::string& caffeTopName, armnn::IOutputSlot& armnnOutputSlot)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1970

{

1971

auto it = m_ArmnnOutputSlotForCaffeTop.find(caffeTopName);

1972

if (it == m_ArmnnOutputSlotForCaffeTop.end())

1973

{

1974

m_ArmnnOutputSlotForCaffeTop[caffeTopName] = &armnnOutputSlot;

1975

}

1976

else

1977

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1978

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

1979

fmt::format("Attempting to add duplicate entry for Caffe top '{}' {}",

1980

caffeTopName,

1981

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

}

}

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1985

// Note: can move to CaffeParser when/if we optimise the text/string format

1986

// to load on a layer by layer basis

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

1987

void ICaffeParser::CaffeParserImpl::ResolveInPlaceLayers(caffe::NetParameter& netParameter)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1988

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1989

// Finds layers with the same top.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1990

std::map<std::string, std::vector<caffe::LayerParameter*>> layersByTop;

1991

for (int layerIdx = 0; layerIdx < netParameter.layer_size(); ++layerIdx)

1992

{

1993

caffe::LayerParameter& layer = *netParameter.mutable_layer(layerIdx);

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

1994

std::string name = layer.name();

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

1995

for (int i = 0; i < layer.top_size(); ++i)

1996

{

1997

layersByTop[layer.top(i)].push_back(&layer);

}

}

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2001

// For each set of layers with the same top, resolves them to a linear chain rather than in-place layers.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2002

// Note that for 'regular' layers, there will be a single layer in each group and so this will be a no-op.

2003

for (auto layersWithSameTopIt : layersByTop)

2004

{

2005

const std::string& top = layersWithSameTopIt.first;

2006

const std::vector<caffe::LayerParameter*>& layersWithSameTop = layersWithSameTopIt.second;

2007

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2008

// Chains the layers together in the order that they are listed in the prototxt (hopefully this is correct).

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2009

// Note that the last layer will not have its top modified so that other layers will continue to reference it.

2010

for (unsigned int layerIdx = 0; layerIdx < layersWithSameTop.size() - 1; ++layerIdx)

2011

{

2012

caffe::LayerParameter& layer1 = *layersWithSameTop[layerIdx];

2013

caffe::LayerParameter& layer2 = *layersWithSameTop[layerIdx+1];

2014

if (layer1.top_size() != 1)

2015

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2016

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

2017

fmt::format("Node '{}' is an in-place layer but doesn't have exactly one "

2018

"top. It has {} instead. {}",

2019

layer1.name(),

2020

layer1.top_size(),

2021

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2022

}

2023

std::string newTop = layer1.name() + "_top";

2024

layer1.set_top(0, newTop);

2025

if (layer2.bottom_size() != 1 || layer2.bottom(0) != top)

2026

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2027

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

2028

fmt::format("Node '{}' is an in-place layer but "

2029

"doesn't have exactly one bottom, or it doesn't match its top. "

2030

"#bottoms={}, first bottom is {}, top is {} {}",

layer2.name(),

layer2.bottom(0),

top,

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2035

}

2036

layer2.set_bottom(0, newTop);

}

}

}

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2041

// Note: can move to CaffeParser when/if we optimise the text/string format

2042

// to load on a layer by layer basis

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

2043

void ICaffeParser::CaffeParserImpl::LoadNetParam(NetParameter& netParameter)

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2044

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2045

// Caffe models sometimes have an implicit input layer.

2046

// In that case, add an explicit one.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2047

if (netParameter.input_size() > 0)

2048

{

2049

LayerParameter* newLayer = netParameter.add_layer();

2050

2051

newLayer->set_type("Input");

2052

newLayer->set_name(netParameter.input(0));

2053

newLayer->add_top(netParameter.input(0));

2054

2055

InputParameter* inputParam = newLayer->mutable_input_param();

2056

BlobShape* shape = inputParam->add_shape();

2057

2058

int dim_size = netParameter.input_dim_size();

2059

for (int i = 0; i < dim_size; ++i)

2060

{

2061

shape->add_dim(netParameter.input_dim(i));

}

}

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2065

// Replaces in-place layers with regular ones to make the rest of the parsing easier.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2066

ResolveInPlaceLayers(netParameter);

2067

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2068

// Creates a lookup of Caffe layers by name.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2069

for (int i = 0; i < netParameter.layer_size(); ++i)

2070

{

2071

const caffe::LayerParameter& layer = netParameter.layer(i);

2072

for (int i = 0; i < layer.top_size(); ++i)

2073

{

2074

m_CaffeLayersByTopName[layer.top(i)] = &layer;

}

}

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2078

// Finds the output layers the user requested.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2079

std::vector<const caffe::LayerParameter*> targetLayers;

2080

for (const std::string& requestedOutputName : m_RequestedOutputs)

2081

{

2082

auto nodeIt = m_CaffeLayersByTopName.find(requestedOutputName);

2083

if (nodeIt == m_CaffeLayersByTopName.end())

2084

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2085

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

2086

fmt::format("Couldn't find requested output layer '{}' in graph {}",

2087

requestedOutputName,

2088

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2089

}

2090

targetLayers.push_back(nodeIt->second);

2091

}

2092

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2093

// Sorts them into a linear ordering such that all inputs of a node are before the node itself.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2094

std::vector<const caffe::LayerParameter*> sortedNodes;

2095

if (!armnnUtils::GraphTopologicalSort<const caffe::LayerParameter*>(

2096

targetLayers,

2097

[this](const caffe::LayerParameter* node)

2098

{

2099

return GetInputs(*node);

2100

},

2101

sortedNodes))

2102

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2103

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

2104

fmt::format("Cycle detected in graph. #nodes: {} {}",

2105

sortedNodes.size(),

2106

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2107

}

2108

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2109

// Parses each node in order, knowing that all inputs of a node will be processed before the node itself.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2110

for (const caffe::LayerParameter* current : sortedNodes)

2111

{

2112

auto it = ms_CaffeLayerNameToParsingFunctions.find(current->type());

2113

if (it == ms_CaffeLayerNameToParsingFunctions.end())

2114

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2115

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

2116

fmt::format("Unsupported layer type: '{}' for layer {} {}",

2117

current->type(),

2118

current->name(),

2119

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2120

}

2121

auto func = it->second;

2122

(this->*func)(*current);

2123

}

2124

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2125

// Adds ArmNN output layers connected to each requested output.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2126

for (const std::string& requestedOutput : m_RequestedOutputs)

2127

{

2128

armnn::IOutputSlot& outputSlot = GetArmnnOutputSlotForCaffeTop(requestedOutput);

2129

Matthew Sloyan

2020-09-11 16:17:48 +0100

[diff] [blame]

2130

const armnn::LayerBindingId outputId = armnn::numeric_cast<armnn::LayerBindingId>(

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2131

m_NetworkOutputsBindingInfo.size());

2132

armnn::IConnectableLayer* const outputLayer = m_Network->AddOutputLayer(outputId, requestedOutput.c_str());

2133

outputSlot.Connect(outputLayer->GetInputSlot(0));

2134

2135

TrackOutputBinding(outputLayer, outputId, outputLayer->GetInputSlot(0).GetConnection()->GetTensorInfo());

}

}

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

2139

INetworkPtr ICaffeParser::CaffeParserImpl::CreateNetworkFromTextFile(const char* graphFile,

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2140

const std::map<std::string, armnn::TensorShape>& inputShapes,

2141

const std::vector<std::string>& requestedOutputs)

2142

{

2143

FILE* fd = fopen(graphFile, "r");

2144

2145

if (fd == nullptr)

2146

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2147

throw FileNotFoundException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

2148

fmt::format("Failed to open graph file: {} {}",

2149

graphFile,

2150

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2151

}

2152

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2153

// Parses the file into a message.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2154

NetParameter netParam;

2155

auto input = new google::protobuf::io::FileInputStream(fileno(fd));

2156

bool success = google::protobuf::TextFormat::Parse(input, &netParam);

delete input;

fclose(fd);

if (!success)

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2162

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

2163

fmt::format("Failed to parse graph file: {} {}",

2164

graphFile,

2165

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2166

}

2167

2168

return CreateNetworkFromNetParameter(netParam, inputShapes, requestedOutputs);

2169

}

2170

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

2171

INetworkPtr ICaffeParser::CaffeParserImpl::CreateNetworkFromString(const char* protoText,

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2172

const std::map<std::string, armnn::TensorShape>& inputShapes,

2173

const std::vector<std::string>& requestedOutputs)

2174

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2175

// Parses the string into a message.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2176

NetParameter netParam;

2177

bool success = google::protobuf::TextFormat::ParseFromString(protoText, &netParam);

2178

2179

if (!success)

2180

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2181

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

2182

fmt::format("Failed to parse graph string {}",

2183

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2184

}

2185

2186

return CreateNetworkFromNetParameter(netParam, inputShapes, requestedOutputs);

2187

}

2188

2189

INetworkPtr CaffeParser::CreateNetworkFromBinaryFile(const char* graphFile,

2190

const std::map<std::string, armnn::TensorShape>& inputShapes,

2191

const std::vector<std::string>& requestedOutputs)

2192

{

2193

FILE* fd = fopen(graphFile, "rb");

2194

2195

if (fd == nullptr)

2196

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2197

throw FileNotFoundException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

2198

fmt::format("Failed to open graph file at: {} {}",

2199

graphFile,

2200

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2201

}

2202

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2203

// Parses the file into a message.

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2204

NetParameter netParam;

2205

2206

FileInputStream inStream(fileno(fd));

2207

CodedInputStream codedStream(&inStream);

Nikhil Raj

e518153

2020-10-09 14:52:25 +0100

[diff] [blame]

2208

codedStream.SetTotalBytesLimit(INT_MAX);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2209

bool success = netParam.ParseFromCodedStream(&codedStream);

fclose(fd);

if (!success)

{

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2214

throw ParseException(

James Ward

2020-09-11 17:32:44 +0100

[diff] [blame]

2215

fmt::format("Failed to parse protobuf file: {} {}",

2216

graphFile,

2217

CHECK_LOCATION().AsString()));

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2218

}

2219

2220

return CreateNetworkFromNetParameter(netParam, inputShapes, requestedOutputs);

2221

}

2222

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2223

// Note: can move to CaffeParser when/if we optimise the text/string format

2224

// to load on a layer by layer basis

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

2225

INetworkPtr ICaffeParser::CaffeParserImpl::CreateNetworkFromNetParameter(NetParameter& netParam,

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2226

const std::map<std::string, armnn::TensorShape>& inputShapes,

2227

const std::vector<std::string>& requestedOutputs)

2228

{

2229

m_NetworkInputsBindingInfo.clear();

2230

m_NetworkOutputsBindingInfo.clear();

2231

2232

m_Network = INetwork::Create();

2233

2234

m_InputShapes = inputShapes;

2235

if (requestedOutputs.size() == 0)

2236

{

2237

throw ParseException("requestedOutputs must have at least one entry");

2238

}

2239

m_RequestedOutputs = requestedOutputs;

try

{

LoadNetParam(netParam);

2244

}

2245

catch (const ParseException& e)

{

Cleanup();

throw e;

}

Cleanup();

return move(m_Network);

2254

}

2255

Matthew Sloyan

ac001ee

2021-02-03 10:43:04 +0000

[diff] [blame]

2256

const std::string ICaffeParser::CaffeParserImpl::GetVersion()

2257

{

2258

return CAFFE_PARSER_VERSION;

2259

}

2260

Kevin May

2021-01-29 14:24:57 +0000

[diff] [blame]

2261

void ICaffeParser::CaffeParserImpl::Cleanup() {

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2262

// cleanup, in case we reuse this parser

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

2263

m_InputShapes.clear();

2264

m_RequestedOutputs.clear();

2265

m_ArmnnOutputSlotForCaffeTop.clear();

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

2266

// NOTE: when we get the text/string format

2267

// optimised for memory then this data structure can

2268

// also move to the CaffeParser class

2269

m_CaffeLayersByTopName.clear();

telsoa01