//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//

#include "HalPolicy.hpp"

#include "Utils.hpp"

#include "../1.0/HalPolicy.hpp"
#include "../1.1/HalPolicy.hpp"

#include <DataLayoutIndexed.hpp>
#include <Half.hpp>

#include <cmath>

namespace armnn_driver
{
namespace hal_1_2
{

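// The NNAPI operation type enumerations are backwards compatible: an operation that already existed in an
// earlier HAL keeps the same numeric value in V1_2::OperationType, so a static_cast is enough to map a V1_2
// operation type onto the corresponding V1_0/V1_1 type when deciding which HalPolicy should handle it.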
bool HandledByV1_0(V1_2::OperationType operationType)
{
    switch (static_cast<V1_0::OperationType>(operationType))
    {
        case V1_0::OperationType::ADD:
        case V1_0::OperationType::DEPTH_TO_SPACE:
        case V1_0::OperationType::DEQUANTIZE:
        case V1_0::OperationType::EMBEDDING_LOOKUP:
        case V1_0::OperationType::FLOOR:
        case V1_0::OperationType::FULLY_CONNECTED:
        case V1_0::OperationType::HASHTABLE_LOOKUP:
        case V1_0::OperationType::L2_NORMALIZATION:
        case V1_0::OperationType::LOCAL_RESPONSE_NORMALIZATION:
        case V1_0::OperationType::LOGISTIC:
        case V1_0::OperationType::LSH_PROJECTION:
        case V1_0::OperationType::MUL:
        case V1_0::OperationType::RESHAPE:
        case V1_0::OperationType::RNN:
        case V1_0::OperationType::SVDF:
        case V1_0::OperationType::OEM_OPERATION:
            return true;
        default:
            return false;
    }
}

bool HandledByV1_1(V1_2::OperationType operationType)
{
    if (HandledByV1_0(operationType))
    {
        return true;
    }
    switch (static_cast<V1_1::OperationType>(operationType))
    {
        case V1_1::OperationType::DIV:
        case V1_1::OperationType::MEAN:
        case V1_1::OperationType::SQUEEZE:
        case V1_1::OperationType::STRIDED_SLICE:
        case V1_1::OperationType::TRANSPOSE:
            return true;
        default:
            return false;
    }
}

bool HandledByV1_0(const V1_2::Operation& operation)
{
    return HandledByV1_0(operation.type);
}

bool HandledByV1_1(const V1_2::Operation& operation)
{
    return HandledByV1_1(operation.type);
}

V1_0::OperationType CastToV1_0(V1_2::OperationType type)
{
    return static_cast<V1_0::OperationType>(type);
}

V1_1::OperationType CastToV1_1(V1_2::OperationType type)
{
    return static_cast<V1_1::OperationType>(type);
}

V1_0::Operation ConvertToV1_0(const V1_2::Operation& operation)
{
    V1_0::Operation op;
    op.type = CastToV1_0(operation.type);
    op.inputs = operation.inputs;
    op.outputs = operation.outputs;
    return op;
}

V1_1::Operation ConvertToV1_1(const V1_2::Operation& operation)
{
    V1_1::Operation op;
    op.type = CastToV1_1(operation.type);
    op.inputs = operation.inputs;
    op.outputs = operation.outputs;
    return op;
}

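// A V1_2 model may contain operations that are fully expressible in an earlier HAL. ConvertOperation first
// tries to downgrade such operations (and the model) to V1_0 or V1_1 and reuse the existing conversion code;
// only operations that need HAL 1.2 semantics are handled by the switch below.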
bool HalPolicy::ConvertOperation(const Operation& operation, const Model& model, ConversionData& data)
{
    if (HandledByV1_0(operation) && compliantWithV1_0(model))
    {
        hal_1_0::HalPolicy::Operation v10Operation = ConvertToV1_0(operation);
        hal_1_0::HalPolicy::Model v10Model = convertToV1_0(model);

        return hal_1_0::HalPolicy::ConvertOperation(v10Operation, v10Model, data);
    }

    if (HandledByV1_1(operation) && compliantWithV1_1(model))
    {
        hal_1_1::HalPolicy::Operation v11Operation = ConvertToV1_1(operation);
        hal_1_1::HalPolicy::Model v11Model = convertToV1_1(model);

        return hal_1_1::HalPolicy::ConvertOperation(v11Operation, v11Model, data);
    }

    switch (operation.type)
    {
        case V1_2::OperationType::AVERAGE_POOL_2D:
            return ConvertAveragePool2d(operation, model, data);
        case V1_2::OperationType::BATCH_TO_SPACE_ND:
            return ConvertBatchToSpaceNd(operation, model, data);
        case V1_2::OperationType::CONCATENATION:
            return ConvertConcatenation(operation, model, data);
        case V1_2::OperationType::CONV_2D:
            return ConvertConv2d(operation, model, data);
        case V1_2::OperationType::DEPTHWISE_CONV_2D:
            return ConvertDepthwiseConv2d(operation, model, data);
        case V1_2::OperationType::L2_POOL_2D:
            return ConvertL2Pool2d(operation, model, data);
        case V1_2::OperationType::MAX_POOL_2D:
            return ConvertMaxPool2d(operation, model, data);
        case V1_2::OperationType::MAXIMUM:
            return ConvertMaximum(operation, model, data);
        case V1_2::OperationType::MINIMUM:
            return ConvertMinimum(operation, model, data);
        case V1_2::OperationType::PAD:
            return ConvertPad(operation, model, data);
        case V1_2::OperationType::PAD_V2:
            return ConvertPadV2(operation, model, data);
        case V1_2::OperationType::PRELU:
            return ConvertPrelu(operation, model, data);
        case V1_2::OperationType::QUANTIZE:
            return ConvertQuantize(operation, model, data);
        case V1_2::OperationType::QUANTIZED_16BIT_LSTM:
            return ConvertQuantizedLstm(operation, model, data);
        case V1_2::OperationType::RELU:
            return ConvertReLu(operation, model, data);
        case V1_2::OperationType::RELU1:
            return ConvertReLu1(operation, model, data);
        case V1_2::OperationType::RELU6:
            return ConvertReLu6(operation, model, data);
        case V1_2::OperationType::RESIZE_BILINEAR:
            return ConvertResize(operation, model, data, armnn::ResizeMethod::Bilinear);
        case V1_2::OperationType::RESIZE_NEAREST_NEIGHBOR:
            return ConvertResize(operation, model, data, armnn::ResizeMethod::NearestNeighbor);
        case V1_2::OperationType::TRANSPOSE_CONV_2D:
            return ConvertTransposeConv2d(operation, model, data);
        case V1_2::OperationType::SOFTMAX:
            return ConvertSoftmax(operation, model, data);
        case V1_2::OperationType::SPACE_TO_BATCH_ND:
            return ConvertSpaceToBatchNd(operation, model, data);
        case V1_2::OperationType::SPACE_TO_DEPTH:
            return ConvertSpaceToDepth(operation, model, data);
        case V1_2::OperationType::SUB:
            return ConvertSub(operation, model, data);
        case V1_2::OperationType::TANH:
            return ConvertTanH(operation, model, data);
        case V1_2::OperationType::LSTM:
            return ConvertLstm(operation, model, data);
        default:
            return Fail("%s: Operation type %s not supported in ArmnnDriver",
                        __func__, toString(operation.type).c_str());
    }
}

bool HalPolicy::ConvertAveragePool2d(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertAveragePool2d()");
    return ConvertPooling2d<hal_1_2::HalPolicy>(operation, __func__, armnn::PoolingAlgorithm::Average, model, data);
}

bool HalPolicy::ConvertBatchToSpaceNd(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertBatchToSpaceNd()");
    return ::ConvertBatchToSpaceNd<hal_1_2::HalPolicy>(operation, model, data);
}

bool HalPolicy::ConvertConcatenation(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertConcatenation()");
    return ::ConvertConcatenation<hal_1_2::HalPolicy>(operation, model, data);
}

bool HalPolicy::ConvertConv2d(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertConv2d()");

    LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
    if (!input.IsValid())
    {
        return Fail("%s: Operation has invalid inputs", __func__);
    }

    const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
    if (!output)
    {
        return Fail("%s: Could not read output 0", __func__);
    }

    const armnn::TensorInfo& inputInfo = input.GetTensorInfo();
    const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

    if (IsDynamicTensor(outputInfo))
    {
        return Fail("%s: Dynamic output tensors are not supported", __func__);
    }

    armnn::Convolution2dDescriptor desc;
    desc.m_DataLayout = armnn::DataLayout::NHWC;

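    // NNAPI CONV_2D has two operand layouts. The implicit form carries 7 required inputs
    // (input, filter, bias, padding scheme, stride_w, stride_h, activation); the explicit form carries 10
    // (input, filter, bias, pad_left, pad_right, pad_top, pad_bottom, stride_w, stride_h, activation).
    // In HAL 1.2 both forms may be followed by an optional BOOL data layout flag and two dilation factors,
    // which is why an 8th input of type BOOL still indicates the implicit form.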
    // Determine whether padding is implicit or explicit
    bool implicitPadding = operation.inputs.size() == 7 ||
                           (operation.inputs.size() >= 8 &&
                            GetInputOperand<hal_1_2::HalPolicy>(operation, 7, model)->type == OperandType::BOOL);

    if (implicitPadding)
    {
        desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 7, model, data);
    }
    else if (operation.inputs.size() >= 10)
    {
        desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 10, model, data);
    }

    const armnn::PermutationVector OHWIToOIHW = {0, 2, 3, 1};

    // ArmNN does not currently support non-fixed weights or bias
    // The NNAPI filter is always OHWI [depth_out, filter_height, filter_width, depth_in] but ArmNN expects the
    // filter's height and width indices to match the input's height and width indices so we permute it to OIHW if
    // the DataLayout is NCHW
    const ConstTensorPin weightsPin = (desc.m_DataLayout == armnn::DataLayout::NCHW) ?
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data, OHWIToOIHW) :
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data);
    const ConstTensorPin biasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 2, model, data);

    if (!weightsPin.IsValid())
    {
        return Fail("%s: Operation has invalid weights", __func__);
    }

    if (!biasPin.IsValid())
    {
        return Fail("%s: Operation has invalid biases", __func__);
    }

    armnn::ConstTensor weights = weightsPin.GetConstTensor();
    armnn::ConstTensor bias = biasPin.GetConstTensor();
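    // NNAPI requires a quantized bias to use scale == input_scale * weights_scale with zero point 0;
    // SanitizeBiasQuantizationScale re-derives the bias scale from the input and weights if the value
    // stored in the model drifts from that product (for example through rounding in the model file).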
    SanitizeBiasQuantizationScale(bias.GetInfo(), weights.GetInfo(), inputInfo);

    ActivationFn activation;

    if (implicitPadding)
    {
        android::nn::PaddingScheme paddingScheme;
        if (!GetInputPaddingScheme<hal_1_2::HalPolicy>(operation, 3, paddingScheme, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_StrideX, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_StrideY, model, data) ||
            !GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 6, activation, model, data) ||
            !GetOptionalConvolutionDilationParams<hal_1_2::HalPolicy>(operation, 8, desc, model, data))
        {
            return Fail("%s: Operation has invalid inputs (implicit padding)", __func__);
        }

        armnnUtils::DataLayoutIndexed dataLayoutIndexed(desc.m_DataLayout);
        unsigned int widthIndex = dataLayoutIndexed.GetWidthIndex();
        unsigned int heightIndex = dataLayoutIndexed.GetHeightIndex();
        const uint32_t kernelX = weights.GetShape()[widthIndex];
        const uint32_t kernelY = weights.GetShape()[heightIndex];
        const uint32_t inputX = inputInfo.GetShape()[widthIndex];
        const uint32_t inputY = inputInfo.GetShape()[heightIndex];

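        // CalcPadding resolves the implicit padding scheme into explicit values following the Android NN
        // rules: for SAME padding the total pad per dimension is
        // max(0, (ceil(in / stride) - 1) * stride + (kernel - 1) * dilation + 1 - in), split as evenly as
        // possible with any odd pixel going to the right/bottom; for VALID padding it is zero.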
        CalcPadding(inputX, kernelX, desc.m_StrideX, desc.m_DilationX, desc.m_PadLeft, desc.m_PadRight, paddingScheme);
        CalcPadding(inputY, kernelY, desc.m_StrideY, desc.m_DilationY, desc.m_PadTop, desc.m_PadBottom, paddingScheme);
    }
    else if (operation.inputs.size() >= 10)
    {
        // explicit padding
        if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 3, OperandType::INT32, desc.m_PadLeft, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_PadRight, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_PadTop, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 6, OperandType::INT32, desc.m_PadBottom, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 7, OperandType::INT32, desc.m_StrideX, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 8, OperandType::INT32, desc.m_StrideY, model, data) ||
            !GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 9, activation, model, data) ||
            !GetOptionalConvolutionDilationParams<hal_1_2::HalPolicy>(operation, 11, desc, model, data))
        {
            return Fail("%s: Operation has invalid inputs (explicit padding)", __func__);
        }
    }
    else
    {
        return Fail("%s: Unsupported number of operation inputs", __func__);
    }

    desc.m_BiasEnabled = true;
    armnn::Optional<armnn::TensorInfo> biases(bias.GetInfo());

    bool isSupported = false;
    FORWARD_LAYER_SUPPORT_FUNC(__func__,
                               IsConvolution2dSupported,
                               data.m_Backends,
                               isSupported,
                               inputInfo,
                               outputInfo,
                               desc,
                               weights.GetInfo(),
                               biases);

    if (!isSupported)
    {
        return false;
    }

    armnn::IConnectableLayer* startLayer =
        data.m_Network->AddConvolution2dLayer(desc, weights, armnn::Optional<armnn::ConstTensor>(bias));

    if (!startLayer)
    {
        return Fail("%s: AddConvolution2dLayer failed", __func__);
    }

    armnn::IConnectableLayer* endLayer = ProcessActivation(outputInfo, activation, startLayer, data);

    if (!endLayer)
    {
        return Fail("%s: ProcessActivation failed", __func__);
    }

    input.Connect(startLayer->GetInputSlot(0));

    return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *endLayer, model, data);
}

bool HalPolicy::ConvertDepthwiseConv2d(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertDepthwiseConv2d()");

    LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);

    if (!input.IsValid())
    {
        return Fail("%s: Operation has invalid inputs", __func__);
    }

    const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);

    if (!output)
    {
        return Fail("%s: Could not read output 0", __func__);
    }

    const armnn::TensorInfo& inputInfo = input.GetTensorInfo();
    const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

    if (IsDynamicTensor(outputInfo))
    {
        return Fail("%s: Dynamic output tensors are not supported", __func__);
    }

    // ArmNN does not currently support non-fixed weights or bias
    // Find the shape of the weights tensor. In AndroidNN this will be [ 1, H, W, I * M ]
    const Operand* weightsOperand = GetInputOperand<hal_1_2::HalPolicy>(operation, 1, model);

    if (weightsOperand == nullptr)
    {
        return Fail("%s: Operand is invalid", __func__);
    }
    armnn::DepthwiseConvolution2dDescriptor desc;
    desc.m_DataLayout = armnn::DataLayout::NHWC;

    // Determine whether padding is implicit or explicit
    bool implicitPadding = operation.inputs.size() == 8 ||
                           (operation.inputs.size() >= 9 &&
                            GetInputOperand<hal_1_2::HalPolicy>(operation, 8, model)->type == OperandType::BOOL);

    // Look ahead to find the optional DataLayout, if present
    const uint32_t dataLayoutFlagIndex = implicitPadding ? 8 : 11;
    desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, dataLayoutFlagIndex, model, data);

    armnnUtils::DataLayoutIndexed dataLayoutIndexed(desc.m_DataLayout);
    unsigned int channelsIndex = dataLayoutIndexed.GetChannelsIndex();
    unsigned int widthIndex = dataLayoutIndexed.GetWidthIndex();
    unsigned int heightIndex = dataLayoutIndexed.GetHeightIndex();

    // Reinterpret weight data as [ H, W, I, M ]
    armnn::TensorShape weightsShape({ weightsOperand->dimensions[1],
                                      weightsOperand->dimensions[2],
                                      inputInfo.GetShape()[channelsIndex],
                                      weightsOperand->dimensions[3] / inputInfo.GetShape()[channelsIndex] });
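    // For example (shapes chosen for illustration only): with an input depth I = 8 and a depth multiplier
    // M = 3, the NNAPI filter [ 1, H, W, 24 ] is reinterpreted as [ H, W, 8, 3 ] here and then, by the
    // swizzle below, rearranged to [ 3, 8, H, W ], the [ M, I, H, W ] layout ArmNN expects.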

    // Swizzle weight data [ H, W, I, M ] -> [ M, I, H, W ]
    const armnn::PermutationVector HWIMToMIHW = { 2U, 3U, 1U, 0U };

    const ConstTensorPin weightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  1,
                                                                  model,
                                                                  data,
                                                                  HWIMToMIHW,
                                                                  &weightsShape);

    // Bias is a 1D tensor
    const ConstTensorPin biasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 2, model, data);

    if (!weightsPin.IsValid())
    {
        return Fail("%s: Operation has invalid weights", __func__);
    }

    if (!biasPin.IsValid())
    {
        return Fail("%s: Operation has invalid biases", __func__);
    }

    armnn::ConstTensor weights = weightsPin.GetConstTensor();
    armnn::ConstTensor bias = biasPin.GetConstTensor();
    SanitizeBiasQuantizationScale(bias.GetInfo(), weights.GetInfo(), inputInfo);

    ActivationFn activation;

    if (implicitPadding)
    {
        android::nn::PaddingScheme paddingScheme;
        if (!GetInputPaddingScheme<hal_1_2::HalPolicy>(operation, 3, paddingScheme, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_StrideX, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_StrideY, model, data) ||
            !GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 7, activation, model, data) ||
            !GetOptionalConvolutionDilationParams<hal_1_2::HalPolicy>(operation, 9, desc, model, data))
        {
            return Fail("%s: Operation has invalid inputs (implicit padding)", __func__);
        }

        const uint32_t kernelX = weights.GetShape()[3];
        const uint32_t kernelY = weights.GetShape()[2];
        const uint32_t inputX = inputInfo.GetShape()[widthIndex];
        const uint32_t inputY = inputInfo.GetShape()[heightIndex];

        CalcPadding(inputX, kernelX, desc.m_StrideX, desc.m_DilationX, desc.m_PadLeft, desc.m_PadRight, paddingScheme);
        CalcPadding(inputY, kernelY, desc.m_StrideY, desc.m_DilationY, desc.m_PadTop, desc.m_PadBottom, paddingScheme);
    }
    else if (operation.inputs.size() >= 11)
    {
        // explicit padding
        if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 3, OperandType::INT32, desc.m_PadLeft, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_PadRight, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_PadTop, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 6, OperandType::INT32, desc.m_PadBottom, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 7, OperandType::INT32, desc.m_StrideX, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 8, OperandType::INT32, desc.m_StrideY, model, data) ||
            !GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 10, activation, model, data) ||
            !GetOptionalConvolutionDilationParams<hal_1_2::HalPolicy>(operation, 12, desc, model, data))
        {
            return Fail("%s: Operation has invalid inputs (explicit padding)", __func__);
        }
    }
    else
    {
        return Fail("%s: Unsupported number of operation inputs", __func__);
    }

    desc.m_BiasEnabled = true;
    armnn::Optional<armnn::TensorInfo> biases(bias.GetInfo());

    bool isSupported = false;
    FORWARD_LAYER_SUPPORT_FUNC(__func__,
                               IsDepthwiseConvolutionSupported,
                               data.m_Backends,
                               isSupported,
                               inputInfo,
                               outputInfo,
                               desc,
                               weights.GetInfo(),
                               biases);

    if (!isSupported)
    {
        return false;
    }

    armnn::IConnectableLayer* startLayer =
        data.m_Network->AddDepthwiseConvolution2dLayer(desc, weights, armnn::Optional<armnn::ConstTensor>(bias));

    if (!startLayer)
    {
        return Fail("%s: AddDepthwiseConvolution2dLayer failed", __func__);
    }

    armnn::IConnectableLayer* endLayer = ProcessActivation(outputInfo, activation, startLayer, data);
    if (!endLayer)
    {
        return Fail("%s: ProcessActivation failed", __func__);
    }

    input.Connect(startLayer->GetInputSlot(0));

    return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *endLayer, model, data);
}

bool HalPolicy::ConvertL2Pool2d(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertL2Pool2d()");
    return ConvertPooling2d<hal_1_2::HalPolicy>(operation, __func__, armnn::PoolingAlgorithm::L2, model, data);
}

bool HalPolicy::ConvertMaxPool2d(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertMaxPool2d()");
    return ConvertPooling2d<hal_1_2::HalPolicy>(operation, __func__, armnn::PoolingAlgorithm::Max, model, data);
}

bool HalPolicy::ConvertMaximum(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertMaximum()");

    LayerInputHandle input0 = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
    LayerInputHandle input1 = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 1, model, data);

    if (!input0.IsValid() || !input1.IsValid())
    {
        return Fail("%s: Operation has invalid inputs", __func__);
    }

    const Operand* outputOperand = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
    if (!outputOperand)
    {
        return Fail("%s: Could not read output", __func__);
    }

    const armnn::TensorInfo& outInfo = GetTensorInfoForOperand(*outputOperand);
    if (IsDynamicTensor(outInfo))
    {
        return Fail("%s: Dynamic output tensors are not supported", __func__);
    }

    bool isSupported = false;
    FORWARD_LAYER_SUPPORT_FUNC(__func__,
                               IsMaximumSupported,
                               data.m_Backends,
                               isSupported,
                               input0.GetTensorInfo(),
                               input1.GetTensorInfo(),
                               outInfo);

    if (!isSupported)
    {
        return false;
    }

    armnn::IConnectableLayer* layer = data.m_Network->AddMaximumLayer();
    assert(layer != nullptr);
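    // NNAPI MAXIMUM follows numpy-style broadcasting; the BroadcastTensor helper aligns the two input ranks
    // (prepending leading 1 dimensions to the lower-rank input via a reshape) before connecting both inputs.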
    BroadcastTensor(input0, input1, layer, *data.m_Network);

    return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
}

bool HalPolicy::ConvertMinimum(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertMinimum()");

    LayerInputHandle input0 = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
    LayerInputHandle input1 = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 1, model, data);

    if (!input0.IsValid() || !input1.IsValid())
    {
        return Fail("%s: Operation has invalid inputs", __func__);
    }

    const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
    if (!output)
    {
        return Fail("%s: Could not read output 0", __func__);
    }

    const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
    if (IsDynamicTensor(outputInfo))
    {
        return Fail("%s: Dynamic output tensors are not supported", __func__);
    }

    bool isSupported = false;
    FORWARD_LAYER_SUPPORT_FUNC(__func__,
                               IsMinimumSupported,
                               data.m_Backends,
                               isSupported,
                               input0.GetTensorInfo(),
                               input1.GetTensorInfo(),
                               outputInfo);

    if (!isSupported)
    {
        return false;
    }

    armnn::IConnectableLayer* const layer = data.m_Network->AddMinimumLayer();
    assert(layer != nullptr);
    BroadcastTensor(input0, input1, layer, *data.m_Network);

    return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
}

bool HalPolicy::ConvertPad(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertPad()");
    return ::ConvertPad<hal_1_2::HalPolicy>(operation, model, data);
}

bool HalPolicy::ConvertPadV2(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertPadV2()");

    LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
    if (!input.IsValid())
    {
        return Fail("%s: Could not read input 0", __func__);
    }

    const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
    if (!output)
    {
        return Fail("%s: Could not read output", __func__);
    }

    const armnn::TensorInfo& inputInfo = input.GetTensorInfo();
    unsigned int rank = inputInfo.GetNumDimensions();

    armnn::PadDescriptor descriptor;
    if (!ConvertPaddings<hal_1_2::HalPolicy>(operation, model, data, rank, descriptor))
    {
        return Fail("%s: Could not convert paddings", __func__);
    }

    const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
    if (IsDynamicTensor(outputInfo))
    {
        return Fail("%s: Dynamic output tensors are not supported", __func__);
    }

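    // PAD_V2 input 2 is a scalar pad value whose type must correspond to the input tensor's type:
    // FLOAT16 for TENSOR_FLOAT16, FLOAT32 for TENSOR_FLOAT32 and INT32 for TENSOR_QUANT8_ASYMM.
    // The branches below enforce exactly those pairings.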
    // Determine type of padding value
    OperandType operandType0;
    OperandType operandType2;

    if (!GetOperandType<hal_1_2::HalPolicy>(operation, 0, model, operandType0) ||
        !GetOperandType<hal_1_2::HalPolicy>(operation, 2, model, operandType2))
    {
        return Fail("%s: Operation has invalid inputs", __func__);
    }

    // Read value to use for padding
    if (operandType0 == OperandType::TENSOR_FLOAT16 && operandType2 == OperandType::FLOAT16)
    {
        armnn::Half f16PadValue;
        if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 2, operandType2, f16PadValue, model, data))
        {
            return Fail("%s: Could not read input 2 (FLOAT16)", __func__);
        }

        descriptor.m_PadValue = f16PadValue;
    }
    else if (operandType0 == OperandType::TENSOR_FLOAT32 && operandType2 == OperandType::FLOAT32)
    {
        if (!GetInputFloat32<hal_1_2::HalPolicy>(operation, 2, descriptor.m_PadValue, model, data))
        {
            return Fail("%s: Could not read input 2 (FLOAT32)", __func__);
        }
    }
    else if (operandType0 == OperandType::TENSOR_QUANT8_ASYMM && operandType2 == OperandType::INT32)
    {
        int32_t intPadValue = 0;
        if (!GetInputInt32<hal_1_2::HalPolicy>(operation, 2, intPadValue, model, data))
        {
            return Fail("%s: Could not read input 2 (INT32)", __func__);
        }
        descriptor.m_PadValue = intPadValue;
    }
    else
    {
        return Fail("%s: Operation has invalid inputs: type mismatch", __func__);
    }

    bool isSupported = false;
    FORWARD_LAYER_SUPPORT_FUNC(__func__,
                               IsPadSupported,
                               data.m_Backends,
                               isSupported,
                               inputInfo,
                               outputInfo,
                               descriptor);
    if (!isSupported)
    {
        return false;
    }

    armnn::IConnectableLayer* const layer = data.m_Network->AddPadLayer(descriptor);
    assert(layer != nullptr);
    input.Connect(layer->GetInputSlot(0));
    layer->GetOutputSlot(0).SetTensorInfo(outputInfo);

    return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
}

bool HalPolicy::ConvertPrelu(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertPrelu()");

    LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
    LayerInputHandle alpha = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 1, model, data);

    if (!input.IsValid() || !alpha.IsValid())
    {
        return Fail("%s: Operation has invalid inputs", __func__);
    }

    const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);

    if (!output)
    {
        return Fail("%s: Could not read output", __func__);
    }

    const armnn::TensorInfo& inputInfo = input.GetTensorInfo();
    const armnn::TensorInfo& alphaInfo = alpha.GetTensorInfo();
    const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

    if (IsDynamicTensor(outputInfo))
    {
        return Fail("%s: Dynamic output tensors are not supported", __func__);
    }

    bool isSupported = false;
    FORWARD_LAYER_SUPPORT_FUNC(__func__,
                               IsPreluSupported,
                               data.m_Backends,
                               isSupported,
                               inputInfo,
                               alphaInfo,
                               outputInfo);
    if (!isSupported)
    {
        return false;
    }

    armnn::IConnectableLayer* const layer = data.m_Network->AddPreluLayer();

    if (!layer)
    {
        return Fail("%s: AddPreluLayer failed", __func__);
    }

    BroadcastTensor(input, alpha, layer, *data.m_Network);

    return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
}

bool HalPolicy::ConvertQuantize(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertQuantize()");

    LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
    if (!input.IsValid())
    {
        return Fail("%s: Operation has invalid input", __func__);
    }

    const Operand* const outputOperand = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
    if (!outputOperand)
    {
        return Fail("%s: Operation has invalid outputs", __func__);
    }

    const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*outputOperand);
    if (IsDynamicTensor(outputInfo))
    {
        return Fail("%s: Dynamic output tensors are not supported", __func__);
    }

    bool isSupported = false;
    FORWARD_LAYER_SUPPORT_FUNC(__func__,
                               IsQuantizeSupported,
                               data.m_Backends,
                               isSupported,
                               input.GetTensorInfo(),
                               outputInfo);
    if (!isSupported)
    {
        return false;
    }

    armnn::IConnectableLayer* const layer = data.m_Network->AddQuantizeLayer();
    assert(layer != nullptr);
    input.Connect(layer->GetInputSlot(0));

    return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
}

bool HalPolicy::ConvertQuantizedLstm(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertQuantizedLstm()");

    // Inputs:
    // 0: The input: A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape [numBatches, inputSize]
    //    specifying the input to the LSTM cell. Tensor is quantized with a fixed quantization range of -1, 127/128.
    LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
    if (!input.IsValid())
    {
        return Fail("%s: Could not read input 0: input", __func__);
    }

    // 13: The previous cell state: A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT16_SYMM and shape
    //     [numBatches, outputSize] specifying the cell state from the previous time step of the LSTM cell.
    //     It is quantized using a quantization range of -2^4, 2^4 * 32767/32768.
    LayerInputHandle previousCellStateIn = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 13, model, data);
    if (!previousCellStateIn.IsValid())
    {
        return Fail("%s: Could not read input 13: previousCellStateIn", __func__);
    }

    // 14: The previous output state: A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //     [numBatches, outputSize] specifying the output of the LSTM cell from the previous time step. Tensor
    //     is quantized with a fixed quantization range of -1, 127/128.
    LayerInputHandle previousOutputIn = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 14, model, data);
    if (!previousOutputIn.IsValid())
    {
        return Fail("%s: Could not read input 14: previousOutputIn", __func__);
    }

    // Get the input tensors:
    // 1: The input-to-input weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //    [outputSize, inputSize] specifying input-to-input part of weights for fully-connected layer inside the
    //    LSTM cell. Quantization zero point and scale must be the same across all the weights.
    const ConstTensorPin inputToInputWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data);

    // 2: The input-to-forget weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //    [outputSize, inputSize] specifying input-to-forget part of weights for fully-connected layer inside the
    //    LSTM cell. Quantization zero point and scale must be the same across all the weights.
    const ConstTensorPin inputToForgetWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 2, model, data);

    // 3: The input-to-cell weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //    [outputSize, inputSize] specifying input-to-cell part of weights for fully-connected layer inside the
    //    LSTM cell. Quantization zero point and scale must be the same across all the weights.
    const ConstTensorPin inputToCellWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 3, model, data);

    // 4: The input-to-output weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //    [outputSize, inputSize] specifying input-to-output part of weights for fully-connected layer inside the
    //    LSTM cell. Quantization zero point and scale must be the same across all the weights.
    const ConstTensorPin inputToOutputWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 4, model, data);

    // 5: The recurrent-to-input weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //    [outputSize, outputSize] specifying recurrent-to-input part of weights for fully-connected layer inside
    //    the LSTM cell. Quantization zero point and scale must be the same across all the weights.
    const ConstTensorPin recurrentToInputWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 5, model, data);

    // 6: The recurrent-to-forget weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //    [outputSize, outputSize] specifying recurrent-to-forget part of weights for fully-connected layer inside
    //    the LSTM cell. Quantization zero point and scale must be the same across all the weights.
    const ConstTensorPin recurrentToForgetWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 6, model, data);

    // 7: The recurrent-to-cell weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //    [outputSize, outputSize] specifying recurrent-to-cell part of weights for fully-connected layer inside
    //    the LSTM cell. Quantization zero point and scale must be the same across all the weights.
    const ConstTensorPin recurrentToCellWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 7, model, data);

    // 8: The recurrent-to-output weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //    [outputSize, outputSize] specifying recurrent-to-output part of weights for fully-connected layer inside
    //    the LSTM cell. Quantization zero point and scale must be the same across all the weights.
    const ConstTensorPin recurrentToOutputWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 8, model, data);

    // 9: The input gate bias. A 1-D tensor of type ANEURALNETWORKS_TENSOR_INT32 and shape [outputSize] specifying
    //    the bias for the fully-connected layer inside the LSTM cell. Bias is quantized with scale being a product
    //    of input and weights scales and zeroPoint equal to 0.
    const ConstTensorPin inputGateBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 9, model, data);

    // 10: The forget gate bias. A 1-D tensor of type ANEURALNETWORKS_TENSOR_INT32 and shape [outputSize] specifying
    //     the bias for the fully-connected layer inside the LSTM cell. Bias is quantized with scale being a product
    //     of input and weights scales and zeroPoint equal to 0.
    const ConstTensorPin forgetGateBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 10, model, data);

    // 11: The cell bias. A 1-D tensor of type ANEURALNETWORKS_TENSOR_INT32 and shape [outputSize] specifying the
    //     bias for the fully-connected layer inside the LSTM cell. Bias is quantized with scale being a product
    //     of input and weights scales and zeroPoint equal to 0.
    const ConstTensorPin cellBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 11, model, data);

    // 12: The output gate bias. A 1-D tensor of type ANEURALNETWORKS_TENSOR_INT32 and shape [outputSize] specifying
    //     the bias for the fully-connected layer inside the LSTM cell. Bias is quantized with scale being a product
    //     of input and weights scales and zeroPoint equal to 0.
    const ConstTensorPin outputGateBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 12, model, data);

    if (!inputToInputWeightsPin.IsValid() ||
        !inputToForgetWeightsPin.IsValid() ||
        !inputToCellWeightsPin.IsValid() ||
        !inputToOutputWeightsPin.IsValid() ||
        !recurrentToInputWeightsPin.IsValid() ||
        !recurrentToForgetWeightsPin.IsValid() ||
        !recurrentToCellWeightsPin.IsValid() ||
        !recurrentToOutputWeightsPin.IsValid() ||
        !inputGateBiasPin.IsValid() ||
        !forgetGateBiasPin.IsValid() ||
        !cellBiasPin.IsValid() ||
        !outputGateBiasPin.IsValid())
    {
        return Fail("%s: Operation has invalid tensor inputs", __func__);
    }

    // Outputs:
    // 0: The cell state: A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT16_SYMM and shape [numBatches, outputSize]
    //    which contains a cell state from the current time step. Tensor is quantized using a quantization range
    //    of -2^4, 2^4 * 32767/32768.
    const Operand* cellStateOut = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
    if (!cellStateOut)
    {
        return Fail("%s: Could not read output 0: cellStateOut", __func__);
    }

    // 1: The output: A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape [numBatches, outputSize]
    //    which contains the output value. Tensor is quantized with a fixed quantization range of -1, 127/128.
    const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 1, model);
    if (!output)
    {
        return Fail("%s: Could not read output 1: output", __func__);
    }

    // Inputs
    const armnn::TensorInfo& inputInfo = input.GetTensorInfo();
    const armnn::TensorInfo& previousCellStateInInfo = previousCellStateIn.GetTensorInfo();
    const armnn::TensorInfo& previousOutputInInfo = previousOutputIn.GetTensorInfo();

    // Outputs
    const armnn::TensorInfo& cellStateOutInfo = GetTensorInfoForOperand(*cellStateOut);
    const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

    // Dynamic tensors currently not supported
    if (IsDynamicTensor(cellStateOutInfo) || IsDynamicTensor(outputInfo))
    {
        return Fail("%s: Dynamic output tensors are not supported", __func__);
    }

    armnn::QuantizedLstmInputParams params;

    params.m_InputToInputWeights = inputToInputWeightsPin.GetConstTensorPtr();
    params.m_InputToForgetWeights = inputToForgetWeightsPin.GetConstTensorPtr();
    params.m_InputToCellWeights = inputToCellWeightsPin.GetConstTensorPtr();
    params.m_InputToOutputWeights = inputToOutputWeightsPin.GetConstTensorPtr();
    params.m_RecurrentToInputWeights = recurrentToInputWeightsPin.GetConstTensorPtr();
    params.m_RecurrentToForgetWeights = recurrentToForgetWeightsPin.GetConstTensorPtr();
    params.m_RecurrentToCellWeights = recurrentToCellWeightsPin.GetConstTensorPtr();
    params.m_RecurrentToOutputWeights = recurrentToOutputWeightsPin.GetConstTensorPtr();
    params.m_InputGateBias = inputGateBiasPin.GetConstTensorPtr();
    params.m_ForgetGateBias = forgetGateBiasPin.GetConstTensorPtr();
    params.m_CellBias = cellBiasPin.GetConstTensorPtr();
    params.m_OutputGateBias = outputGateBiasPin.GetConstTensorPtr();

    armnn::QuantizedLstmInputParamsInfo paramsInfo;
    paramsInfo.m_InputToInputWeights = &(params.m_InputToInputWeights->GetInfo());
    paramsInfo.m_InputToForgetWeights = &(params.m_InputToForgetWeights->GetInfo());
    paramsInfo.m_InputToCellWeights = &(params.m_InputToCellWeights->GetInfo());
    paramsInfo.m_InputToOutputWeights = &(params.m_InputToOutputWeights->GetInfo());
    paramsInfo.m_RecurrentToInputWeights = &(params.m_RecurrentToInputWeights->GetInfo());
    paramsInfo.m_RecurrentToForgetWeights = &(params.m_RecurrentToForgetWeights->GetInfo());
    paramsInfo.m_RecurrentToCellWeights = &(params.m_RecurrentToCellWeights->GetInfo());
    paramsInfo.m_RecurrentToOutputWeights = &(params.m_RecurrentToOutputWeights->GetInfo());
    paramsInfo.m_InputGateBias = &(params.m_InputGateBias->GetInfo());
    paramsInfo.m_ForgetGateBias = &(params.m_ForgetGateBias->GetInfo());
    paramsInfo.m_CellBias = &(params.m_CellBias->GetInfo());
    paramsInfo.m_OutputGateBias = &(params.m_OutputGateBias->GetInfo());

    bool isSupported = false;
    FORWARD_LAYER_SUPPORT_FUNC(__func__,
                               IsQuantizedLstmSupported,
                               data.m_Backends,
                               isSupported,
                               inputInfo,
                               previousCellStateInInfo,
                               previousOutputInInfo,
                               cellStateOutInfo,
                               outputInfo,
                               paramsInfo);

    if (!isSupported)
    {
        return false;
    }

    armnn::IConnectableLayer* const layer = data.m_Network->AddQuantizedLstmLayer(params, "QuantizedLstm");
    input.Connect(layer->GetInputSlot(0));
    previousOutputIn.Connect(layer->GetInputSlot(1));
    previousCellStateIn.Connect(layer->GetInputSlot(2));

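    // The ArmNN QuantizedLstm layer produces two outputs, mirroring the NNAPI operation: output slot 0
    // carries the new cell state and output slot 1 the cell output, so they are tracked against NNAPI
    // outputs 0 and 1 respectively.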
    return (SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, 0, model, data) &&
            SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 1, *layer, 1, model, data));
}

bool HalPolicy::ConvertReLu(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertReLu()");
    return ::ConvertReLu<hal_1_2::HalPolicy>(operation, model, data);
}

bool HalPolicy::ConvertReLu1(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertReLu1()");
    return ::ConvertReLu1<hal_1_2::HalPolicy>(operation, model, data);
}

bool HalPolicy::ConvertReLu6(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertReLu6()");
    return ::ConvertReLu6<hal_1_2::HalPolicy>(operation, model, data);
}

bool HalPolicy::ConvertResize(const Operation& operation,
                              const Model& model,
                              ConversionData& data,
                              armnn::ResizeMethod resizeMethod)
{
    ALOGV("hal_1_2::HalPolicy::ConvertResize()");

    LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
    if (!input.IsValid())
    {
        return Fail("%s: Could not read input 0", __func__);
    }

    const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
    if (!output)
    {
        return Fail("%s: Could not read output 0", __func__);
    }

    const armnn::TensorInfo& inputInfo = input.GetTensorInfo();
    const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

    if (IsDynamicTensor(outputInfo))
    {
        return Fail("%s: Dynamic output tensors are not supported", __func__);
    }

    armnn::ResizeDescriptor descriptor;
    descriptor.m_Method = resizeMethod;
    descriptor.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 3, model, data);

    OperandType operandType1;
    OperandType operandType2;

    if (!GetOperandType<hal_1_2::HalPolicy>(operation, 1, model, operandType1) ||
        !GetOperandType<hal_1_2::HalPolicy>(operation, 2, model, operandType2))
    {
        return Fail("%s: Operation has invalid inputs", __func__);
    }

    if (operandType1 != operandType2)
    {
        return Fail("%s: Operation has invalid inputs. Type of input 1 and 2 should be the same", __func__);
    }

    if (operandType1 == OperandType::INT32)
    {
        // Case 1: resizing by shape
        int32_t targetWidth = 0;
        int32_t targetHeight = 0;

        if (!GetInputInt32<hal_1_2::HalPolicy>(operation, 1, targetWidth, model, data) ||
            !GetInputInt32<hal_1_2::HalPolicy>(operation, 2, targetHeight, model, data))
        {
            return Fail("%s: Operation has invalid inputs for resizing by shape", __func__);
        }

        if (targetWidth < 0 || targetHeight < 0)
        {
            return Fail("%s: Operation has invalid inputs for resizing by shape. "
                        "Target width/height cannot be < 0", __func__);
        }

        descriptor.m_TargetWidth = static_cast<uint32_t>(targetWidth);
        descriptor.m_TargetHeight = static_cast<uint32_t>(targetHeight);
    }
    else if (operandType1 == OperandType::FLOAT32)
    {
        // Case 2: resizing by scale
        float widthScale = 1.0f;
        float heightScale = 1.0f;

        if (!GetInputFloat32<hal_1_2::HalPolicy>(operation, 1, widthScale, model, data) ||
            !GetInputFloat32<hal_1_2::HalPolicy>(operation, 2, heightScale, model, data))
        {
            return Fail("%s: Operation has invalid inputs for resizing by scale", __func__);
        }

        const armnn::TensorShape& inputShape = inputInfo.GetShape();
        armnnUtils::DataLayoutIndexed dataLayoutIndexed(descriptor.m_DataLayout);

        float width = inputShape[dataLayoutIndexed.GetWidthIndex()];
        float height = inputShape[dataLayoutIndexed.GetHeightIndex()];

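        // The target size is the scaled input size rounded down. For example, a 224x224 input with
        // widthScale = heightScale = 0.5f resizes to floor(112.0) = 112 in each spatial dimension.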
        descriptor.m_TargetWidth = std::floor(width * widthScale);
        descriptor.m_TargetHeight = std::floor(height * heightScale);
    }
    else
    {
        // NOTE: FLOAT16 scales are not supported
        return false;
    }

    bool isSupported = false;
    FORWARD_LAYER_SUPPORT_FUNC(__func__,
                               IsResizeSupported,
                               data.m_Backends,
                               isSupported,
                               inputInfo,
                               outputInfo,
                               descriptor);

    if (!isSupported)
    {
        return false;
    }

    armnn::IConnectableLayer* layer = data.m_Network->AddResizeLayer(descriptor);

    assert(layer != nullptr);

    layer->GetOutputSlot(0).SetTensorInfo(outputInfo);
    input.Connect(layer->GetInputSlot(0));

    return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
}

bool HalPolicy::ConvertSpaceToBatchNd(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertSpaceToBatchNd()");
    return ::ConvertSpaceToBatchNd<hal_1_2::HalPolicy>(operation, model, data);
}

bool HalPolicy::ConvertSpaceToDepth(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertSpaceToDepth()");

    LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
    if (!input.IsValid())
    {
        return Fail("%s: Operation has invalid inputs", __func__);
    }

    const armnn::TensorInfo& inputInfo = input.GetTensorInfo();
    unsigned int rank = inputInfo.GetNumDimensions();
    if (rank != 4)
    {
        return Fail("%s: Only inputs with rank 4 are supported", __func__);
    }

    const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
    if (!output)
    {
        return Fail("%s: Could not read output 0", __func__);
    }

    const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
    if (IsDynamicTensor(outputInfo))
    {
        return Fail("%s: Dynamic output tensors are not supported", __func__);
    }

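    // SPACE_TO_DEPTH moves blockSize x blockSize spatial patches into the channel dimension. For example
    // (shapes chosen for illustration only), an NHWC input of [ 1, 4, 4, 1 ] with block size 2 becomes
    // [ 1, 2, 2, 4 ].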
    armnn::SpaceToDepthDescriptor desc;

    GetInputScalar<hal_1_2::HalPolicy>(operation, 1, OperandType::INT32, desc.m_BlockSize, model, data);

    if (desc.m_BlockSize <= 1)
    {
        return Fail("%s: Block size must be at least 2 in all dimensions", __func__);
    }

    desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 2, model, data);

    bool isSupported = false;
    FORWARD_LAYER_SUPPORT_FUNC(__func__,
                               IsSpaceToDepthSupported,
                               data.m_Backends,
                               isSupported,
                               inputInfo,
                               outputInfo,
                               desc);
    if (!isSupported)
    {
        return false;
    }

    armnn::IConnectableLayer* const layer = data.m_Network->AddSpaceToDepthLayer(desc);
    assert(layer != nullptr);
    input.Connect(layer->GetInputSlot(0));

    return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
}

bool HalPolicy::ConvertSoftmax(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertSoftmax()");

    LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
    if (!input.IsValid())
    {
        return Fail("%s: Operation has invalid inputs", __func__);
    }

    const Operand* outputOperand = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
    if (!outputOperand)
    {
        return Fail("%s: Operation has no outputs", __func__);
    }

    const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*outputOperand);
    if (IsDynamicTensor(outputInfo))
    {
        return Fail("%s: Dynamic output tensors are not supported", __func__);
    }

    armnn::SoftmaxDescriptor desc;
    if (!GetInputFloat32<hal_1_2::HalPolicy>(operation, 1, desc.m_Beta, model, data))
    {
        return Fail("%s: Operation has invalid inputs", __func__);
    }

1253 if (operation.inputs.size() > 2 && !GetInputScalar<hal_1_2::HalPolicy>(operation,
1254 2,
1255 HalPolicy::OperandType::INT32,
1256 desc.m_Axis,
1257 model,
1258 data))
1259 {
1260 return Fail("%s: Operation has invalid inputs", __func__);
1261 }
1262
1263 bool isSupported = false;
1264 FORWARD_LAYER_SUPPORT_FUNC(__func__,
1265 IsSoftmaxSupported,
1266 data.m_Backends,
1267 isSupported,
1268 input.GetTensorInfo(),
1269 outputInfo,
1270 desc);
1271 if (!isSupported)
1272 {
1273 return false;
1274 }
1275
1276 armnn::IConnectableLayer* layer = data.m_Network->AddSoftmaxLayer(desc);
1277 assert(layer != nullptr);
1278 input.Connect(layer->GetInputSlot(0));
1279
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +01001280 return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
Francis Murtagh074c25a2019-07-22 16:40:57 +01001281}
1282
Mike Kelly0a879362019-07-29 16:56:31 +01001283bool HalPolicy::ConvertSub(const Operation& operation, const Model& model, ConversionData& data)
1284{
1285 ALOGV("hal_1_2::HalPolicy::ConvertSub()");
1286 return ::ConvertSub<hal_1_2::HalPolicy>(operation, model, data);
1287}
1288
Sadik Armagan61113162019-07-25 09:09:40 +01001289bool HalPolicy::ConvertTanH(const Operation& operation, const Model& model, ConversionData& data)
1290{
1291 ALOGV("hal_1_2::HalPolicy::ConvertTanH()");
1292 return ::ConvertTanH<hal_1_2::HalPolicy>(operation, model, data);
1293}
1294
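// For reference (a sketch of the standard LSTM formulation; not normative for
// every backend): per invocation the cell wired up below computes
//     i = sigmoid(W_xi x + W_hi h_prev + w_ci (*) c_prev + b_i)    // input gate
//     f = sigmoid(W_xf x + W_hf h_prev + w_cf (*) c_prev + b_f)    // forget gate
//     c = f (*) c_prev + i (*) g(W_xc x + W_hc h_prev + b_c)       // cell state
//     o = sigmoid(W_xo x + W_ho h_prev + w_co (*) c + b_o)         // output gate
//     h = o (*) g(c), optionally projected and clipped
// where g is the activation selected by operand 20 and (*) denotes elementwise
// multiplication. The peephole terms w_c* and the projection apply only when the
// corresponding optional weights are supplied; with CIFG the input gate is
// coupled to the forget gate as i = 1 - f.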
bool HalPolicy::ConvertLstm(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertLstm()");

    // Inputs:
    // 00: The input: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, input_size], where
    //     “batch_size” corresponds to the batching dimension, and “input_size” is the size of the input.
    LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
    if (!input.IsValid())
    {
        return Fail("%s: Could not read input 0: input", __func__);
    }
    // 18: The output state: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, output_size].
    LayerInputHandle outputStateIn = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 18, model, data);
    if (!outputStateIn.IsValid())
    {
        return Fail("%s: Could not read input 18: outputStateIn", __func__);
    }
    // 19: The cell state: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, num_units].
    LayerInputHandle cellStateIn = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 19, model, data);
    if (!cellStateIn.IsValid())
    {
        return Fail("%s: Could not read input 19: cellStateIn", __func__);
    }

    // Get the mandatory input tensors:
    // 02: The input-to-forget weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [num_units, input_size].
    const ConstTensorPin inputToForgetWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 2, model, data);
    // 03: The input-to-cell weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [num_units, input_size].
    const ConstTensorPin inputToCellWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 3, model, data);
    // 04: The input-to-output weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [num_units, input_size].
    const ConstTensorPin inputToOutputWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 4, model, data);
    // 06: The recurrent-to-forget weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [num_units, output_size].
    const ConstTensorPin recurrentToForgetWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 6, model, data);
    // 07: The recurrent-to-cell weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [num_units, output_size].
    const ConstTensorPin recurrentToCellWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 7, model, data);
    // 08: The recurrent-to-output weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [num_units, output_size].
    const ConstTensorPin recurrentToOutputWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 8, model, data);
    // 13: The forget gate bias: A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].
    const ConstTensorPin forgetGateBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 13, model, data);
    // 14: The cell bias: A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].
    const ConstTensorPin cellBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 14, model, data);
    // 15: The output gate bias: A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].
    const ConstTensorPin outputGateBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 15, model, data);

    if (!inputToForgetWeightsPin.IsValid() ||
        !inputToCellWeightsPin.IsValid() ||
        !inputToOutputWeightsPin.IsValid() ||
        !recurrentToForgetWeightsPin.IsValid() ||
        !recurrentToCellWeightsPin.IsValid() ||
        !recurrentToOutputWeightsPin.IsValid() ||
        !forgetGateBiasPin.IsValid() ||
        !cellBiasPin.IsValid() ||
        !outputGateBiasPin.IsValid())
    {
        return Fail("%s: Operation has invalid tensor inputs", __func__);
    }

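    // Note (inferred from the validity checks in this function): the trailing
    // 'true' argument below marks an operand as optional, so a pin for an absent
    // optional operand reports IsOptional() == true and IsValid() == false instead
    // of failing the conversion outright.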
    // Get the optional input tensors:
    // 01: The input-to-input weights: Optional. A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [num_units, input_size], where “num_units” corresponds to the number of cell units.
    const ConstTensorPin inputToInputWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  1,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    // 05: The recurrent-to-input weights: Optional. A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [num_units, output_size], where “output_size” corresponds to either the number of cell units (i.e.,
    //     “num_units”), or the second dimension of the “projection_weights”, if defined.
    const ConstTensorPin recurrentToInputWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  5,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    // 09: The cell-to-input weights: Optional. A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].
    const ConstTensorPin cellToInputWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  9,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    // 10: The cell-to-forget weights: Optional. A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].
    const ConstTensorPin cellToForgetWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  10,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    // 11: The cell-to-output weights: Optional. A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].
    const ConstTensorPin cellToOutputWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  11,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    // 12: The input gate bias: Optional. A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].
    const ConstTensorPin inputGateBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  12,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    // 16: The projection weights: Optional. A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [output_size, num_units].
    const ConstTensorPin projectionWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  16,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    // 17: The projection bias: Optional. A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [output_size].
    const ConstTensorPin projectionBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  17,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    if ((!inputToInputWeightsPin.IsValid() && !inputToInputWeightsPin.IsOptional()) ||
        (!recurrentToInputWeightsPin.IsValid() && !recurrentToInputWeightsPin.IsOptional()) ||
        (!cellToInputWeightsPin.IsValid() && !cellToInputWeightsPin.IsOptional()) ||
        (!cellToForgetWeightsPin.IsValid() && !cellToForgetWeightsPin.IsOptional()) ||
        (!cellToOutputWeightsPin.IsValid() && !cellToOutputWeightsPin.IsOptional()) ||
        (!inputGateBiasPin.IsValid() && !inputGateBiasPin.IsOptional()) ||
        (!projectionWeightsPin.IsValid() && !projectionWeightsPin.IsOptional()) ||
        (!projectionBiasPin.IsValid() && !projectionBiasPin.IsOptional()))
    {
        return Fail("%s: Operation has invalid tensor inputs", __func__);
    }

    // Get the mandatory input scalars (actually 1-D tensors of size 1):
    // 20: The activation function: A value indicating the activation function:
    //     0: None; 1: Relu; 3: Relu6; 4: Tanh; 6: Sigmoid.
    // 21: The clipping threshold: for the cell state, such that values are bound within [-cell_clip, cell_clip].
    //     If set to 0.0 then clipping is disabled.
    // 22: The clipping threshold: for the output from the projection layer, such that values are bound within
    //     [-proj_clip, proj_clip]. If set to 0.0 then clipping is disabled.
    ActivationFn activation;
    float cellClip;
    float projClip;
    if (!GetInputActivationFunctionFromTensor<hal_1_2::HalPolicy>(operation, 20, activation, model, data) ||
        !GetInputScalar<hal_1_2::HalPolicy>(operation, 21, OperandType::FLOAT32, cellClip, model, data) ||
        !GetInputScalar<hal_1_2::HalPolicy>(operation, 22, OperandType::FLOAT32, projClip, model, data))
    {
        return Fail("%s: Operation has invalid scalar inputs", __func__);
    }

    // Get the normalization tensors
    // 23: The input layer normalization weights. A 1-D tensor of shape [num_units].
    //     Used to rescale normalized inputs to activation at input gate.
    const ConstTensorPin inputLayerNormWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  23,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    // 24: The forget layer normalization weights. A 1-D tensor of shape [num_units].
    //     Used to rescale normalized inputs to activation at forget gate.
    const ConstTensorPin forgetLayerNormWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  24,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    // 25: The cell layer normalization weights. A 1-D tensor of shape [num_units].
    //     Used to rescale normalized inputs to activation at cell gate.
    const ConstTensorPin cellLayerNormWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  25,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    // 26: The output layer normalization weights. A 1-D tensor of shape [num_units].
    //     Used to rescale normalized inputs to activation at output gate.
    const ConstTensorPin outputLayerNormWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  26,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    // Outputs:
    // 00: The scratch buffer: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, num_units * 3]
    //     with CIFG, or [batch_size, num_units * 4] without CIFG.
    const Operand* scratchBuffer = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
    if (!scratchBuffer)
    {
        return Fail("%s: Could not read output 0: scratchBuffer", __func__);
    }
    // 01: The output state (out): A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, output_size].
    const Operand* outputStateOut = GetOutputOperand<hal_1_2::HalPolicy>(operation, 1, model);
    if (!outputStateOut)
    {
        return Fail("%s: Could not read output 1: outputStateOut", __func__);
    }
    // 02: The cell state (out): A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, num_units].
    const Operand* cellStateOut = GetOutputOperand<hal_1_2::HalPolicy>(operation, 2, model);
    if (!cellStateOut)
    {
        return Fail("%s: Could not read output 2: cellStateOut", __func__);
    }
    // 03: The output: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, output_size]. This is
    //     effectively the same as the current “output state (out)” value.
    const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 3, model);
    if (!output)
    {
        return Fail("%s: Could not read output 3: output", __func__);
    }

    // set the params structure for the AddLstmLayer call
    armnn::LstmInputParams params;
    params.m_InputToInputWeights = inputToInputWeightsPin.GetConstTensorPtr();
    params.m_InputToForgetWeights = inputToForgetWeightsPin.GetConstTensorPtr();
    params.m_InputToCellWeights = inputToCellWeightsPin.GetConstTensorPtr();
    params.m_InputToOutputWeights = inputToOutputWeightsPin.GetConstTensorPtr();
    params.m_RecurrentToInputWeights = recurrentToInputWeightsPin.GetConstTensorPtr();
    params.m_RecurrentToForgetWeights = recurrentToForgetWeightsPin.GetConstTensorPtr();
    params.m_RecurrentToCellWeights = recurrentToCellWeightsPin.GetConstTensorPtr();
    params.m_RecurrentToOutputWeights = recurrentToOutputWeightsPin.GetConstTensorPtr();
    params.m_CellToInputWeights = cellToInputWeightsPin.GetConstTensorPtr();
    params.m_CellToForgetWeights = cellToForgetWeightsPin.GetConstTensorPtr();
    params.m_CellToOutputWeights = cellToOutputWeightsPin.GetConstTensorPtr();
    params.m_InputGateBias = inputGateBiasPin.GetConstTensorPtr();
    params.m_ForgetGateBias = forgetGateBiasPin.GetConstTensorPtr();
    params.m_CellBias = cellBiasPin.GetConstTensorPtr();
    params.m_OutputGateBias = outputGateBiasPin.GetConstTensorPtr();
    params.m_ProjectionWeights = projectionWeightsPin.GetConstTensorPtr();
    params.m_ProjectionBias = projectionBiasPin.GetConstTensorPtr();
    params.m_InputLayerNormWeights = inputLayerNormWeightsPin.GetConstTensorPtr();
    params.m_ForgetLayerNormWeights = forgetLayerNormWeightsPin.GetConstTensorPtr();
    params.m_CellLayerNormWeights = cellLayerNormWeightsPin.GetConstTensorPtr();
    params.m_OutputLayerNormWeights = outputLayerNormWeightsPin.GetConstTensorPtr();

    // set the layer descriptor
    armnn::LstmDescriptor desc;
    desc.m_ActivationFunc = activation;
    desc.m_ClippingThresCell = cellClip;
    desc.m_ClippingThresProj = projClip;
    desc.m_CifgEnabled = (params.m_InputToInputWeights == nullptr ||
                          params.m_RecurrentToInputWeights == nullptr ||
                          params.m_InputGateBias == nullptr);
    desc.m_PeepholeEnabled = (params.m_CellToForgetWeights != nullptr ||
                              params.m_CellToOutputWeights != nullptr);
    desc.m_ProjectionEnabled = (params.m_ProjectionWeights != nullptr);
    desc.m_LayerNormEnabled = (params.m_InputLayerNormWeights != nullptr ||
                               params.m_ForgetLayerNormWeights != nullptr ||
                               params.m_CellLayerNormWeights != nullptr ||
                               params.m_OutputLayerNormWeights != nullptr);

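    // For example (illustrative, not from the spec text above): a CIFG model omits
    // operands 1, 5 and 12 (input-to-input weights, recurrent-to-input weights and
    // input gate bias), so all three pointers are null here, m_CifgEnabled becomes
    // true, and the input gate is derived from the forget gate (i = 1 - f).
    // Supplying only some of the three is rejected by the check below.
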
    // validate the optional input groups
    if (desc.m_CifgEnabled &&
        (params.m_InputToInputWeights != nullptr ||
         params.m_RecurrentToInputWeights != nullptr ||
         params.m_InputGateBias != nullptr))
    {
        return Fail("%s: All, or none, of input-to-input weights, recurrent-to-input weights,"
                    " and input gate bias must be provided", __func__);
    }

    if (!desc.m_ProjectionEnabled && params.m_ProjectionBias != nullptr)
    {
        return Fail("%s: projection bias should not be provided without projection weights", __func__);
    }

    if (desc.m_PeepholeEnabled &&
        (params.m_CellToForgetWeights == nullptr ||
         params.m_CellToOutputWeights == nullptr ||
         (!desc.m_CifgEnabled && params.m_CellToInputWeights == nullptr)))
    {
        return Fail("%s: All, or none, of cell-to-forget weights and cell-to-output weights must be provided"
                    " and, if CIFG is not enabled, cell-to-input weights must also be provided", __func__);
    }

    if (desc.m_LayerNormEnabled &&
        (params.m_ForgetLayerNormWeights == nullptr ||
         params.m_CellLayerNormWeights == nullptr ||
         params.m_OutputLayerNormWeights == nullptr ||
         (!desc.m_CifgEnabled && params.m_InputLayerNormWeights == nullptr)))
    {
        return Fail("%s: All, or none, of forget-norm weights, cell-norm weights and output-norm weights must be"
                    " provided and, if CIFG is not enabled, input-norm weights must also be provided", __func__);
    }

    // Check if the layer is supported
    // Inputs
    const armnn::TensorInfo& inputInfo = input.GetTensorInfo();
    const armnn::TensorInfo& outputStateInInfo = outputStateIn.GetTensorInfo();
    const armnn::TensorInfo& cellStateInInfo = cellStateIn.GetTensorInfo();

    // Outputs
    const armnn::TensorInfo& scratchBufferInfo = GetTensorInfoForOperand(*scratchBuffer);
    const armnn::TensorInfo& outputStateOutInfo = GetTensorInfoForOperand(*outputStateOut);
    const armnn::TensorInfo& cellStateOutInfo = GetTensorInfoForOperand(*cellStateOut);
    const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

    if (IsDynamicTensor(scratchBufferInfo) ||
        IsDynamicTensor(outputStateOutInfo) ||
        IsDynamicTensor(cellStateOutInfo) ||
        IsDynamicTensor(outputInfo))
    {
        return Fail("%s: Dynamic output tensors are not supported", __func__);
    }

    // Basic parameters
    armnn::LstmInputParamsInfo paramsInfo;
    paramsInfo.m_InputToForgetWeights = &(params.m_InputToForgetWeights->GetInfo());
    paramsInfo.m_InputToCellWeights = &(params.m_InputToCellWeights->GetInfo());
    paramsInfo.m_InputToOutputWeights = &(params.m_InputToOutputWeights->GetInfo());
    paramsInfo.m_RecurrentToForgetWeights = &(params.m_RecurrentToForgetWeights->GetInfo());
    paramsInfo.m_RecurrentToCellWeights = &(params.m_RecurrentToCellWeights->GetInfo());
    paramsInfo.m_RecurrentToOutputWeights = &(params.m_RecurrentToOutputWeights->GetInfo());
    paramsInfo.m_ForgetGateBias = &(params.m_ForgetGateBias->GetInfo());
    paramsInfo.m_CellBias = &(params.m_CellBias->GetInfo());
    paramsInfo.m_OutputGateBias = &(params.m_OutputGateBias->GetInfo());

    // Optional parameters
    if (!desc.m_CifgEnabled)
    {
        paramsInfo.m_InputToInputWeights = &(params.m_InputToInputWeights->GetInfo());
        paramsInfo.m_RecurrentToInputWeights = &(params.m_RecurrentToInputWeights->GetInfo());
        if (params.m_CellToInputWeights != nullptr)
        {
            paramsInfo.m_CellToInputWeights = &(params.m_CellToInputWeights->GetInfo());
        }
        paramsInfo.m_InputGateBias = &(params.m_InputGateBias->GetInfo());
    }

    if (desc.m_ProjectionEnabled)
    {
        paramsInfo.m_ProjectionWeights = &(params.m_ProjectionWeights->GetInfo());
        if (params.m_ProjectionBias != nullptr)
        {
            paramsInfo.m_ProjectionBias = &(params.m_ProjectionBias->GetInfo());
        }
    }

    if (desc.m_PeepholeEnabled)
    {
        paramsInfo.m_CellToForgetWeights = &(params.m_CellToForgetWeights->GetInfo());
        paramsInfo.m_CellToOutputWeights = &(params.m_CellToOutputWeights->GetInfo());
    }

    if (desc.m_LayerNormEnabled)
    {
        if (!desc.m_CifgEnabled)
        {
            paramsInfo.m_InputLayerNormWeights = &(params.m_InputLayerNormWeights->GetInfo());
        }
        paramsInfo.m_ForgetLayerNormWeights = &(params.m_ForgetLayerNormWeights->GetInfo());
        paramsInfo.m_CellLayerNormWeights = &(params.m_CellLayerNormWeights->GetInfo());
        paramsInfo.m_OutputLayerNormWeights = &(params.m_OutputLayerNormWeights->GetInfo());
    }

    bool isSupported = false;
    FORWARD_LAYER_SUPPORT_FUNC(__func__,
                               IsLstmSupported,
                               data.m_Backends,
                               isSupported,
                               inputInfo,
                               outputStateInInfo,
                               cellStateInInfo,
                               scratchBufferInfo,
                               outputStateOutInfo,
                               cellStateOutInfo,
                               outputInfo,
                               desc,
                               paramsInfo);
    if (!isSupported)
    {
        return false;
    }

    // Add the layer
    armnn::IConnectableLayer* layer = data.m_Network->AddLstmLayer(desc, params, "Lstm");

    input.Connect(layer->GetInputSlot(0));
    outputStateIn.Connect(layer->GetInputSlot(1));
    cellStateIn.Connect(layer->GetInputSlot(2));

    return (SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, 0, model, data) &&
            SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 1, *layer, 1, model, data) &&
            SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 2, *layer, 2, model, data) &&
            SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 3, *layer, 3, model, data));
}

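// For reference (a sketch of the usual size relation; assuming no output padding):
// a transposed convolution with stride s, kernel size k and total padding p along
// one spatial dimension satisfies
//     outputSize = s * (inputSize - 1) + k - p
// In the implicit-padding form handled below the requested output shape is part of
// the operation, so p is derived from it and can come out negative; such cases are
// rejected because Arm NN requires padding >= 0.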
bool HalPolicy::ConvertTransposeConv2d(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertTransposeConv2d()");

    LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);

    if (!input.IsValid())
    {
        return Fail("%s: Operation has invalid inputs", __func__);
    }

    const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);

    if (!output)
    {
        return Fail("%s: Could not read output 0", __func__);
    }

    const armnn::TensorInfo& inputInfo = input.GetTensorInfo();
    const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
    if (IsDynamicTensor(outputInfo))
    {
        return Fail("%s: Dynamic output tensors are not supported", __func__);
    }

    // ArmNN does not currently support non-fixed weights or bias
    // Find the shape of the weights tensor. In Android NN this will be
    // [ depth_out, filter_height, filter_width, depth_in ].
    const Operand* weightsOperand = GetInputOperand<hal_1_2::HalPolicy>(operation, 1, model);

    if (weightsOperand == nullptr)
    {
        return Fail("%s: Operand is invalid", __func__);
    }
    armnn::TransposeConvolution2dDescriptor desc;
    desc.m_DataLayout = armnn::DataLayout::NHWC;

    // Determine whether padding is implicit or explicit
    bool implicitPadding = operation.inputs.size() == 9;

    if (implicitPadding)
    {
        desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 8, model, data);
    }
    else
    {
        desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 10, model, data);
    }

    armnnUtils::DataLayoutIndexed dataLayoutIndexed(desc.m_DataLayout);
    unsigned int widthIndex = dataLayoutIndexed.GetWidthIndex();
    unsigned int heightIndex = dataLayoutIndexed.GetHeightIndex();

    const armnn::PermutationVector OHWIToOIHW = {0, 2, 3, 1};

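    // Reading of armnn::PermutationVector assumed here: mappings[i] is the
    // destination index of source dimension i, so {0, 2, 3, 1} sends O->0, H->2,
    // W->3, I->1, turning OHWI into OIHW; e.g. weights of shape [16, 3, 3, 8]
    // would be stored as [16, 8, 3, 3] for an NCHW backend.
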
    // The shape of the weight is [depth_out, filter_height, filter_width, depth_in].
    // We have to permute it to OIHW if the data layout is NCHW.
    const ConstTensorPin weightsPin = (desc.m_DataLayout == armnn::DataLayout::NCHW) ?
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data, OHWIToOIHW) :
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data);

    // Bias is a 1D tensor
    const ConstTensorPin biasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 2, model, data);

    if (!weightsPin.IsValid())
    {
        return Fail("%s: Operation has invalid weights", __func__);
    }

    if (!biasPin.IsValid())
    {
        return Fail("%s: Operation has invalid biases", __func__);
    }

    armnn::ConstTensor weights = weightsPin.GetConstTensor();
    armnn::ConstTensor bias = biasPin.GetConstTensor();
    SanitizeBiasQuantizationScale(bias.GetInfo(), weights.GetInfo(), inputInfo);

    ActivationFn activation;

    if (implicitPadding)
    {
        android::nn::PaddingScheme paddingScheme;
        if (!GetInputPaddingScheme<hal_1_2::HalPolicy>(operation, 4, paddingScheme, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_StrideX, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 6, OperandType::INT32, desc.m_StrideY, model, data) ||
            !GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 7, activation, model, data))
        {
            return Fail("%s: Operation has invalid inputs (implicit padding)", __func__);
        }

        const uint32_t kernelX = weights.GetShape()[widthIndex];
        const uint32_t kernelY = weights.GetShape()[heightIndex];
        const uint32_t outputX = outputInfo.GetShape()[widthIndex];
        const uint32_t outputY = outputInfo.GetShape()[heightIndex];

        int32_t padLeft{0};
        int32_t padRight{0};
        int32_t padTop{0};
        int32_t padBottom{0};

        CalcPaddingTransposeConv(outputX, kernelX, desc.m_StrideX, padLeft, padRight, paddingScheme);
        CalcPaddingTransposeConv(outputY, kernelY, desc.m_StrideY, padTop, padBottom, paddingScheme);

        // NOTE: The Android NN API allows for negative padding values in TransposeConv2d,
        // but Arm NN only supports values >= 0
        if (padLeft < 0 || padRight < 0 || padTop < 0 || padBottom < 0)
        {
            return Fail("%s: Negative padding values are not supported", __func__);
        }

        desc.m_PadLeft = boost::numeric_cast<uint32_t>(padLeft);
        desc.m_PadRight = boost::numeric_cast<uint32_t>(padRight);
        desc.m_PadTop = boost::numeric_cast<uint32_t>(padTop);
        desc.m_PadBottom = boost::numeric_cast<uint32_t>(padBottom);
    }
    else if (operation.inputs.size() == 11)
    {
        // explicit padding
        if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 3, OperandType::INT32, desc.m_PadLeft, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_PadRight, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_PadTop, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 6, OperandType::INT32, desc.m_PadBottom, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 7, OperandType::INT32, desc.m_StrideX, model, data) ||
            !GetInputScalar<hal_1_2::HalPolicy>(operation, 8, OperandType::INT32, desc.m_StrideY, model, data) ||
            !GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 9, activation, model, data))
        {
            return Fail("%s: Operation has invalid inputs (explicit padding)", __func__);
        }
    }
    else
    {
        return Fail("%s: Unsupported number of operation inputs", __func__);
    }

    desc.m_BiasEnabled = true;
    armnn::Optional<armnn::TensorInfo> biases(bias.GetInfo());

    bool isSupported = false;
    FORWARD_LAYER_SUPPORT_FUNC(__func__,
                               IsTransposeConvolution2dSupported,
                               data.m_Backends,
                               isSupported,
                               inputInfo,
                               outputInfo,
                               desc,
                               weights.GetInfo(),
                               biases);
    if (!isSupported)
    {
        return false;
    }

    armnn::IConnectableLayer* startLayer =
        data.m_Network->AddTransposeConvolution2dLayer(desc, weights, armnn::Optional<armnn::ConstTensor>(bias));
    if (!startLayer)
    {
        return Fail("%s: AddTransposeConvolution2dLayer failed", __func__);
    }

    armnn::IConnectableLayer* endLayer = ProcessActivation(outputInfo, activation, startLayer, data);
    if (!endLayer)
    {
        return Fail("%s: ProcessActivation failed", __func__);
    }

    input.Connect(startLayer->GetInputSlot(0));

    return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *endLayer, model, data);
}

} // namespace hal_1_2
} // namespace armnn_driver