Blame - 1.2/HalPolicy.cpp - ml/android-nn-driver

2019-06-11 16:35:25 +0100

[diff] [blame]

1

//

2

3

// SPDX-License-Identifier: MIT

4

//

5

6

#include "HalPolicy.hpp"

7

Aron Virginas-Tar

2019-07-23 14:01:37 +0100

[diff] [blame]

8

#include "Utils.hpp"

Aron Virginas-Tar

2019-07-09 17:44:24 +0100

[diff] [blame]

9

Aron Virginas-Tar

2019-07-03 15:27:08 +0100

[diff] [blame]

10

#include <DataLayoutIndexed.hpp>

Aron Virginas-Tar

2019-07-05 15:47:07 +0100

[diff] [blame]

11

#include <Half.hpp>

Aron Virginas-Tar

2019-07-03 15:27:08 +0100

[diff] [blame]

#include <cmath>

Mike Kelly

2019-06-11 16:35:25 +0100

[diff] [blame]

15

namespace armnn_driver

{

namespace hal_1_2

{

Mike Kelly

2019-06-11 16:35:25 +0100

[diff] [blame]

20

bool HalPolicy::ConvertOperation(const Operation& operation, const Model& model, ConversionData& data)

21

{

Mike Kelly

2019-06-11 16:35:25 +0100

[diff] [blame]

22

switch (operation.type)

23

{

Kevin May

407718f

2019-09-09 14:46:41 +0100

[diff] [blame^]

24

case V1_2::OperationType::ABS:

25

return ConvertAbs(operation, model, data);

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

26

case V1_2::OperationType::ADD:

27

return ConvertAdd(operation, model, data);

Sadik Armagan

2019-07-26 16:59:35 +0100

[diff] [blame]

28

case V1_2::OperationType::AVERAGE_POOL_2D:

29

return ConvertAveragePool2d(operation, model, data);

Finn Williams

23b87b3

2019-07-30 11:44:05 +0100

[diff] [blame]

30

case V1_2::OperationType::BATCH_TO_SPACE_ND:

31

return ConvertBatchToSpaceNd(operation, model, data);

Mike Kelly

b880520

2019-07-31 17:25:43 +0100

[diff] [blame]

32

case V1_2::OperationType::CONCATENATION:

33

return ConvertConcatenation(operation, model, data);

Mike Kelly

2019-06-11 16:35:25 +0100

[diff] [blame]

34

case V1_2::OperationType::CONV_2D:

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

35

return ConvertConv2d(operation, model, data);

Mike Kelly

2019-06-11 16:35:25 +0100

[diff] [blame]

36

case V1_2::OperationType::DEPTHWISE_CONV_2D:

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

37

return ConvertDepthwiseConv2d(operation, model, data);

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

38

case V1_2::OperationType::DEQUANTIZE:

39

return ConvertDequantize(operation, model, data);

40

case V1_2::OperationType::DIV:

41

return ConvertDiv(operation, model, data);

42

case V1_2::OperationType::FLOOR:

43

return ConvertFloor(operation, model, data);

44

case V1_2::OperationType::FULLY_CONNECTED:

45

return ConvertFullyConnected(operation, model, data);

46

case V1_2::OperationType::L2_NORMALIZATION:

47

return ConvertL2Normalization(operation, model, data);

Sadik Armagan

2019-07-26 16:59:35 +0100

[diff] [blame]

48

case V1_2::OperationType::L2_POOL_2D:

49

return ConvertL2Pool2d(operation, model, data);

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

50

case V1_2::OperationType::LOCAL_RESPONSE_NORMALIZATION:

51

return ConvertLocalResponseNormalization(operation, model, data);

52

case V1_2::OperationType::LOGISTIC:

53

return ConvertLogistic(operation, model, data);

54

case V1_2::OperationType::LSTM:

55

return ConvertLstm(operation, model, data);

Sadik Armagan

2019-07-26 16:59:35 +0100

[diff] [blame]

56

case V1_2::OperationType::MAX_POOL_2D:

57

return ConvertMaxPool2d(operation, model, data);

Narumol Prangnawarat

2019-07-15 12:02:20 +0100

[diff] [blame]

58

case V1_2::OperationType::MAXIMUM:

59

return ConvertMaximum(operation, model, data);

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

60

case V1_2::OperationType::MEAN:

61

return ConvertMean(operation, model, data);

Ellen Norris-Thompson

2019-07-11 17:27:37 +0100

[diff] [blame]

62

case V1_2::OperationType::MINIMUM:

63

return ConvertMinimum(operation, model, data);

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

64

case V1_2::OperationType::MUL:

65

return ConvertMul(operation, model, data);

Mike Kelly

3c67394

2019-07-25 09:26:06 +0100

[diff] [blame]

66

case V1_2::OperationType::PAD:

Aron Virginas-Tar

c921f6b

2019-07-25 10:14:33 +0100

[diff] [blame]

67

return ConvertPad(operation, model, data);

Aron Virginas-Tar

2019-07-05 15:47:07 +0100

[diff] [blame]

68

case V1_2::OperationType::PAD_V2:

69

return ConvertPadV2(operation, model, data);

Matteo Martincigh

2019-06-27 14:12:55 +0100

[diff] [blame]

70

case V1_2::OperationType::PRELU:

71

return ConvertPrelu(operation, model, data);

Sadik Armagan

5a476a8

2019-07-30 09:43:18 +0100

[diff] [blame]

72

case V1_2::OperationType::QUANTIZE:

73

return ConvertQuantize(operation, model, data);

Ellen Norris-Thompson

2019-07-24 17:39:19 +0100

[diff] [blame]

74

case V1_2::OperationType::QUANTIZED_16BIT_LSTM:

75

return ConvertQuantizedLstm(operation, model, data);

Sadik Armagan

2019-07-25 09:09:40 +0100

[diff] [blame]

76

case V1_2::OperationType::RELU:

77

return ConvertReLu(operation, model, data);

78

case V1_2::OperationType::RELU1:

79

return ConvertReLu1(operation, model, data);

80

case V1_2::OperationType::RELU6:

81

return ConvertReLu6(operation, model, data);

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

82

case V1_2::OperationType::RESHAPE:

83

return ConvertReshape(operation, model, data);

Aron Virginas-Tar

2019-07-04 11:59:48 +0100

[diff] [blame]

84

case V1_2::OperationType::RESIZE_BILINEAR:

85

return ConvertResize(operation, model, data, armnn::ResizeMethod::Bilinear);

Aron Virginas-Tar

2019-07-03 15:27:08 +0100

[diff] [blame]

86

case V1_2::OperationType::RESIZE_NEAREST_NEIGHBOR:

Aron Virginas-Tar

2019-07-04 11:59:48 +0100

[diff] [blame]

87

return ConvertResize(operation, model, data, armnn::ResizeMethod::NearestNeighbor);

Sadik Armagan

2019-09-04 15:16:18 +0100

[diff] [blame]

88

case V1_2::OperationType::SQRT:

89

return ConvertSqrt(operation, model, data);

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

90

case V1_2::OperationType::SQUEEZE:

91

return ConvertSqueeze(operation, model, data);

92

case V1_2::OperationType::STRIDED_SLICE:

93

return ConvertStridedSlice(operation, model, data);

94

case V1_2::OperationType::TRANSPOSE:

95

return ConvertTranspose(operation, model, data);

David Monahan

2019-06-27 11:37:47 +0100

[diff] [blame]

96

case V1_2::OperationType::TRANSPOSE_CONV_2D:

Aron Virginas-Tar

8b99168

2019-07-31 12:54:59 +0100

[diff] [blame]

97

return ConvertTransposeConv2d(operation, model, data);

Francis Murtagh

2019-07-22 16:40:57 +0100

[diff] [blame]

98

case V1_2::OperationType::SOFTMAX:

99

return ConvertSoftmax(operation, model, data);

Finn Williams

d74c505

2019-07-30 17:06:00 +0100

[diff] [blame]

100

case V1_2::OperationType::SPACE_TO_BATCH_ND :

101

return ConvertSpaceToBatchNd(operation, model, data);

Aron Virginas-Tar

ad1ab53

2019-07-25 11:24:42 +0100

[diff] [blame]

102

case V1_2::OperationType::SPACE_TO_DEPTH:

103

return ConvertSpaceToDepth(operation, model, data);

Mike Kelly

0a87936

2019-07-29 16:56:31 +0100

[diff] [blame]

104

case V1_2::OperationType::SUB:

105

return ConvertSub(operation, model, data);

Sadik Armagan

2019-07-25 09:09:40 +0100

[diff] [blame]

106

case V1_2::OperationType::TANH:

107

return ConvertTanH(operation, model, data);

Mike Kelly

2019-06-11 16:35:25 +0100

[diff] [blame]

108

default:

109

return Fail("%s: Operation type %s not supported in ArmnnDriver",

110

__func__, toString(operation.type).c_str());

}

}

Kevin May

2019-09-09 14:46:41 +0100

[diff] [blame^]

114

bool HalPolicy::ConvertAbs(const Operation& operation, const Model& model, ConversionData& data)

115

{

116

ALOGV("hal_1_2::HalPolicy::ConvertAbs()");

117

return ::ConvertAbs<hal_1_2::HalPolicy>(operation, model, data);

118

}

119

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

120

bool HalPolicy::ConvertAdd(const Operation& operation, const Model& model, ConversionData& data)

121

{

122

ALOGV("hal_1_2::HalPolicy::ConvertAdd()");

123

return ::ConvertAdd<hal_1_2::HalPolicy>(operation, model, data);

124

}

125

Sadik Armagan

2019-07-26 16:59:35 +0100

[diff] [blame]

126

bool HalPolicy::ConvertAveragePool2d(const Operation& operation, const Model& model, ConversionData& data)

127

{

128

ALOGV("hal_1_2::HalPolicy::ConvertAveragePool2d()");

129

return ConvertPooling2d<hal_1_2::HalPolicy>(operation, __func__, armnn::PoolingAlgorithm::Average, model, data);

130

}

131

Finn Williams

23b87b3

2019-07-30 11:44:05 +0100

[diff] [blame]

132

bool HalPolicy::ConvertBatchToSpaceNd(const Operation& operation, const Model& model, ConversionData& data)

133

{

134

ALOGV("hal_1_2::HalPolicy::ConvertBatchToSpaceNd()");

135

return ::ConvertBatchToSpaceNd<hal_1_2::HalPolicy>(operation, model, data);

136

}

137

Mike Kelly

b880520

2019-07-31 17:25:43 +0100

[diff] [blame]

138

bool HalPolicy::ConvertConcatenation(const Operation& operation, const Model& model, ConversionData& data)

139

{

140

ALOGV("hal_1_2::HalPolicy::ConvertConcatenation()");

141

return ::ConvertConcatenation<hal_1_2::HalPolicy>(operation, model, data);

142

}

143

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

144

bool HalPolicy::ConvertConv2d(const Operation& operation, const Model& model, ConversionData& data)

145

{

Aron Virginas-Tar

2019-07-24 13:55:31 +0100

[diff] [blame]

146

ALOGV("hal_1_2::HalPolicy::ConvertConv2d()");

147

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

148

LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);

149

if (!input.IsValid())

150

{

151

return Fail("%s: Operation has invalid inputs", __func__);

152

}

153

154

const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);

155

if (!output)

156

{

157

return Fail("%s: Could not read output 0", __func__);

158

}

159

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

160

const armnn::TensorInfo& inputInfo = input.GetTensorInfo();

161

const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

162

163

if (IsDynamicTensor(outputInfo))

164

{

165

return Fail("%s: Dynamic output tensors are not supported", __func__);

166

}

Aron Virginas-Tar

366e0a6

2019-07-10 13:01:41 +0100

[diff] [blame]

167

Mike Kelly

2019-07-11 11:44:52 +0100

[diff] [blame]

168

armnn::Convolution2dDescriptor desc;

169

desc.m_DataLayout = armnn::DataLayout::NHWC;

170

171

// Determine whether padding is implicit or explicit

172

bool implicitPadding = operation.inputs.size() == 7 ||

173

(operation.inputs.size() >= 8 &&

174

GetInputOperand<hal_1_2::HalPolicy>(operation, 7, model)->type == OperandType::BOOL);

if (implicitPadding)

{

desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 7, model, data);

179

}

180

else if (operation.inputs.size() >= 10)

181

{

182

desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 10, model, data);

183

}

184

185

const armnn::PermutationVector OHWIToOIHW = {0, 2, 3, 1};

186

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

187

// ArmNN does not currently support non-fixed weights or bias

Mike Kelly

2019-07-11 11:44:52 +0100

[diff] [blame]

188

// The NNAPI filter is always OHWI [depth_out, filter_height, filter_width, depth_in] but ArmNN expects the

189

// filter's height and width indices to match the input's height and width indices so we permute it to OIHW if

190

// the DataLayout is NCHW

191

const ConstTensorPin weightsPin = (desc.m_DataLayout == armnn::DataLayout::NCHW) ?

192

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data, OHWIToOIHW) :

193

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data);

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

194

const ConstTensorPin biasPin =

Mike Kelly

2019-07-11 11:44:52 +0100

[diff] [blame]

195

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 2, model, data);

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

196

197

if (!weightsPin.IsValid())

198

{

199

return Fail("%s: Operation has invalid weights", __func__);

200

}

201

202

if (!biasPin.IsValid())

203

{

204

return Fail("%s: Operation has invalid biases", __func__);

205

}

206

207

armnn::ConstTensor weights = weightsPin.GetConstTensor();

208

armnn::ConstTensor bias = biasPin.GetConstTensor();

209

SanitizeBiasQuantizationScale(bias.GetInfo(), weights.GetInfo(), inputInfo);

210

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

211

ActivationFn activation;

212

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

213

if (implicitPadding)

214

{

215

android::nn::PaddingScheme paddingScheme;

216

if (!GetInputPaddingScheme<hal_1_2::HalPolicy>(operation, 3, paddingScheme, model, data) ||

217

!GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_StrideX, model, data) ||

218

!GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_StrideY, model, data) ||

219

!GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 6, activation, model, data) ||

220

!GetOptionalConvolutionDilationParams<hal_1_2::HalPolicy>(operation, 8, desc, model, data))

221

{

222

return Fail("%s: Operation has invalid inputs (implicit padding)", __func__);

223

}

224

Mike Kelly

2019-07-11 11:44:52 +0100

[diff] [blame]

225

armnnUtils::DataLayoutIndexed dataLayoutIndexed(desc.m_DataLayout);

226

unsigned int widthIndex = dataLayoutIndexed.GetWidthIndex();

227

unsigned int heightIndex = dataLayoutIndexed.GetHeightIndex();

228

const uint32_t kernelX = weights.GetShape()[widthIndex];

229

const uint32_t kernelY = weights.GetShape()[heightIndex];

230

const uint32_t inputX = inputInfo.GetShape()[widthIndex];

231

const uint32_t inputY = inputInfo.GetShape()[heightIndex];

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

232

Mike Kelly

86b36d4

2019-07-12 16:39:33 +0100

[diff] [blame]

233

CalcPadding(inputX, kernelX, desc.m_StrideX, desc.m_DilationX, desc.m_PadLeft, desc.m_PadRight, paddingScheme);

234

CalcPadding(inputY, kernelY, desc.m_StrideY, desc.m_DilationY, desc.m_PadTop, desc.m_PadBottom, paddingScheme);

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

235

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

236

}

237

else if (operation.inputs.size() >= 10)

238

{

239

// explicit padding

240

if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 3, OperandType::INT32, desc.m_PadLeft, model, data) ||

241

!GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_PadRight, model, data) ||

242

!GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_PadTop, model, data) ||

243

!GetInputScalar<hal_1_2::HalPolicy>(operation, 6, OperandType::INT32, desc.m_PadBottom, model, data) ||

244

!GetInputScalar<hal_1_2::HalPolicy>(operation, 7, OperandType::INT32, desc.m_StrideX, model, data) ||

245

!GetInputScalar<hal_1_2::HalPolicy>(operation, 8, OperandType::INT32, desc.m_StrideY, model, data) ||

246

!GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 9, activation, model, data) ||

247

!GetOptionalConvolutionDilationParams<hal_1_2::HalPolicy>(operation, 11, desc, model, data))

248

{

249

return Fail("%s: Operation has invalid inputs (explicit padding)", __func__);

250

}

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

}

else

{

return Fail("%s: Unsupported number of operation inputs", __func__);

255

}

256

257

desc.m_BiasEnabled = true;

258

armnn::Optional<armnn::TensorInfo> biases(bias.GetInfo());

259

Ferran Balaguer

2019-07-09 17:04:47 +0100

[diff] [blame]

260

bool isSupported = false;

261

FORWARD_LAYER_SUPPORT_FUNC(__func__,

262

IsConvolution2dSupported,

data.m_Backends,

isSupported,

inputInfo,

outputInfo,

desc,

weights.GetInfo(),

biases);

Aron Virginas-Tar

2b17312

2019-07-15 14:29:09 +0100

[diff] [blame]

270

Ferran Balaguer

2019-07-09 17:04:47 +0100

[diff] [blame]

271

if (!isSupported)

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

{

return false;

}

armnn::IConnectableLayer* startLayer =

277

data.m_Network->AddConvolution2dLayer(desc, weights, armnn::Optional<armnn::ConstTensor>(bias));

if (!startLayer)

{

return Fail("%s: AddConvolution2dLayer failed", __func__);

282

}

283

284

armnn::IConnectableLayer* endLayer = ProcessActivation(outputInfo, activation, startLayer, data);

if (!endLayer)

{

return Fail("%s: ProcessActivation failed", __func__);

289

}

290

291

input.Connect(startLayer->GetInputSlot(0));

292

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

293

return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *endLayer, model, data);

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

294

}

295

296

bool HalPolicy::ConvertDepthwiseConv2d(const Operation& operation, const Model& model, ConversionData& data)

297

{

Aron Virginas-Tar

2019-07-24 13:55:31 +0100

[diff] [blame]

298

ALOGV("hal_1_2::HalPolicy::ConvertDepthwiseConv2d()");

299

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

300

LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);

301

302

if (!input.IsValid())

303

{

304

return Fail("%s: Operation has invalid inputs", __func__);

305

}

306

307

const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);

if (!output)

{

return Fail("%s: Could not read output 0", __func__);

312

}

313

314

const armnn::TensorInfo& inputInfo = input.GetTensorInfo();

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

315

const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

316

317

if (IsDynamicTensor(outputInfo))

318

{

319

return Fail("%s: Dynamic output tensors are not supported", __func__);

320

}

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

321

322

// ArmNN does not currently support non-fixed weights or bias

323

// Find the shape of the weights tensor. In AndroidNN this will be [ 1, H, W, I * M ]

324

const Operand* weightsOperand = GetInputOperand<hal_1_2::HalPolicy>(operation, 1, model);

325

326

if (weightsOperand == nullptr)

327

{

328

return Fail("%s: Operand is invalid", __func__);

329

}

330

armnn::DepthwiseConvolution2dDescriptor desc;

331

desc.m_DataLayout = armnn::DataLayout::NHWC;

332

333

// Determine whether padding is implicit or explicit

334

bool implicitPadding = operation.inputs.size() == 8 ||

335

(operation.inputs.size() >= 9 &&

336

GetInputOperand<hal_1_2::HalPolicy>(operation, 8, model)->type == OperandType::BOOL);

337

338

// Look ahead to find the optional DataLayout, if present

339

const uint32_t dataLayoutFlagIndex = implicitPadding ? 8 : 11;

340

desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, dataLayoutFlagIndex, model, data);

341

342

armnnUtils::DataLayoutIndexed dataLayoutIndexed(desc.m_DataLayout);

343

unsigned int channelsIndex = dataLayoutIndexed.GetChannelsIndex();

344

unsigned int widthIndex = dataLayoutIndexed.GetWidthIndex();

345

unsigned int heightIndex = dataLayoutIndexed.GetHeightIndex();

346

347

// Reinterpret weight data as [ H, W, I, M ]

348

armnn::TensorShape weightsShape({ weightsOperand->dimensions[1],

349

weightsOperand->dimensions[2],

350

inputInfo.GetShape()[channelsIndex],

351

weightsOperand->dimensions[3] / inputInfo.GetShape()[channelsIndex] });

352

353

// Swizzle weight data [ H, W, I, M ] -> [ M, I, H, W ]

354

const armnn::PermutationVector HWIMToMIHW = { 2U, 3U, 1U, 0U };

355

356

const ConstTensorPin weightsPin =

357

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,

1,

model,

data,

HWIMToMIHW,

&weightsShape);

// Bias is a 1D tensor

365

const ConstTensorPin biasPin =

366

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 2, model, data);

367

368

if (!weightsPin.IsValid())

369

{

370

return Fail("%s: Operation has invalid weights", __func__);

371

}

372

373

if (!biasPin.IsValid())

374

{

375

return Fail("%s: Operation has invalid biases", __func__);

376

}

377

378

armnn::ConstTensor weights = weightsPin.GetConstTensor();

379

armnn::ConstTensor bias = biasPin.GetConstTensor();

380

SanitizeBiasQuantizationScale(bias.GetInfo(), weights.GetInfo(), inputInfo);

381

382

ActivationFn activation;

if (implicitPadding)

{

android::nn::PaddingScheme paddingScheme;

387

if (!GetInputPaddingScheme<hal_1_2::HalPolicy>(operation, 3, paddingScheme, model, data) ||

388

!GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_StrideX, model, data) ||

389

!GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_StrideY, model, data) ||

390

!GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 7, activation, model, data) ||

391

!GetOptionalConvolutionDilationParams<hal_1_2::HalPolicy>(operation, 9, desc, model, data))

392

{

393

return Fail("%s: Operation has invalid inputs (implicit padding)", __func__);

394

}

395

396

const uint32_t kernelX = weights.GetShape()[3];

397

const uint32_t kernelY = weights.GetShape()[2];

398

const uint32_t inputX = inputInfo.GetShape()[widthIndex];

399

const uint32_t inputY = inputInfo.GetShape()[heightIndex];

400

Mike Kelly

86b36d4

2019-07-12 16:39:33 +0100

[diff] [blame]

401

CalcPadding(inputX, kernelX, desc.m_StrideX, desc.m_DilationX, desc.m_PadLeft, desc.m_PadRight, paddingScheme);

402

CalcPadding(inputY, kernelY, desc.m_StrideY, desc.m_DilationY, desc.m_PadTop, desc.m_PadBottom, paddingScheme);

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

403

}

404

else if (operation.inputs.size() >= 11)

405

{

406

// explicit padding

407

if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 3, OperandType::INT32, desc.m_PadLeft, model, data) ||

408

!GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_PadRight, model, data) ||

409

!GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_PadTop, model, data) ||

410

!GetInputScalar<hal_1_2::HalPolicy>(operation, 6, OperandType::INT32, desc.m_PadBottom, model, data) ||

411

!GetInputScalar<hal_1_2::HalPolicy>(operation, 7, OperandType::INT32, desc.m_StrideX, model, data) ||

412

!GetInputScalar<hal_1_2::HalPolicy>(operation, 8, OperandType::INT32, desc.m_StrideY, model, data) ||

413

!GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 10, activation, model, data) ||

414

!GetOptionalConvolutionDilationParams<hal_1_2::HalPolicy>(operation, 12, desc, model, data))

415

{

416

return Fail("%s: Operation has invalid inputs (explicit padding)", __func__);

}

}

else

{

return Fail("%s: Unsupported number of operation inputs", __func__);

422

}

423

424

desc.m_BiasEnabled = true;

425

armnn::Optional<armnn::TensorInfo> biases(bias.GetInfo());

426

Ferran Balaguer

2019-07-09 17:04:47 +0100

[diff] [blame]

427

bool isSupported = false;

428

FORWARD_LAYER_SUPPORT_FUNC(__func__,

429

IsDepthwiseConvolutionSupported,

data.m_Backends,

isSupported,

inputInfo,

outputInfo,

desc,

weights.GetInfo(),

biases);

Aron Virginas-Tar

9fd3739

2019-07-15 18:04:32 +0100

[diff] [blame]

437

Ferran Balaguer

2019-07-09 17:04:47 +0100

[diff] [blame]

438

if (!isSupported)

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

{

return false;

}

armnn::IConnectableLayer* startLayer =

444

data.m_Network->AddDepthwiseConvolution2dLayer(desc, weights, armnn::Optional<armnn::ConstTensor>(bias));

Aron Virginas-Tar

9fd3739

2019-07-15 18:04:32 +0100

[diff] [blame]

445

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

446

if (!startLayer)

447

{

448

return Fail("%s: AddDepthwiseConvolution2dLayer failed", __func__);

449

}

450

451

armnn::IConnectableLayer* endLayer = ProcessActivation(outputInfo, activation, startLayer, data);

452

if (!endLayer)

453

{

454

return Fail("%s: ProcessActivation failed", __func__);

455

}

456

457

input.Connect(startLayer->GetInputSlot(0));

458

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

459

return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *endLayer, model, data);

Aron Virginas-Tar

2019-06-17 14:47:46 +0100

[diff] [blame]

460

}

461

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

462

bool HalPolicy::ConvertDequantize(const Operation& operation, const Model& model, ConversionData& data)

463

{

464

ALOGV("hal_1_2::HalPolicy::ConvertDequantize()");

465

return ::ConvertDequantize<hal_1_2::HalPolicy>(operation, model, data);

466

}

467

468

bool HalPolicy::ConvertDiv(const Operation& operation, const Model& model, ConversionData& data)

469

{

470

ALOGV("hal_1_2::HalPolicy::ConvertDiv()");

471

return ::ConvertDiv<hal_1_2::HalPolicy>(operation, model, data);

472

}

473

474

bool HalPolicy::ConvertFloor(const Operation& operation, const Model& model, ConversionData& data)

475

{

476

ALOGV("hal_1_2::HalPolicy::ConvertFloor()");

477

return ::ConvertFloor<hal_1_2::HalPolicy>(operation, model, data);

478

}

479

480

bool HalPolicy::ConvertFullyConnected(const Operation& operation, const Model& model, ConversionData& data)

481

{

482

ALOGV("hal_1_2::HalPolicy::ConvertFullyConnected()");

483

return ::ConvertFullyConnected<hal_1_2::HalPolicy>(operation, model, data);

484

}

485

486

bool HalPolicy::ConvertL2Normalization(const Operation& operation, const Model& model, ConversionData& data)

487

{

488

ALOGV("hal_1_2::HalPolicy::ConvertL2Normalization()");

489

return ::ConvertL2Normalization<hal_1_2::HalPolicy>(operation, model, data);

490

}

491

Sadik Armagan

2019-07-26 16:59:35 +0100

[diff] [blame]

492

bool HalPolicy::ConvertL2Pool2d(const Operation& operation, const Model& model, ConversionData& data)

493

{

494

ALOGV("hal_1_2::HalPolicy::ConvertL2Pool2d()");

495

return ConvertPooling2d<hal_1_2::HalPolicy>(operation, __func__, armnn::PoolingAlgorithm::L2, model, data);

496

}

497

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

498

bool HalPolicy::ConvertLocalResponseNormalization(const Operation& operation,

499

const Model& model,

500

ConversionData& data)

501

{

502

ALOGV("hal_1_2::HalPolicy::ConvertLocalResponseNormalization()");

503

return ::ConvertLocalResponseNormalization<hal_1_2::HalPolicy>(operation, model, data);

504

}

505

506

bool HalPolicy::ConvertLogistic(const Operation& operation, const Model& model, ConversionData& data)

507

{

508

ALOGV("hal_1_2::HalPolicy::ConvertLogistic()");

509

return ::ConvertLogistic<hal_1_2::HalPolicy>(operation, model, data);

510

}

511

Sadik Armagan

2019-07-26 16:59:35 +0100

[diff] [blame]

512

bool HalPolicy::ConvertMaxPool2d(const Operation& operation, const Model& model, ConversionData& data)

513

{

514

ALOGV("hal_1_2::HalPolicy::ConvertMaxPool2d()");

515

return ConvertPooling2d<hal_1_2::HalPolicy>(operation, __func__, armnn::PoolingAlgorithm::Max, model, data);

516

}

517

Narumol Prangnawarat

2019-07-15 12:02:20 +0100

[diff] [blame]

518

bool HalPolicy::ConvertMaximum(const Operation& operation, const Model& model, ConversionData& data)

519

{

Aron Virginas-Tar

2019-07-24 13:55:31 +0100

[diff] [blame]

520

ALOGV("hal_1_2::HalPolicy::ConvertMaximum()");

521

Narumol Prangnawarat

2019-07-15 12:02:20 +0100

[diff] [blame]

522

LayerInputHandle input0 = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);

523

LayerInputHandle input1 = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 1, model, data);

524

525

if (!input0.IsValid() || !input1.IsValid())

526

{

527

return Fail("%s: Operation has invalid inputs", __func__);

528

}

529

530

const Operand* outputOperand = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);

531

if (!outputOperand)

532

{

533

return Fail("%s: Could not read output", __func__);

534

}

535

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

536

const armnn::TensorInfo& outInfo = GetTensorInfoForOperand(*outputOperand);

Aron Virginas-Tar

2019-07-23 14:01:37 +0100

[diff] [blame]

537

if (IsDynamicTensor(outInfo))

Narumol Prangnawarat

2019-07-15 12:02:20 +0100

[diff] [blame]

538

{

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

539

return Fail("%s: Dynamic output tensors are not supported", __func__);

Narumol Prangnawarat

2019-07-15 12:02:20 +0100

[diff] [blame]

540

}

541

Aron Virginas-Tar

d759323

2019-07-16 13:17:06 +0100

[diff] [blame]

542

bool isSupported = false;

543

FORWARD_LAYER_SUPPORT_FUNC(__func__,

IsMaximumSupported,

data.m_Backends,

isSupported,

input0.GetTensorInfo(),

548

input1.GetTensorInfo(),

549

outInfo);

550

551

if (!isSupported)

Narumol Prangnawarat

2019-07-15 12:02:20 +0100

[diff] [blame]

{

return false;

}

armnn::IConnectableLayer* layer = data.m_Network->AddMaximumLayer();

557

assert(layer != nullptr);

Sadik Armagan

64b19b5

2019-08-19 09:49:58 +0100

[diff] [blame]

558

bool isReshapeSupported = BroadcastTensor(input0, input1, layer, data);

559

if (!isReshapeSupported)

560

{

561

return false;

562

}

Narumol Prangnawarat

2019-07-15 12:02:20 +0100

[diff] [blame]

563

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

564

return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);

Narumol Prangnawarat

2019-07-15 12:02:20 +0100

[diff] [blame]

565

}

566

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

567

bool HalPolicy::ConvertMean(const Operation& operation, const Model& model, ConversionData& data)

568

{

569

ALOGV("hal_1_2::HalPolicy::ConvertMean()");

570

return ::ConvertMean<hal_1_2::HalPolicy>(operation, model, data);

571

}

572

Ellen Norris-Thompson

2019-07-11 17:27:37 +0100

[diff] [blame]

573

bool HalPolicy::ConvertMinimum(const Operation& operation, const Model& model, ConversionData& data)

574

{

Aron Virginas-Tar

2019-07-24 13:55:31 +0100

[diff] [blame]

575

ALOGV("hal_1_2::HalPolicy::ConvertMinimum()");

576

Ellen Norris-Thompson

2019-07-11 17:27:37 +0100

[diff] [blame]

577

LayerInputHandle input0 = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);

578

LayerInputHandle input1 = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 1, model, data);

579

580

if (!input0.IsValid() || !input1.IsValid())

581

{

582

return Fail("%s: Operation has invalid inputs", __func__);

583

}

584

585

const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);

586

if (!output)

587

{

588

return Fail("%s: Could not read output 0", __func__);

589

}

590

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

591

const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

Aron Virginas-Tar

2019-07-23 14:01:37 +0100

[diff] [blame]

592

if (IsDynamicTensor(outputInfo))

Ellen Norris-Thompson

2019-07-11 17:27:37 +0100

[diff] [blame]

593

{

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

594

return Fail("%s: Dynamic output tensors are not supported", __func__);

Ellen Norris-Thompson

2019-07-11 17:27:37 +0100

[diff] [blame]

595

}

596

597

bool isSupported = false;

598

FORWARD_LAYER_SUPPORT_FUNC(__func__,

IsMinimumSupported,

data.m_Backends,

isSupported,

input0.GetTensorInfo(),

603

input1.GetTensorInfo(),

outputInfo);

if (!isSupported)

{

return false;

}

armnn::IConnectableLayer* const layer = data.m_Network->AddMinimumLayer();

612

assert(layer != nullptr);

Sadik Armagan

64b19b5

2019-08-19 09:49:58 +0100

[diff] [blame]

613

bool isReshapeSupported = BroadcastTensor(input0, input1, layer, data);

614

if (!isReshapeSupported)

615

{

616

return false;

617

}

Ellen Norris-Thompson

2019-07-11 17:27:37 +0100

[diff] [blame]

618

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

619

return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);

Ellen Norris-Thompson

2019-07-11 17:27:37 +0100

[diff] [blame]

620

}

621

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

622

bool HalPolicy::ConvertMul(const Operation& operation, const Model& model, ConversionData& data)

623

{

624

ALOGV("hal_1_2::HalPolicy::ConvertMul()");

625

return ::ConvertMul<hal_1_2::HalPolicy>(operation, model, data);

626

}

627

Aron Virginas-Tar

c921f6b

2019-07-25 10:14:33 +0100

[diff] [blame]

628

bool HalPolicy::ConvertPad(const Operation& operation, const Model& model, ConversionData& data)

629

{

630

ALOGV("hal_1_2::HalPolicy::ConvertPad()");

631

return ::ConvertPad<hal_1_2::HalPolicy>(operation, model, data);

632

}

633

Aron Virginas-Tar

2019-07-05 15:47:07 +0100

[diff] [blame]

634

bool HalPolicy::ConvertPadV2(const Operation& operation, const Model& model, ConversionData& data)

635

{

Aron Virginas-Tar

2019-07-24 13:55:31 +0100

[diff] [blame]

636

ALOGV("hal_1_2::HalPolicy::ConvertPadV2()");

637

Aron Virginas-Tar

2019-07-05 15:47:07 +0100

[diff] [blame]

638

LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);

639

if (!input.IsValid())

640

{

641

return Fail("%s: Could not read input 0", __func__);

642

}

643

Aron Virginas-Tar

366e0a6

2019-07-10 13:01:41 +0100

[diff] [blame]

644

const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);

645

if (!output)

646

{

647

return Fail("%s: Could not read output", __func__);

648

}

649

Aron Virginas-Tar

2019-07-05 15:47:07 +0100

[diff] [blame]

650

const armnn::TensorInfo& inputInfo = input.GetTensorInfo();

651

unsigned int rank = inputInfo.GetNumDimensions();

652

653

armnn::PadDescriptor descriptor;

654

if (!ConvertPaddings<hal_1_2::HalPolicy>(operation, model, data, rank, descriptor))

655

{

656

return Fail("%s: Could not convert paddings", __func__);

657

}

658

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

659

const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

Aron Virginas-Tar

2019-07-23 14:01:37 +0100

[diff] [blame]

660

if (IsDynamicTensor(outputInfo))

Sadik Armagan

310d8ff

2019-07-11 10:53:38 +0100

[diff] [blame]

661

{

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

662

return Fail("%s: Dynamic output tensors are not supported", __func__);

Sadik Armagan

310d8ff

2019-07-11 10:53:38 +0100

[diff] [blame]

663

}

664

Aron Virginas-Tar

2019-07-05 15:47:07 +0100

[diff] [blame]

665

// Determine type of padding value

666

OperandType operandType0;

667

OperandType operandType2;

668

669

if (!GetOperandType<hal_1_2::HalPolicy>(operation, 0, model, operandType0) ||

670

!GetOperandType<hal_1_2::HalPolicy>(operation, 2, model, operandType2))

671

{

672

return Fail("%s: Operation has invalid inputs", __func__);

673

}

674

675

// Read value to use for padding

676

if (operandType0 == OperandType::TENSOR_FLOAT16 && operandType2 == OperandType::FLOAT16)

677

{

678

armnn::Half f16PadValue;

679

if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 2, operandType2, f16PadValue, model, data))

680

{

681

return Fail("%s: Could not read input 2 (FLOAT16)", __func__);

682

}

683

684

descriptor.m_PadValue = f16PadValue;

685

}

686

else if (operandType0 == OperandType::TENSOR_FLOAT32 && operandType2 == OperandType::FLOAT32)

687

{

688

if (!GetInputFloat32<hal_1_2::HalPolicy>(operation, 2, descriptor.m_PadValue, model, data))

689

{

690

return Fail("%s: Could not read input 2 (FLOAT32)", __func__);

691

}

692

}

693

else if (operandType0 == OperandType::TENSOR_QUANT8_ASYMM && operandType2 == OperandType::INT32)

694

{

Mike Kelly

3c67394

2019-07-25 09:26:06 +0100

[diff] [blame]

695

int32_t intPadValue = 0;

696

if (!GetInputInt32<hal_1_2::HalPolicy>(operation, 2, intPadValue, model, data))

Aron Virginas-Tar

2019-07-05 15:47:07 +0100

[diff] [blame]

697

{

698

return Fail("%s: Could not read input 2 (INT32)", __func__);

699

}

Mike Kelly

3c67394

2019-07-25 09:26:06 +0100

[diff] [blame]

700

descriptor.m_PadValue = intPadValue;

Aron Virginas-Tar

2019-07-05 15:47:07 +0100

[diff] [blame]

}

else

{

return Fail("%s: Operation has invalid inputs: type mismatch", __func__);

705

}

706

Ferran Balaguer

2019-07-09 17:04:47 +0100

[diff] [blame]

707

bool isSupported = false;

708

FORWARD_LAYER_SUPPORT_FUNC(__func__,

IsPadSupported,

data.m_Backends,

isSupported,

inputInfo,

outputInfo,

descriptor);

if (!isSupported)

Aron Virginas-Tar

2019-07-05 15:47:07 +0100

[diff] [blame]

{

return false;

}

armnn::IConnectableLayer* const layer = data.m_Network->AddPadLayer(descriptor);

721

assert(layer != nullptr);

722

input.Connect(layer->GetInputSlot(0));

723

layer->GetOutputSlot(0).SetTensorInfo(outputInfo);

724

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

725

return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);

Aron Virginas-Tar

2019-07-05 15:47:07 +0100

[diff] [blame]

726

}

727

Matteo Martincigh

2019-06-27 14:12:55 +0100

[diff] [blame]

728

bool HalPolicy::ConvertPrelu(const Operation& operation, const Model& model, ConversionData& data)

729

{

Aron Virginas-Tar

2019-07-24 13:55:31 +0100

[diff] [blame]

730

ALOGV("hal_1_2::HalPolicy::ConvertPrelu()");

731

Matteo Martincigh

2019-06-27 14:12:55 +0100

[diff] [blame]

732

LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);

733

LayerInputHandle alpha = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 1, model, data);

734

735

if (!input.IsValid() || !alpha.IsValid())

736

{

737

return Fail("%s: Operation has invalid inputs", __func__);

738

}

739

740

const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);

741

742

if (!output)

743

{

Matteo Martincigh

0bd89a8

2019-07-02 16:53:10 +0100

[diff] [blame]

744

return Fail("%s: Could not read output", __func__);

Matteo Martincigh

2019-06-27 14:12:55 +0100

[diff] [blame]

745

}

746

747

const armnn::TensorInfo& inputInfo = input.GetTensorInfo();

748

const armnn::TensorInfo& alphaInfo = alpha.GetTensorInfo();

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

749

const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

Aron Virginas-Tar

2019-07-09 17:44:24 +0100

[diff] [blame]

750

Aron Virginas-Tar

2019-07-23 14:01:37 +0100

[diff] [blame]

751

if (IsDynamicTensor(outputInfo))

Aron Virginas-Tar

2019-07-09 17:44:24 +0100

[diff] [blame]

752

{

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

753

return Fail("%s: Dynamic output tensors are not supported", __func__);

Aron Virginas-Tar

2019-07-09 17:44:24 +0100

[diff] [blame]

754

}

Matteo Martincigh

2019-06-27 14:12:55 +0100

[diff] [blame]

755

Ferran Balaguer

2019-07-09 17:04:47 +0100

[diff] [blame]

756

bool isSupported = false;

757

FORWARD_LAYER_SUPPORT_FUNC(__func__,

IsPreluSupported,

data.m_Backends,

isSupported,

inputInfo,

alphaInfo,

outputInfo);

if (!isSupported)

Matteo Martincigh

2019-06-27 14:12:55 +0100

[diff] [blame]

{

return false;

}

armnn::IConnectableLayer* const layer = data.m_Network->AddPreluLayer();

if (!layer)

{

return Fail("%s: AddPreluLayer failed", __func__);

774

}

775

Sadik Armagan

64b19b5

2019-08-19 09:49:58 +0100

[diff] [blame]

776

bool isReshapeSupported = BroadcastTensor(input, alpha, layer, data);

777

if (!isReshapeSupported)

778

{

779

return false;

780

}

Matteo Martincigh

2019-06-27 14:12:55 +0100

[diff] [blame]

781

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

782

return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);

Matteo Martincigh

2019-06-27 14:12:55 +0100

[diff] [blame]

783

}

784

Sadik Armagan

5a476a8

2019-07-30 09:43:18 +0100

[diff] [blame]

785

bool HalPolicy::ConvertQuantize(const Operation& operation, const Model& model, ConversionData& data)

786

{

787

ALOGV("hal_1_2::HalPolicy::ConvertQuantize()");

788

789

LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);

790

if (!input.IsValid())

791

{

792

return Fail("%s: Operation has invalid input", __func__);

793

}

794

795

const Operand* const outputOperand = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);

796

if (!outputOperand)

797

{

798

return Fail("%s: Operation has invalid outputs", __func__);

799

}

800

801

const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*outputOperand);

802

if (IsDynamicTensor(outputInfo))

803

{

804

return Fail("%s: Dynamic output tensors are not supported", __func__);

805

}

806

807

bool isSupported = false;

808

FORWARD_LAYER_SUPPORT_FUNC(__func__,

IsQuantizeSupported,

data.m_Backends,

isSupported,

input.GetTensorInfo(),

outputInfo);

if (!isSupported)

{

return false;

}

armnn::IConnectableLayer* const layer = data.m_Network->AddQuantizeLayer();

820

assert(layer != nullptr);

821

input.Connect(layer->GetInputSlot(0));

822

823

return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);

824

}

825

Ellen Norris-Thompson

2019-07-24 17:39:19 +0100

[diff] [blame]

826

bool HalPolicy::ConvertQuantizedLstm(const Operation& operation, const Model& model, ConversionData& data)

827

{

828

ALOGV("hal_1_2::HalPolicy::ConvertQuantizedLstm()");

829

830

//Inputs:

831

// 0: The input: A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape [numBatches, inputSize]

832

// specifying the input to the LSTM cell. Tensor is quantized with a fixed quantization range of -1, 127/128.

833

LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);

834

if (!input.IsValid())

835

{

836

return Fail("%s: Could not read input 0: input", __func__);

837

}

838

839

//13: The previous cell state: A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT16_SYMM and shape

840

// [numBatches, outputSize] specifying the cell state from the previous time step of the LSTM cell.

841

// It is quantized using a quantization range of -2^4, 2^4 * 32767/32768.

842

LayerInputHandle previousCellStateIn = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 13, model, data);

843

if (!previousCellStateIn.IsValid())

844

{

845

return Fail("%s: Could not read input 13: previousCellStateIn", __func__);

846

}

847

848

// 14: The previous output state: A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape

849

// [numBathes, outputSize] specifying the output of the LSTM cell from previous time-step. Tensor

850

// is quantized with a fixed quantization range of -1, 127/128.

851

LayerInputHandle previousOutputIn = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 14, model, data);

852

if (!previousOutputIn.IsValid())

853

{

854

return Fail("%s: Could not read input 14: previousOutputIn", __func__);

855

}

856

857

// Get the input tensors:

858

// 1: The input-to-input weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape

859

// [outputSize, inputSize] specifying input-to-input part of weights for fully-connected layer inside the

860

// LSTM cell. Quantization zero point and scale must be the same across all the weights.

861

const ConstTensorPin inputToInputWeightsPin =

Ellen Norris-Thompson

2019-08-05 14:20:32 +0100

[diff] [blame]

862

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data);

Ellen Norris-Thompson

2019-07-24 17:39:19 +0100

[diff] [blame]

863

864

// 2: The input-to-forget weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape

865

// [outputSize, inputSize] specifying input-to-forget part of weights for fully-connected layer inside the

866

// LSTM cell. Quantization zero point and scale must be the same across all the weights.

867

const ConstTensorPin inputToForgetWeightsPin =

Ellen Norris-Thompson

2019-08-05 14:20:32 +0100

[diff] [blame]

868

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 2, model, data);

Ellen Norris-Thompson

2019-07-24 17:39:19 +0100

[diff] [blame]

869

870

// 3: The input-to-cell weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape

871

// [outputSize, inputSize] specifying input-to-cell part of weights for fully-connected layer inside the

872

// LSTM cell. Quantization zero point and scale must be the same across all the weights.

873

const ConstTensorPin inputToCellWeightsPin =

Ellen Norris-Thompson

2019-08-05 14:20:32 +0100

[diff] [blame]

874

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 3, model, data);

Ellen Norris-Thompson

2019-07-24 17:39:19 +0100

[diff] [blame]

875

876

// 4: The input-to-output weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape

877

// [outputSize, inputSize] specifying input-to-output part of weights for fully-connected layer inside the

878

// LSTM cell. Quantization zero point and scale must be the same across all the weights.

879

const ConstTensorPin inputToOutputWeightsPin =

Ellen Norris-Thompson

2019-08-05 14:20:32 +0100

[diff] [blame]

880

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 4, model, data);

Ellen Norris-Thompson

2019-07-24 17:39:19 +0100

[diff] [blame]

881

882

// 5: The recurrent-to-input weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape

883

// [outputSize, outputSize] specifying recurrent-to-input part of weights for fully-connected layer inside

884

// the LSTM cell. Quantization zero point and scale must be the same across all the weights.

885

const ConstTensorPin recurrentToInputWeightsPin =

Ellen Norris-Thompson

2019-08-05 14:20:32 +0100

[diff] [blame]

886

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 5, model, data);

Ellen Norris-Thompson

2019-07-24 17:39:19 +0100

[diff] [blame]

887

888

// 6: The recurrent-to-forget weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape

889

// [outputSize, outputSize] specifying recurrent-to-forget part of weights for fully-connected layer inside

890

// the LSTM cell. Quantization zero point and scale must be the same across all the weights.

891

const ConstTensorPin recurrentToForgetWeightsPin =

Ellen Norris-Thompson

2019-08-05 14:20:32 +0100

[diff] [blame]

892

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 6, model, data);

Ellen Norris-Thompson

2019-07-24 17:39:19 +0100

[diff] [blame]

893

894

// 7: The recurrent-to-cell weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape

895

// [outputSize, outputSize] specifying recurrent-to-cell part of weights for fully-connected layer inside

896

// the LSTM cell. Quantization zero point and scale must be the same across all the weights.

897

const ConstTensorPin recurrentToCellWeightsPin =

Ellen Norris-Thompson

2019-08-05 14:20:32 +0100

[diff] [blame]

898

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 7, model, data);

Ellen Norris-Thompson

2019-07-24 17:39:19 +0100

[diff] [blame]

899

900

// 8: The recurrent-to-output weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape

901

// [outputSize, outputSize] specifying recurrent-to-output part of weights for fully-connected layer inside

902

// the LSTM cell. Quantization zero point and scale must be the same across all the weights.

903

const ConstTensorPin recurrentToOutputWeightsPin =

Ellen Norris-Thompson

2019-08-05 14:20:32 +0100

[diff] [blame]

904

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 8, model, data);

Ellen Norris-Thompson

2019-07-24 17:39:19 +0100

[diff] [blame]

905

906

// 9: The input gate bias. A 1-D tensor of type ANEURALNETWORKS_TENSOR_INT32 and shape [outputSize] specifying the

907

// bias for the fully-connected layer inside the LSTM cell. Bias is quantized with scale being a product

908

// of input and weights scales and zeroPoint equal to 0.

909

const ConstTensorPin inputGateBiasPin =

Ellen Norris-Thompson

2019-08-05 14:20:32 +0100

[diff] [blame]

910

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 9, model, data);

Ellen Norris-Thompson

2019-07-24 17:39:19 +0100

[diff] [blame]

911

912

// 10: The forget gate bias. A 1-D tensor of type ANEURALNETWORKS_TENSOR_INT32 and shape [outputSize] specifying

913

// the bias for the fully-connected layer inside the LSTM cell. Bias is quantized with scale being a product

914

// of input and weights scales and zeroPoint equal to 0.

915

const ConstTensorPin forgetGateBiasPin =

Ellen Norris-Thompson

2019-08-05 14:20:32 +0100

[diff] [blame]

916

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 10, model, data);

Ellen Norris-Thompson

2019-07-24 17:39:19 +0100

[diff] [blame]

917

918

// 11:The cell bias. A 1-D tensor of type ANEURALNETWORKS_TENSOR_INT32 and shape [outputSize] specifying the bias

919

// for the fully-connected layer inside the LSTM cell. Bias is quantized with scale being a product of input

920

// and weights scales and zeroPoint equal to 0.

921

const ConstTensorPin cellBiasPin =

Ellen Norris-Thompson

2019-08-05 14:20:32 +0100

[diff] [blame]

922

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 11, model, data);

Ellen Norris-Thompson

2019-07-24 17:39:19 +0100

[diff] [blame]

923

924

// 12:The output gate bias. A 1-D tensor of type ANEURALNETWORKS_TENSOR_INT32 and shape [outputSize] specifying

925

// the bias for the fully-connected layer inside the LSTM cell. Bias is quantized with scale being a product

926

// of input and weights scales and zeroPoint equal to 0.

927

const ConstTensorPin outputGateBiasPin =

Ellen Norris-Thompson

2019-08-05 14:20:32 +0100

[diff] [blame]

928

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 12, model, data);

Ellen Norris-Thompson

2019-07-24 17:39:19 +0100

[diff] [blame]

929

930

if (!inputToInputWeightsPin.IsValid() ||

931

!inputToForgetWeightsPin.IsValid() ||

932

!inputToCellWeightsPin.IsValid() ||

933

!inputToOutputWeightsPin.IsValid() ||

934

!recurrentToInputWeightsPin.IsValid() ||

935

!recurrentToForgetWeightsPin.IsValid() ||

936

!recurrentToCellWeightsPin.IsValid() ||

937

!recurrentToOutputWeightsPin.IsValid() ||

938

!inputGateBiasPin.IsValid() ||

939

!forgetGateBiasPin.IsValid() ||

940

!cellBiasPin.IsValid() ||

941

!outputGateBiasPin.IsValid())

942

{

943

return Fail("%s: Operation has invalid tensor inputs", __func__);

}

// Outputs:

// 0: The cell state: A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT16_SYMM and shape [numBatches, outputSize]

948

// which contains a cell state from the current time step. Tensor is quantized using a quantization range

949

// of -2^4, 2^4 * 32767/32768.

950

const Operand* cellStateOut = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);

951

if (!cellStateOut)

952

{

953

return Fail("%s: Could not read output 0: cellStateOut", __func__);

954

}

955

956

// 1: The output: A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape [numBathes, outputSize] which

957

// contains the output value. Tensor is quantized with a fixed quantization range of -1, 127/128.

958

const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 1, model);

959

if (!output)

960

{

961

return Fail("%s: Could not read output 1: output", __func__);

}

// Inputs

const armnn::TensorInfo& inputInfo = input.GetTensorInfo();

966

const armnn::TensorInfo& previousCellStateInInfo = previousCellStateIn.GetTensorInfo();

967

const armnn::TensorInfo& previousOutputInInfo = previousOutputIn.GetTensorInfo();

968

969

// Outputs

970

const armnn::TensorInfo& cellStateOutInfo = GetTensorInfoForOperand(*cellStateOut);

971

const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

972

973

// Dynamic tensors currently not supported

974

if (IsDynamicTensor(cellStateOutInfo) || IsDynamicTensor(outputInfo))

975

{

976

return Fail("%s: Dynamic output tensors are not supported", __func__);

977

}

978

979

armnn::QuantizedLstmInputParams params;

980

981

params.m_InputToInputWeights = inputToInputWeightsPin.GetConstTensorPtr();

982

params.m_InputToForgetWeights = inputToForgetWeightsPin.GetConstTensorPtr();

983

params.m_InputToCellWeights = inputToCellWeightsPin.GetConstTensorPtr();

984

params.m_InputToOutputWeights = inputToOutputWeightsPin.GetConstTensorPtr();

985

params.m_RecurrentToInputWeights = recurrentToInputWeightsPin.GetConstTensorPtr();

986

params.m_RecurrentToForgetWeights = recurrentToForgetWeightsPin.GetConstTensorPtr();

987

params.m_RecurrentToCellWeights = recurrentToCellWeightsPin.GetConstTensorPtr();

988

params.m_RecurrentToOutputWeights = recurrentToOutputWeightsPin.GetConstTensorPtr();

989

params.m_InputGateBias = inputGateBiasPin.GetConstTensorPtr();

990

params.m_ForgetGateBias = forgetGateBiasPin.GetConstTensorPtr();

991

params.m_CellBias = cellBiasPin.GetConstTensorPtr();

992

params.m_OutputGateBias = outputGateBiasPin.GetConstTensorPtr();

993

994

armnn::QuantizedLstmInputParamsInfo paramsInfo;

995

paramsInfo.m_InputToInputWeights = &(params.m_InputToInputWeights->GetInfo());

996

paramsInfo.m_InputToForgetWeights = &(params.m_InputToForgetWeights->GetInfo());

997

paramsInfo.m_InputToCellWeights = &(params.m_InputToCellWeights->GetInfo());

998

paramsInfo.m_InputToOutputWeights = &(params.m_InputToOutputWeights->GetInfo());

999

paramsInfo.m_RecurrentToInputWeights = &(params.m_RecurrentToInputWeights->GetInfo());

1000

paramsInfo.m_RecurrentToForgetWeights = &(params.m_RecurrentToForgetWeights->GetInfo());

1001

paramsInfo.m_RecurrentToCellWeights = &(params.m_RecurrentToCellWeights->GetInfo());

1002

paramsInfo.m_RecurrentToOutputWeights = &(params.m_RecurrentToOutputWeights->GetInfo());

1003

paramsInfo.m_InputGateBias = &(params.m_InputGateBias->GetInfo());

1004

paramsInfo.m_ForgetGateBias = &(params.m_ForgetGateBias->GetInfo());

1005

paramsInfo.m_CellBias = &(params.m_CellBias->GetInfo());

1006

paramsInfo.m_OutputGateBias = &(params.m_OutputGateBias->GetInfo());

1007

1008

bool isSupported = false;

1009

FORWARD_LAYER_SUPPORT_FUNC(__func__,

1010

IsQuantizedLstmSupported,

data.m_Backends,

isSupported,

inputInfo,

previousCellStateInInfo,

1015

previousOutputInInfo,

cellStateOutInfo,

outputInfo,

paramsInfo);

if (!isSupported)

{

return false;

}

armnn::IConnectableLayer* const layer = data.m_Network->AddQuantizedLstmLayer(params, "QuantizedLstm");

1026

input.Connect(layer->GetInputSlot(0));

Ellen Norris-Thompson

2019-08-05 14:20:32 +0100

[diff] [blame]

1027

previousCellStateIn.Connect(layer->GetInputSlot(1));

1028

previousOutputIn.Connect(layer->GetInputSlot(2));

Ellen Norris-Thompson

2019-07-24 17:39:19 +0100

[diff] [blame]

1029

1030

return (SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, 0, model, data) &&

1031

SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 1, *layer, 1, model, data));

1032

}

1033

Sadik Armagan

2019-07-25 09:09:40 +0100

[diff] [blame]

1034

bool HalPolicy::ConvertReLu(const Operation& operation, const Model& model, ConversionData& data)

1035

{

1036

ALOGV("hal_1_2::HalPolicy::ConvertReLu()");

1037

return ::ConvertReLu<hal_1_2::HalPolicy>(operation, model, data);

1038

}

1039

1040

bool HalPolicy::ConvertReLu1(const Operation& operation, const Model& model, ConversionData& data)

1041

{

1042

ALOGV("hal_1_2::HalPolicy::ConvertReLu1()");

1043

return ::ConvertReLu1<hal_1_2::HalPolicy>(operation, model, data);

1044

}

1045

1046

bool HalPolicy::ConvertReLu6(const Operation& operation, const Model& model, ConversionData& data)

1047

{

1048

ALOGV("hal_1_2::HalPolicy::ConvertReLu6()");

1049

return ::ConvertReLu6<hal_1_2::HalPolicy>(operation, model, data);

1050

}

1051

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

1052

bool HalPolicy::ConvertReshape(const Operation& operation, const Model& model, ConversionData& data)

1053

{

1054

ALOGV("hal_1_2::HalPolicy::ConvertReshape()");

1055

return ::ConvertReshape<hal_1_2::HalPolicy>(operation, model, data);

1056

}

1057

Aron Virginas-Tar

2019-07-04 11:59:48 +0100

[diff] [blame]

1058

bool HalPolicy::ConvertResize(const Operation& operation,

1059

const Model& model,

1060

ConversionData& data,

1061

armnn::ResizeMethod resizeMethod)

Aron Virginas-Tar

2019-07-03 15:27:08 +0100

[diff] [blame]

1062

{

Aron Virginas-Tar

2019-07-24 13:55:31 +0100

[diff] [blame]

1063

ALOGV("hal_1_2::HalPolicy::ConvertResize()");

1064

1065

LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);

Aron Virginas-Tar

2019-07-03 15:27:08 +0100

[diff] [blame]

1066

if (!input.IsValid())

1067

{

1068

return Fail("%s: Could not read input 0", __func__);

1069

}

1070

1071

const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);

1072

if (!output)

1073

{

1074

return Fail("%s: Could not read output 0", __func__);

1075

}

1076

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

1077

const armnn::TensorInfo& inputInfo = input.GetTensorInfo();

1078

const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

1079

1080

if (IsDynamicTensor(outputInfo))

1081

{

1082

return Fail("%s: Dynamic output tensors are not supported", __func__);

1083

}

Aron Virginas-Tar

2019-07-03 15:27:08 +0100

[diff] [blame]

1084

1085

armnn::ResizeDescriptor descriptor;

Aron Virginas-Tar

2019-07-04 11:59:48 +0100

[diff] [blame]

1086

descriptor.m_Method = resizeMethod;

Aron Virginas-Tar

2019-07-03 15:27:08 +0100

[diff] [blame]

1087

descriptor.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 3, model, data);

1088

1089

OperandType operandType1;

1090

OperandType operandType2;

1091

1092

if (!GetOperandType<hal_1_2::HalPolicy>(operation, 1, model, operandType1) ||

1093

!GetOperandType<hal_1_2::HalPolicy>(operation, 2, model, operandType2))

1094

{

1095

return Fail("%s: Operation has invalid inputs", __func__);

1096

}

1097

1098

if (operandType1 != operandType2)

1099

{

1100

return Fail("%s: Operation has invalid inputs. Type of input 1 and 2 should be the same", __func__);

1101

}

1102

1103

if (operandType1 == OperandType::INT32)

1104

{

1105

// Case 1: resizing by shape

1106

int32_t targetWidth = 0;

1107

int32_t targetHeight = 0;

1108

1109

if (!GetInputInt32<hal_1_2::HalPolicy>(operation, 1, targetWidth, model, data) ||

1110

!GetInputInt32<hal_1_2::HalPolicy>(operation, 2, targetHeight, model, data))

1111

{

1112

return Fail("%s: Operation has invalid inputs for resizing by shape", __func__);

1113

}

1114

1115

if (targetWidth < 0 || targetHeight < 0)

1116

{

1117

return Fail("%s: Operation has invalid inputs for resizing by shape. "

1118

"Target width/height cannot be < 0", __func__);

1119

}

1120

1121

descriptor.m_TargetWidth = static_cast<uint32_t>(targetWidth);

Teresa Charlin

9843c01

2019-07-19 12:18:35 +0100

[diff] [blame]

1122

descriptor.m_TargetHeight = static_cast<uint32_t>(targetHeight);

Aron Virginas-Tar

2019-07-03 15:27:08 +0100

[diff] [blame]

1123

}

1124

else if (operandType1 == OperandType::FLOAT32)

1125

{

1126

// Case 2: resizing by scale

1127

float widthScale = 1.0f;

1128

float heightScale = 1.0f;

1129

1130

if (!GetInputFloat32<hal_1_2::HalPolicy>(operation, 1, widthScale, model, data) ||

1131

!GetInputFloat32<hal_1_2::HalPolicy>(operation, 2, heightScale, model, data))

1132

{

1133

return Fail("%s: Operation has invalid inputs for resizing by scale", __func__);

1134

}

1135

1136

const armnn::TensorShape& inputShape = inputInfo.GetShape();

1137

armnnUtils::DataLayoutIndexed dataLayoutIndexed(descriptor.m_DataLayout);

1138

1139

float width = inputShape[dataLayoutIndexed.GetWidthIndex()];

1140

float height = inputShape[dataLayoutIndexed.GetHeightIndex()];

1141

1142

descriptor.m_TargetWidth = std::floor(width * widthScale);

1143

descriptor.m_TargetHeight = std::floor(height * heightScale);

}

else

{

// NOTE: FLOAT16 scales are not supported

return false;

}

Ferran Balaguer

2019-07-09 17:04:47 +0100

[diff] [blame]

1151

bool isSupported = false;

1152

FORWARD_LAYER_SUPPORT_FUNC(__func__,

IsResizeSupported,

data.m_Backends,

isSupported,

inputInfo,

outputInfo,

descriptor);

Aron Virginas-Tar

be5d356

2019-07-16 11:32:29 +0100

[diff] [blame]

1159

Ferran Balaguer

2019-07-09 17:04:47 +0100

[diff] [blame]

1160

if (!isSupported)

Aron Virginas-Tar

2019-07-03 15:27:08 +0100

[diff] [blame]

{

return false;

}

armnn::IConnectableLayer* layer = data.m_Network->AddResizeLayer(descriptor);

1166

1167

assert(layer != nullptr);

1168

1169

layer->GetOutputSlot(0).SetTensorInfo(outputInfo);

1170

input.Connect(layer->GetInputSlot(0));

1171

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

1172

return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);

Aron Virginas-Tar

2019-07-03 15:27:08 +0100

[diff] [blame]

1173

}

1174

Finn Williams

d74c505

2019-07-30 17:06:00 +0100

[diff] [blame]

1175

bool HalPolicy::ConvertSpaceToBatchNd(const Operation& operation, const Model& model, ConversionData& data)

1176

{

1177

ALOGV("hal_1_2::HalPolicy::ConvertSpaceToBatchNd()");

1178

return ::ConvertSpaceToBatchNd<hal_1_2::HalPolicy>(operation, model, data);

1179

}

1180

Keith Davis

2019-06-26 09:39:49 +0100

[diff] [blame]

1181

bool HalPolicy::ConvertSpaceToDepth(const Operation& operation, const Model& model, ConversionData& data)

1182

{

Aron Virginas-Tar

2019-07-24 13:55:31 +0100

[diff] [blame]

1183

ALOGV("hal_1_2::HalPolicy::ConvertSpaceToDepth()");

Keith Davis

2019-06-26 09:39:49 +0100

[diff] [blame]

1184

Aron Virginas-Tar

2019-07-24 13:55:31 +0100

[diff] [blame]

1185

LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);

Keith Davis

2019-06-26 09:39:49 +0100

[diff] [blame]

1186

if (!input.IsValid() )

1187

{

1188

return Fail("%s: Operation has invalid inputs", __func__);

1189

}

1190

1191

const armnn::TensorInfo& inputInfo = input.GetTensorInfo();

1192

unsigned int rank = inputInfo.GetNumDimensions();

Keith Davis

2019-06-26 09:39:49 +0100

[diff] [blame]

1193

if (rank != 4)

1194

{

1195

return Fail("%s: Only inputs with rank 4 are supported", __func__);

1196

}

1197

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

1198

const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);

1199

if (!output)

1200

{

1201

return Fail("%s: Could not read output 0", __func__);

1202

}

1203

1204

const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

1205

if (IsDynamicTensor(outputInfo))

1206

{

1207

return Fail("%s: Dynamic output tensors are not supported", __func__);

1208

}

1209

Keith Davis

2019-06-26 09:39:49 +0100

[diff] [blame]

1210

armnn::SpaceToDepthDescriptor desc;

1211

1212

GetInputScalar<hal_1_2::HalPolicy>(operation, 1, OperandType::INT32, desc.m_BlockSize, model, data);

1213

1214

if (desc.m_BlockSize <= 1)

1215

{

1216

return Fail("%s: Block size must be at least 1 in all dimensions");

1217

}

1218

1219

desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 2, model, data);

1220

Ferran Balaguer

2019-07-09 17:04:47 +0100

[diff] [blame]

1221

bool isSupported = false;

1222

FORWARD_LAYER_SUPPORT_FUNC(__func__,

1223

IsSpaceToDepthSupported,

data.m_Backends,

isSupported,

inputInfo,

outputInfo,

desc);

if (!isSupported)

Keith Davis

2019-06-26 09:39:49 +0100

[diff] [blame]

{

return false;

}

armnn::IConnectableLayer* const layer = data.m_Network->AddSpaceToDepthLayer(desc);

1235

assert(layer != nullptr);

1236

input.Connect(layer->GetInputSlot(0));

1237

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

1238

return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);

Keith Davis

2019-06-26 09:39:49 +0100

[diff] [blame]

1239

}

1240

Francis Murtagh

2019-07-22 16:40:57 +0100

[diff] [blame]

1241

bool HalPolicy::ConvertSoftmax(const Operation& operation, const Model& model, ConversionData& data)

1242

{

Aron Virginas-Tar

2019-07-24 13:55:31 +0100

[diff] [blame]

1243

ALOGV("hal_1_2::HalPolicy::ConvertSoftmax()");

1244

Francis Murtagh

2019-07-22 16:40:57 +0100

[diff] [blame]

1245

LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);

1246

if (!input.IsValid())

1247

{

1248

return Fail("%s: Operation has invalid inputs", __func__);

1249

}

1250

1251

const Operand* outputOperand = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);

1252

if (!outputOperand)

1253

{

1254

return Fail("%s: Operation has no outputs", __func__);

1255

}

1256

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

1257

const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*outputOperand);

Aron Virginas-Tar

2019-07-23 14:01:37 +0100

[diff] [blame]

1258

if (IsDynamicTensor(outputInfo))

Francis Murtagh

2019-07-22 16:40:57 +0100

[diff] [blame]

1259

{

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

1260

return Fail("%s: Dynamic output tensors are not supported", __func__);

Francis Murtagh

2019-07-22 16:40:57 +0100

[diff] [blame]

1261

}

1262

1263

armnn::SoftmaxDescriptor desc;

1264

if (!GetInputFloat32<hal_1_2::HalPolicy>(operation, 1, desc.m_Beta, model, data))

1265

{

1266

return Fail("%s: Operation has invalid inputs", __func__);

1267

}

1268

1269

if (operation.inputs.size() > 2 && !GetInputScalar<hal_1_2::HalPolicy>(operation,

1270

2,

1271

HalPolicy::OperandType::INT32,

desc.m_Axis,

model,

data))

{

return Fail("%s: Operation has invalid inputs", __func__);

1277

}

1278

Narumol Prangnawarat

52dc527

2019-08-06 17:34:26 +0100

[diff] [blame]

1279

if (input.GetTensorInfo().GetNumDimensions() > 2 ||

1280

!(desc.m_Axis == 1 ||

1281

(desc.m_Axis < 0 && static_cast<int>(input.GetTensorInfo().GetNumDimensions()) + desc.m_Axis == 1)))

1282

{

1283

return Fail("%s: Unsupported input greater than 2D or axis != 1", __func__);

1284

}

1285

Francis Murtagh

2019-07-22 16:40:57 +0100

[diff] [blame]

1286

bool isSupported = false;

1287

FORWARD_LAYER_SUPPORT_FUNC(__func__,

IsSoftmaxSupported,

data.m_Backends,

isSupported,

input.GetTensorInfo(),

outputInfo,

desc);

if (!isSupported)

{

return false;

}

armnn::IConnectableLayer* layer = data.m_Network->AddSoftmaxLayer(desc);

1300

assert(layer != nullptr);

1301

input.Connect(layer->GetInputSlot(0));

1302

Aron Virginas-Tar

2019-07-26 13:14:39 +0100

[diff] [blame]

1303

return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);

Francis Murtagh

2019-07-22 16:40:57 +0100

[diff] [blame]

1304

}

1305

Mike Kelly

0a87936

2019-07-29 16:56:31 +0100

[diff] [blame]

1306

bool HalPolicy::ConvertSub(const Operation& operation, const Model& model, ConversionData& data)

1307

{

1308

ALOGV("hal_1_2::HalPolicy::ConvertSub()");

1309

return ::ConvertSub<hal_1_2::HalPolicy>(operation, model, data);

1310

}

1311

Sadik Armagan

2019-07-25 09:09:40 +0100

[diff] [blame]

1312

bool HalPolicy::ConvertTanH(const Operation& operation, const Model& model, ConversionData& data)

1313

{

1314

ALOGV("hal_1_2::HalPolicy::ConvertTanH()");

1315

return ::ConvertTanH<hal_1_2::HalPolicy>(operation, model, data);

1316

}

1317

Ferran Balaguer

b2397fd

2019-07-25 12:12:39 +0100

[diff] [blame]

1318

bool HalPolicy::ConvertLstm(const Operation& operation, const Model& model, ConversionData& data)

1319

{

1320

// Inputs:

1321

// 00: The input: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, input_size], where

1322

// “batch_size” corresponds to the batching dimension, and “input_size” is the size of the input.

1323

LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);

1324

if (!input.IsValid())

1325

{

1326

return Fail("%s: Could not read input 0: input", __func__);

1327

}

1328

// 18: The output state: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, output_size].

1329

LayerInputHandle outputStateIn = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 18, model, data);

1330

if (!outputStateIn.IsValid())

1331

{

1332

return Fail("%s: Could not read input 18: outputStateIn", __func__);

1333

}

1334

// 19: The cell state: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, num_units].

1335

LayerInputHandle cellStateIn = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 19, model, data);

1336

if (!cellStateIn.IsValid())

1337

{

1338

return Fail("%s: Could not read input 19: cellStateIn", __func__);

1339

}

1340

1341

// Get the mandatory input tensors:

1342

// 02: The input-to-forget weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape

1343

// [num_units, input_size].

1344

const ConstTensorPin inputToForgetWeightsPin =

1345

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 2, model, data);

1346

// 03: The input-to-cell weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape

1347

// [num_units, input_size].

1348

const ConstTensorPin inputToCellWeightsPin =

1349

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 3, model, data);

1350

// 04: The input-to-output weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape

1351

// [num_units, input_size].

1352

const ConstTensorPin inputToOutputWeightsPin =

1353

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 4, model, data);

1354

// 06: The recurrent-to-forget weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape

1355

// [num_units, output_size].

1356

const ConstTensorPin recurrentToForgetWeightsPin =

1357

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 6, model, data);

1358

// 07: The recurrent-to-cell weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape

1359

// [num_units, output_size].

1360

const ConstTensorPin recurrentToCellWeightsPin =

1361

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 7, model, data);

1362

// 08: The recurrent-to-output weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape

1363

// [num_units, output_size].

1364

const ConstTensorPin recurrentToOutputWeightsPin =

1365

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 8, model, data);

1366

// 13: The forget gate bias: A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].

1367

const ConstTensorPin forgetGateBiasPin =

1368

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 13, model, data);

1369

// 14: The cell bias: A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].

1370

const ConstTensorPin cellBiasPin =

1371

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 14, model, data);

1372

// 15: The output gate bias: A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].

1373

const ConstTensorPin outputGateBiasPin =

1374

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 15, model, data);

1375

1376

if (!inputToForgetWeightsPin.IsValid() ||

1377

!inputToCellWeightsPin.IsValid() ||

1378

!inputToOutputWeightsPin.IsValid() ||

1379

!recurrentToForgetWeightsPin.IsValid() ||

1380

!recurrentToCellWeightsPin.IsValid() ||

1381

!recurrentToOutputWeightsPin.IsValid() ||

1382

!forgetGateBiasPin.IsValid() ||

1383

!cellBiasPin.IsValid() ||

1384

!outputGateBiasPin.IsValid())

1385

{

1386

return Fail("%s: Operation has invalid tensor inputs", __func__);

1387

}

1388

1389

// Get the optional input tensors:

1390

// 01: The input-to-input weights: Optional. A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape

1391

// [num_units, input_size], where “num_units” corresponds to the number of cell units.

1392

const ConstTensorPin inputToInputWeightsPin =

1393

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,

1,

model,

data,

g_DontPermute,

nullptr,

true);

// 05: The recurrent-to-input weights: Optional. A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape

1402

// [num_units, output_size], where “output_size” corresponds to either the number of cell units (i.e.,

1403

// “num_units”), or the second dimension of the “projection_weights”, if defined.

1404

const ConstTensorPin recurrentToInputWeightsPin =

1405

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,

5,

model,

data,

g_DontPermute,

nullptr,

true);

// 09: The cell-to-input weights: Optional. A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].

1414

const ConstTensorPin cellToInputWeightsPin =

1415

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,

9,

model,

data,

g_DontPermute,

nullptr,

true);

// 10: The cell-to-forget weights: Optional. A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].

1424

const ConstTensorPin cellToForgetWeightsPin =

1425

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,

10,

model,

data,

g_DontPermute,

nullptr,

true);

// 11: The cell-to-output weights: Optional. A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].

1434

const ConstTensorPin cellToOutputWeightsPin =

1435

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,

11,

model,

data,

g_DontPermute,

nullptr,

true);

// 12: The input gate bias: Optional. A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].

1444

const ConstTensorPin inputGateBiasPin =

1445

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,

12,

model,

data,

g_DontPermute,

nullptr,

true);

// 16: The projection weights: Optional. A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape

1454

// [output_size, num_units].

1455

const ConstTensorPin projectionWeightsPin =

1456

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,

16,

model,

data,

g_DontPermute,

nullptr,

true);

// 17: The projection bias: Optional. A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [output_size].

1465

const ConstTensorPin projectionBiasPin =

1466

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,

17,

model,

data,

g_DontPermute,

nullptr,

true);

if ((!inputToInputWeightsPin.IsValid() && !inputToInputWeightsPin.IsOptional()) ||

1475

(!recurrentToInputWeightsPin.IsValid() && !recurrentToInputWeightsPin.IsOptional()) ||

1476

(!cellToInputWeightsPin.IsValid() && !cellToInputWeightsPin.IsOptional()) ||

1477

(!cellToForgetWeightsPin.IsValid() && !cellToForgetWeightsPin.IsOptional()) ||

1478

(!cellToOutputWeightsPin.IsValid() && !cellToOutputWeightsPin.IsOptional()) ||

1479

(!inputGateBiasPin.IsValid() && !inputGateBiasPin.IsOptional()) ||

1480

(!projectionWeightsPin.IsValid() && !projectionWeightsPin.IsOptional()) ||

1481

(!projectionBiasPin.IsValid() && !projectionBiasPin.IsOptional()))

1482

{

1483

return Fail("%s: Operation has invalid tensor inputs", __func__);

1484

}

1485

1486

// Get the mandatory input scalars (actually 1-D tensors of size 1):

1487

// 20: The activation function: A value indicating the activation function:

1488

// 0: None; 1: Relu; 3: Relu6; 4: Tanh; 6: Sigmoid.

1489

// 21: The clipping threshold: for the cell state, such that values are bound within [-cell_clip, cell_clip].

1490

// If set to 0.0 then clipping is disabled.

1491

// 22: The clipping threshold: for the output from the projection layer, such that values are bound within

1492

// [-proj_clip, proj_clip]. If set to 0.0 then clipping is disabled.

1493

ActivationFn activation;

1494

float cellClip;

1495

float projClip;

1496

if (!GetInputActivationFunctionFromTensor<hal_1_2::HalPolicy>(operation, 20, activation, model, data) ||

1497

!GetInputScalar<hal_1_2::HalPolicy>(operation, 21, OperandType::FLOAT32, cellClip, model, data) ||

1498

!GetInputScalar<hal_1_2::HalPolicy>(operation, 22, OperandType::FLOAT32, projClip, model, data))

1499

{

1500

return Fail("%s: Operation has invalid scalar inputs", __func__);

1501

}

1502

1503

// Get the normalization tensors

1504

// 23: The input layer normalization weights. A 1-D tensor of shape [num_units].

1505

// Used to rescale normalized inputs to activation at input gate.

1506

const ConstTensorPin inputLayerNormWeightsPin =

1507

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,

23,

model,

data,

g_DontPermute,

nullptr,

true);

// 24: The forget layer normalization weights. A 1-D tensor of shape [num_units].

1516

// Used to rescale normalized inputs to activation at forget gate.

1517

const ConstTensorPin forgetLayerNormWeightsPin =

1518

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,

24,

model,

data,

g_DontPermute,

nullptr,

true);

// 25: The cell layer normalization weights. A 1-D tensor of shape [num_units].

1527

// Used to rescale normalized inputs to activation at cell gate.

1528

const ConstTensorPin cellLayerNormWeightsPin =

1529

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,

25,

model,

data,

g_DontPermute,

nullptr,

true);

// 26: The output layer normalization weights. A 1-D tensor of shape [num_units].

1538

// Used to rescale normalized inputs to activation at output gate.

1539

const ConstTensorPin outputLayerNormWeightsPin =

1540

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,

26,

model,

data,

g_DontPermute,

nullptr,

true);

// Outputs:

// 00: The scratch buffer: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, num_units * 4]

1550

// with CIFG, or [batch_size, num_units * 3] without CIFG.

1551

const Operand* scratchBuffer = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);

1552

if (!scratchBuffer)

1553

{

1554

return Fail("%s: Could not read output 0: scratchBuffer", __func__);

1555

}

1556

// 01: The output state (out): A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, output_size].

1557

const Operand* outputStateOut = GetOutputOperand<hal_1_2::HalPolicy>(operation, 1, model);

1558

if (!outputStateOut)

1559

{

1560

return Fail("%s: Could not read output 1: outputStateOut", __func__);

1561

}

1562

// 02: The cell state (out): A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, num_units].

1563

const Operand* cellStateOut = GetOutputOperand<hal_1_2::HalPolicy>(operation, 2, model);

1564

if (!cellStateOut)

1565

{

1566

return Fail("%s: Could not read output 2: cellStateOut", __func__);

1567

}

1568

// 03: The output: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, output_size]. This is

1569

// effectively the same as the current “output state (out)” value.

1570

const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 3, model);

1571

if (!output)

1572

{

1573

return Fail("%s: Could not read output 3: output", __func__);

1574

}

1575

1576

// set the params structure for the AddLstmLayer call

1577

armnn::LstmInputParams params;

1578

params.m_InputToInputWeights = inputToInputWeightsPin.GetConstTensorPtr();

1579

params.m_InputToForgetWeights = inputToForgetWeightsPin.GetConstTensorPtr();

1580

params.m_InputToCellWeights = inputToCellWeightsPin.GetConstTensorPtr();

1581

params.m_InputToOutputWeights = inputToOutputWeightsPin.GetConstTensorPtr();

1582

params.m_RecurrentToInputWeights = recurrentToInputWeightsPin.GetConstTensorPtr();

1583

params.m_RecurrentToForgetWeights = recurrentToForgetWeightsPin.GetConstTensorPtr();

1584

params.m_RecurrentToCellWeights = recurrentToCellWeightsPin.GetConstTensorPtr();

1585

params.m_RecurrentToOutputWeights = recurrentToOutputWeightsPin.GetConstTensorPtr();

1586

params.m_CellToInputWeights = cellToInputWeightsPin.GetConstTensorPtr();

1587

params.m_CellToForgetWeights = cellToForgetWeightsPin.GetConstTensorPtr();

1588

params.m_CellToOutputWeights = cellToOutputWeightsPin.GetConstTensorPtr();

1589

params.m_InputGateBias = inputGateBiasPin.GetConstTensorPtr();

1590

params.m_ForgetGateBias = forgetGateBiasPin.GetConstTensorPtr();

1591

params.m_CellBias = cellBiasPin.GetConstTensorPtr();

1592

params.m_OutputGateBias = outputGateBiasPin.GetConstTensorPtr();

1593

params.m_ProjectionWeights = projectionWeightsPin.GetConstTensorPtr();

1594

params.m_ProjectionBias = projectionBiasPin.GetConstTensorPtr();

1595

params.m_InputLayerNormWeights = inputLayerNormWeightsPin.GetConstTensorPtr();

1596

params.m_ForgetLayerNormWeights = forgetLayerNormWeightsPin.GetConstTensorPtr();

1597

params.m_CellLayerNormWeights = cellLayerNormWeightsPin.GetConstTensorPtr();

1598

params.m_OutputLayerNormWeights = outputLayerNormWeightsPin.GetConstTensorPtr();

1599

1600

// set the layer descriptor

1601

armnn::LstmDescriptor desc;

1602

desc.m_ActivationFunc = activation;

1603

desc.m_ClippingThresCell = cellClip;

1604

desc.m_ClippingThresProj = projClip;

1605

desc.m_CifgEnabled = (params.m_InputToInputWeights == nullptr ||

1606

params.m_RecurrentToInputWeights == nullptr ||

1607

params.m_InputGateBias == nullptr);

1608

desc.m_PeepholeEnabled = (params.m_CellToForgetWeights != nullptr ||

1609

params.m_CellToOutputWeights != nullptr);

1610

desc.m_ProjectionEnabled = (params.m_ProjectionWeights != nullptr);

1611

desc.m_LayerNormEnabled = (params.m_InputLayerNormWeights != nullptr ||

1612

params.m_ForgetLayerNormWeights != nullptr ||

1613

params.m_CellLayerNormWeights != nullptr ||

1614

params.m_OutputLayerNormWeights != nullptr);

1615

1616

// validate the optional input groups

1617

if (desc.m_CifgEnabled &&

1618

(params.m_InputToInputWeights != nullptr ||

1619

params.m_RecurrentToInputWeights != nullptr ||

1620

params.m_InputGateBias != nullptr))

1621

{

1622

return Fail("%s: All, or none, of input-to-input weights, recurrent-to-input weights,"

1623

" and input gate bias must be provided", __func__);

1624

}

1625

1626

if (!desc.m_ProjectionEnabled && params.m_ProjectionBias != nullptr)

1627

{

1628

return Fail("%s: projection bias should not be provided without projection weights", __func__);

1629

}

1630

1631

if (desc.m_PeepholeEnabled &&

1632

(params.m_CellToForgetWeights == nullptr ||

1633

params.m_CellToOutputWeights == nullptr ||

1634

(!desc.m_CifgEnabled && params.m_CellToInputWeights == nullptr)))

1635

{

1636

return Fail("%s: All, or none, of cell-to-forget weights and cell-to-output weights must be provided"

1637

" and, if CIFG is not enabled, cell-to-input weights must also be provided", __func__);

1638

}

1639

1640

if (desc.m_LayerNormEnabled &&

1641

(params.m_ForgetLayerNormWeights == nullptr ||

1642

params.m_CellLayerNormWeights == nullptr ||

1643

params.m_OutputLayerNormWeights == nullptr ||

1644

(!desc.m_CifgEnabled && params.m_InputLayerNormWeights == nullptr)))

1645

{

1646

return Fail("%s: All, or none, of forget-norm weights, cell-norm weights and output-norm weights must be"

1647

" provided and, if CIFG is not enabled, input-norm weights must also be provided", __func__);

1648

}

1649

1650

// Check if the layer is supported

1651

// Inputs

1652

const armnn::TensorInfo& inputInfo = input.GetTensorInfo();

1653

const armnn::TensorInfo& outputStateInInfo = outputStateIn.GetTensorInfo();

1654

const armnn::TensorInfo& cellStateInInfo = cellStateIn.GetTensorInfo();

1655

1656

// Outputs

1657

const armnn::TensorInfo& scratchBufferInfo = GetTensorInfoForOperand(*scratchBuffer);

1658

const armnn::TensorInfo& outputStateOutInfo = GetTensorInfoForOperand(*outputStateOut);

1659

const armnn::TensorInfo& cellStateOutInfo = GetTensorInfoForOperand(*cellStateOut);

1660

const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

1661

Ferran Balaguer

a4a629a

2019-07-30 10:16:13 +0100

[diff] [blame]

1662

if (IsDynamicTensor(scratchBufferInfo) ||

1663

IsDynamicTensor(outputStateOutInfo) ||

1664

IsDynamicTensor(cellStateOutInfo) ||

1665

IsDynamicTensor(outputInfo))

1666

{

1667

return Fail("%s: Dynamic output tensors are not supported", __func__);

1668

}

1669

Ferran Balaguer

b2397fd

2019-07-25 12:12:39 +0100

[diff] [blame]

1670

// Basic parameters

1671

armnn::LstmInputParamsInfo paramsInfo;

1672

paramsInfo.m_InputToForgetWeights = &(params.m_InputToForgetWeights->GetInfo());

1673

paramsInfo.m_InputToCellWeights = &(params.m_InputToCellWeights->GetInfo());

1674

paramsInfo.m_InputToOutputWeights = &(params.m_InputToOutputWeights->GetInfo());

1675

paramsInfo.m_RecurrentToForgetWeights = &(params.m_RecurrentToForgetWeights->GetInfo());

1676

paramsInfo.m_RecurrentToCellWeights = &(params.m_RecurrentToCellWeights->GetInfo());

1677

paramsInfo.m_RecurrentToOutputWeights = &(params.m_RecurrentToOutputWeights->GetInfo());

1678

paramsInfo.m_ForgetGateBias = &(params.m_ForgetGateBias->GetInfo());

1679

paramsInfo.m_CellBias = &(params.m_CellBias->GetInfo());

1680

paramsInfo.m_OutputGateBias = &(params.m_OutputGateBias->GetInfo());

1681

1682

// Optional parameters

1683

if(!desc.m_CifgEnabled)

1684

{

1685

paramsInfo.m_InputToInputWeights = &(params.m_InputToInputWeights->GetInfo());

1686

paramsInfo.m_RecurrentToInputWeights = &(params.m_RecurrentToInputWeights->GetInfo());

1687

if (params.m_CellToInputWeights != nullptr)

1688

{

1689

paramsInfo.m_CellToInputWeights = &(params.m_CellToInputWeights->GetInfo());

1690

}

1691

paramsInfo.m_InputGateBias = &(params.m_InputGateBias->GetInfo());

1692

}

1693

1694

if(desc.m_ProjectionEnabled)

1695

{

1696

paramsInfo.m_ProjectionWeights = &(params.m_ProjectionWeights->GetInfo());

1697

if (params.m_ProjectionBias != nullptr)

1698

{

1699

paramsInfo.m_ProjectionBias = &(params.m_ProjectionBias->GetInfo());

}

}

if(desc.m_PeepholeEnabled)

1704

{

1705

paramsInfo.m_CellToForgetWeights = &(params.m_CellToForgetWeights->GetInfo());

1706

paramsInfo.m_CellToOutputWeights = &(params.m_CellToOutputWeights->GetInfo());

1707

}

1708

1709

if (desc.m_LayerNormEnabled)

1710

{

1711

if(!desc.m_CifgEnabled)

1712

{

1713

paramsInfo.m_InputLayerNormWeights = &(params.m_InputLayerNormWeights->GetInfo());

1714

}

1715

paramsInfo.m_ForgetLayerNormWeights = &(params.m_ForgetLayerNormWeights->GetInfo());

1716

paramsInfo.m_CellLayerNormWeights = &(params.m_CellLayerNormWeights->GetInfo());

1717

paramsInfo.m_OutputLayerNormWeights = &(params.m_OutputLayerNormWeights->GetInfo());

1718

}

1719

1720

bool isSupported = false;

1721

FORWARD_LAYER_SUPPORT_FUNC(__func__,

IsLstmSupported,

data.m_Backends,

isSupported,

inputInfo,

outputStateInInfo,

cellStateInInfo,

scratchBufferInfo,

outputStateOutInfo,

cellStateOutInfo,

outputInfo,

desc,

paramsInfo);

if (!isSupported)

{

return false;

}

// Add the layer

armnn::IConnectableLayer* layer = data.m_Network->AddLstmLayer(desc, params, "Lstm");

1741

1742

input.Connect(layer->GetInputSlot(0));

1743

outputStateIn.Connect(layer->GetInputSlot(1));

1744

cellStateIn.Connect(layer->GetInputSlot(2));

1745

1746

return (SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, 0, model, data) &&

1747

SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 1, *layer, 1, model, data) &&

1748

SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 2, *layer, 2, model, data) &&

1749

SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 3, *layer, 3, model, data));

1750

}

1751

Sadik Armagan

2019-09-04 15:16:18 +0100

[diff] [blame]

1752

bool HalPolicy::ConvertSqrt(const Operation& operation, const Model& model, ConversionData& data)

1753

{

1754

ALOGV("hal_1_2::HalPolicy::ConvertSqrt()");

1755

armnn::ActivationDescriptor desc;

1756

desc.m_Function = armnn::ActivationFunction::Sqrt;

1757

1758

return ::ConvertToActivation<hal_1_2::HalPolicy>(operation, __func__, desc, model, data);

1759

}

1760

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

1761

bool HalPolicy::ConvertSqueeze(const Operation& operation, const Model& model, ConversionData& data)

1762

{

Sadik Armagan

2019-09-04 15:16:18 +0100

[diff] [blame]

1763

ALOGV("hal_1_2::HalPolicy::ConvertSqueeze()");

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

1764

return ::ConvertSqueeze<hal_1_2::HalPolicy>(operation, model, data);

1765

}

1766

1767

bool HalPolicy::ConvertStridedSlice(const Operation& operation, const Model& model, ConversionData& data)

1768

{

Sadik Armagan

2019-09-04 15:16:18 +0100

[diff] [blame]

1769

ALOGV("hal_1_2::HalPolicy::ConvertStridedSlice()");

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

1770

return ::ConvertStridedSlice<hal_1_2::HalPolicy>(operation, model, data);

1771

}

1772

1773

bool HalPolicy::ConvertTranspose(const Operation& operation, const Model& model, ConversionData& data)

1774

{

Sadik Armagan

2019-09-04 15:16:18 +0100

[diff] [blame]

1775

ALOGV("hal_1_2::HalPolicy::ConvertTranspose()");

Mike Kelly

2019-08-14 17:00:48 +0100

[diff] [blame]

1776

return ::ConvertTranspose<hal_1_2::HalPolicy>(operation, model, data);

1777

}

1778

Aron Virginas-Tar

8b99168

2019-07-31 12:54:59 +0100

[diff] [blame]

1779

bool HalPolicy::ConvertTransposeConv2d(const Operation& operation, const Model& model, ConversionData& data)

David Monahan

2019-06-27 11:37:47 +0100

[diff] [blame]

1780

{

1781

LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);

1782

1783

if (!input.IsValid())

1784

{

1785

return Fail("%s: Operation has invalid inputs", __func__);

1786

}

1787

1788

const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);

if (!output)

{

return Fail("%s: Could not read output 0", __func__);

1793

}

1794

1795

const armnn::TensorInfo& inputInfo = input.GetTensorInfo();

1796

const armnn::TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

1797

if (IsDynamicTensor(outputInfo))

1798

{

1799

return Fail("%s: Dynamic output tensors are not supported", __func__);

1800

}

1801

1802

// ArmNN does not currently support non-fixed weights or bias

1803

// Find the shape of the weights tensor. In AndroidNN this will be [ 1, H, W, I * M ]

1804

const Operand* weightsOperand = GetInputOperand<hal_1_2::HalPolicy>(operation, 1, model);

1805

1806

if (weightsOperand == nullptr)

1807

{

1808

return Fail("%s: Operand is invalid", __func__);

1809

}

1810

armnn::TransposeConvolution2dDescriptor desc;

1811

desc.m_DataLayout = armnn::DataLayout::NHWC;

1812

1813

// Determine whether padding is implicit or explicit

1814

bool implicitPadding = operation.inputs.size() == 9;

1815

1816

if (implicitPadding )

1817

{

1818

desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 8, model, data);

}

else

{

desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 10, model, data);

1823

}

1824

1825

armnnUtils::DataLayoutIndexed dataLayoutIndexed(desc.m_DataLayout);

1826

unsigned int widthIndex = dataLayoutIndexed.GetWidthIndex();

1827

unsigned int heightIndex = dataLayoutIndexed.GetHeightIndex();

1828

1829

const armnn::PermutationVector OHWIToOIHW = {0, 2, 3, 1};

1830

1831

// The shape of the weight is [depth_out, filter_height, filter_width, depth_in].

1832

// We have to permute it to OIHW if the data layout is NCHW.

1833

const ConstTensorPin weightsPin = (desc.m_DataLayout == armnn::DataLayout::NCHW) ?

1834

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data, OHWIToOIHW) :

1835

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data);

1836

1837

// Bias is a 1D tensor

1838

const ConstTensorPin biasPin =

1839

ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 2, model, data);

1840

1841

if (!weightsPin.IsValid())

1842

{

1843

return Fail("%s: Operation has invalid weights", __func__);

1844

}

1845

1846

if (!biasPin.IsValid())

1847

{

1848

return Fail("%s: Operation has invalid biases", __func__);

1849

}

1850

1851

armnn::ConstTensor weights = weightsPin.GetConstTensor();

1852

armnn::ConstTensor bias = biasPin.GetConstTensor();

1853

SanitizeBiasQuantizationScale(bias.GetInfo(), weights.GetInfo(), inputInfo);

1854

1855

ActivationFn activation;

1856

1857

if (implicitPadding)

1858

{

Sadik Armagan

3e3003e

2019-08-13 12:54:34 +0100

[diff] [blame]

int32_t strideX{0};

int32_t strideY{0};

int32_t padLeft{0};

int32_t padRight{0};

int32_t padTop{0};

int32_t padBottom{0};

1865

David Monahan

2019-06-27 11:37:47 +0100

[diff] [blame]

1866

android::nn::PaddingScheme paddingScheme;

1867

if (!GetInputPaddingScheme<hal_1_2::HalPolicy>(operation, 4, paddingScheme, model, data) ||

Sadik Armagan

3e3003e

2019-08-13 12:54:34 +0100

[diff] [blame]

1868

!GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, strideX, model, data) ||

1869

!GetInputScalar<hal_1_2::HalPolicy>(operation, 6, OperandType::INT32, strideY, model, data) ||

David Monahan

2019-06-27 11:37:47 +0100

[diff] [blame]

1870

!GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 7, activation, model, data))

1871

{

1872

return Fail("%s: Operation has invalid inputs (implicit padding)", __func__);

1873

}

1874

1875

const uint32_t kernelX = weights.GetShape()[widthIndex];

1876

const uint32_t kernelY = weights.GetShape()[heightIndex];

Narumol Prangnawarat

c8bdb39

2019-08-01 15:51:44 +0100

[diff] [blame]

1877

const uint32_t outputX = outputInfo.GetShape()[widthIndex];

1878

const uint32_t outputY = outputInfo.GetShape()[heightIndex];

David Monahan

2019-06-27 11:37:47 +0100

[diff] [blame]

1879

Narumol Prangnawarat

c8bdb39

2019-08-01 15:51:44 +0100

[diff] [blame]

1880

CalcPaddingTransposeConv(outputX, kernelX, desc.m_StrideX, padLeft, padRight, paddingScheme);

1881

CalcPaddingTransposeConv(outputY, kernelY, desc.m_StrideY, padTop, padBottom, paddingScheme);

1882

1883

// NOTE: The Android NN API allows for negative padding values in TransposeConv2d,

1884

// but Arm NN only supports values >= 0

1885

if (padLeft < 0 || padRight < 0 || padTop < 0 || padBottom < 0)

1886

{

1887

return Fail("%s: Negative padding values are not supported", __func__);

1888

}

1889

Sadik Armagan

3e3003e

2019-08-13 12:54:34 +0100

[diff] [blame]

1890

desc.m_StrideX = boost::numeric_cast<uint32_t>(strideX);

1891

desc.m_StrideY = boost::numeric_cast<uint32_t>(strideY);

Narumol Prangnawarat

c8bdb39

2019-08-01 15:51:44 +0100

[diff] [blame]

1892

desc.m_PadLeft = boost::numeric_cast<uint32_t>(padLeft);

1893

desc.m_PadRight = boost::numeric_cast<uint32_t>(padRight);

1894

desc.m_PadTop = boost::numeric_cast<uint32_t>(padTop);

1895

desc.m_PadBottom = boost::numeric_cast<uint32_t>(padBottom);

David Monahan

2019-06-27 11:37:47 +0100

[diff] [blame]

1896

}

1897

else if (operation.inputs.size() == 11)

1898

{

1899

// explicit padding

1900

if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 3, OperandType::INT32, desc.m_PadLeft, model, data) ||

1901

!GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_PadRight, model, data) ||

1902

!GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_PadTop, model, data) ||

1903

!GetInputScalar<hal_1_2::HalPolicy>(operation, 6, OperandType::INT32, desc.m_PadBottom, model, data) ||

1904

!GetInputScalar<hal_1_2::HalPolicy>(operation, 7, OperandType::INT32, desc.m_StrideX, model, data) ||

1905

!GetInputScalar<hal_1_2::HalPolicy>(operation, 8, OperandType::INT32, desc.m_StrideY, model, data) ||

1906

!GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 9, activation, model, data))

1907

{

1908

return Fail("%s: Operation has invalid inputs (explicit padding)", __func__);

}

}

else

{

return Fail("%s: Unsupported number of operation inputs", __func__);

1914

}

1915

1916

desc.m_BiasEnabled = true;

1917

armnn::Optional<armnn::TensorInfo> biases(bias.GetInfo());

1918

1919

bool isSupported = false;

1920

FORWARD_LAYER_SUPPORT_FUNC(__func__,

1921

IsTransposeConvolution2dSupported,

data.m_Backends,

isSupported,

inputInfo,

outputInfo,

desc,

weights.GetInfo(),

biases);

if (!isSupported)

{

return false;

}

armnn::IConnectableLayer* startLayer =

1935

data.m_Network->AddTransposeConvolution2dLayer(desc, weights, armnn::Optional<armnn::ConstTensor>(bias));

1936

if (!startLayer)

1937

{

1938

return Fail("%s: AddTransposeConvolution2dLayer failed", __func__);

1939

}

1940

1941

armnn::IConnectableLayer* endLayer = ProcessActivation(outputInfo, activation, startLayer, data);

1942

if (!endLayer)

1943

{

1944

return Fail("%s: ProcessActivation failed", __func__);

1945

}

1946

1947

input.Connect(startLayer->GetInputSlot(0));

1948

1949

return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *endLayer, model, data);

1950

}

1951

Mike Kelly

2019-06-11 16:35:25 +0100

[diff] [blame]

1952

} // namespace hal_1_2

Matteo Martincigh