blob: 61daeef5befdc893e29a8c38ac13903adf7f721f [file] [log] [blame]
Mike Kellyb5fdf382019-06-11 16:35:25 +01001//
2// Copyright © 2017 Arm Ltd. All rights reserved.
3// SPDX-License-Identifier: MIT
4//
5
6#include "HalPolicy.hpp"
Aron Virginas-Tar573a8fa2019-07-23 14:01:37 +01007#include "Utils.hpp"
Aron Virginas-Tarf03fcf02019-07-09 17:44:24 +01008
Teresa Charlin8f6429d2019-10-01 13:10:15 +01009#include <armnn/TypesUtils.hpp>
10
Matteo Martincigh00d6ed12019-11-28 17:13:24 +000011#include <armnnUtils/DataLayoutIndexed.hpp>
12#include <armnnUtils/TensorUtils.hpp>
13
14#include <Half.hpp>
15
Aron Virginas-Tar7a6d11b2019-07-03 15:27:08 +010016#include <cmath>
Aron Virginas-Tar3e0982b2019-10-29 14:25:09 +000017#include <string>
Aron Virginas-Tar7a6d11b2019-07-03 15:27:08 +010018
Mike Kellyb5fdf382019-06-11 16:35:25 +010019namespace armnn_driver
20{
21namespace hal_1_2
22{
23
Teresa Charlin8f6429d2019-10-01 13:10:15 +010024using namespace armnn;
25
Aron Virginas-Tar65a1b1d2019-11-15 15:59:51 +000026namespace
27{
28
29bool IsQSymmDequantizeForWeights(const Operation& operation, const Model& model)
30{
31 const Operand* operand = GetInputOperand<hal_1_2::HalPolicy>(operation, 0, model);
32 if (!operand)
33 {
34 return false;
35 }
36
37 if(!IsQSymm8(*operand))
38 {
39 // Only QSymm8 weights are dequantized on the fly by the driver
40 return false;
41 }
42
43 if (!IsOperandConstant<hal_1_2::HalPolicy>(*operand))
44 {
45 // Non-const input is not accepted for weights
46 return false;
47 }
48
49 // Iterate through all the operations and find the operation feeding from the Dequantize output
50 const size_t outputIndex = operation.outputs[0];
51 for (uint32_t operationIdx = 0; operationIdx < model.operations.size(); ++operationIdx)
52 {
53 const auto& operationIt = model.operations[operationIdx];
54 switch (operationIt.type)
55 {
56 case HalPolicy::OperationType::FULLY_CONNECTED:
57 if (outputIndex == operationIt.inputs[1]) // Weights are bound to slot 1
58 {
59 // If the output is going into the FC weights return true
60 return true;
61 }
62 break;
63 case HalPolicy::OperationType::LSTM:
64 for (size_t k = 0; k < operationIt.inputs.size(); ++k)
65 {
66 if (outputIndex == operationIt.inputs[k])
67 {
68 // If the output is going into the LSTM weights return true
69 return true;
70 }
71 }
72 break;
73 default:
74 break;
75 }
76 }
77
78 return false;
79}
80
81} // anonymous namespace
82
// Dispatches a HAL 1.2 operation to the matching Convert* handler.
// Returns the handler's result (true on successful conversion to ArmNN layers),
// or Fail() (false) for operation types the driver does not support.
bool HalPolicy::ConvertOperation(const Operation& operation, const Model& model, ConversionData& data)
{
    switch (operation.type)
    {
        case V1_2::OperationType::ABS:
            return ConvertElementwiseUnary(operation, model, data, UnaryOperation::Abs);
        case V1_2::OperationType::ADD:
            return ConvertAdd(operation, model, data);
        case V1_2::OperationType::ARGMAX:
            return ConvertArgMinMax(operation, model, data, ArgMinMaxFunction::Max);
        case V1_2::OperationType::ARGMIN:
            return ConvertArgMinMax(operation, model, data, ArgMinMaxFunction::Min);
        case V1_2::OperationType::AVERAGE_POOL_2D:
            return ConvertAveragePool2d(operation, model, data);
        case V1_2::OperationType::BATCH_TO_SPACE_ND:
            return ConvertBatchToSpaceNd(operation, model, data);
        case V1_2::OperationType::CONCATENATION:
            return ConvertConcatenation(operation, model, data);
        case V1_2::OperationType::CONV_2D:
            return ConvertConv2d(operation, model, data);
        case V1_2::OperationType::DEPTH_TO_SPACE:
            return ConvertDepthToSpace(operation, model, data);
        case V1_2::OperationType::DEPTHWISE_CONV_2D:
            return ConvertDepthwiseConv2d(operation, model, data);
        case V1_2::OperationType::DEQUANTIZE:
            return ConvertDequantize(operation, model, data);
        case V1_2::OperationType::DIV:
            return ConvertDiv(operation, model, data);
        // The comparison operations all share one handler parameterised by ComparisonOperation
        case V1_2::OperationType::EQUAL:
            return ConvertComparison(operation, model, data, ComparisonOperation::Equal);
        case V1_2::OperationType::EXPAND_DIMS:
            return ConvertExpandDims(operation, model, data);
        case V1_2::OperationType::FLOOR:
            return ConvertFloor(operation, model, data);
        case V1_2::OperationType::FULLY_CONNECTED:
            return ConvertFullyConnected(operation, model, data);
        case V1_2::OperationType::GREATER:
            return ConvertComparison(operation, model, data, ComparisonOperation::Greater);
        case V1_2::OperationType::GREATER_EQUAL:
            return ConvertComparison(operation, model, data, ComparisonOperation::GreaterOrEqual);
        case V1_2::OperationType::GROUPED_CONV_2D:
            return ConvertGroupedConv2d(operation, model, data);
        case V1_2::OperationType::INSTANCE_NORMALIZATION:
            return ConvertInstanceNormalization(operation, model, data);
        case V1_2::OperationType::L2_NORMALIZATION:
            return ConvertL2Normalization(operation, model, data);
        case V1_2::OperationType::L2_POOL_2D:
            return ConvertL2Pool2d(operation, model, data);
        case V1_2::OperationType::LESS:
            return ConvertComparison(operation, model, data, ComparisonOperation::Less);
        case V1_2::OperationType::LESS_EQUAL:
            return ConvertComparison(operation, model, data, ComparisonOperation::LessOrEqual);
        case V1_2::OperationType::LOCAL_RESPONSE_NORMALIZATION:
            return ConvertLocalResponseNormalization(operation, model, data);
        case V1_2::OperationType::LOGISTIC:
            return ConvertLogistic(operation, model, data);
        case V1_2::OperationType::LOG_SOFTMAX:
            return ConvertLogSoftmax(operation, model, data);
        case V1_2::OperationType::LSTM:
            return ConvertLstm(operation, model, data);
        case V1_2::OperationType::MAX_POOL_2D:
            return ConvertMaxPool2d(operation, model, data);
        case V1_2::OperationType::MAXIMUM:
            return ConvertMaximum(operation, model, data);
        case V1_2::OperationType::MEAN:
            return ConvertMean(operation, model, data);
        case V1_2::OperationType::MINIMUM:
            return ConvertMinimum(operation, model, data);
        case V1_2::OperationType::MUL:
            return ConvertMul(operation, model, data);
        case V1_2::OperationType::NOT_EQUAL:
            return ConvertComparison(operation, model, data, ComparisonOperation::NotEqual);
        case V1_2::OperationType::PAD:
            return ConvertPad(operation, model, data);
        case V1_2::OperationType::PAD_V2:
            return ConvertPadV2(operation, model, data);
        case V1_2::OperationType::PRELU:
            return ConvertPrelu(operation, model, data);
        case V1_2::OperationType::QUANTIZE:
            return ConvertQuantize(operation, model, data);
        case V1_2::OperationType::QUANTIZED_16BIT_LSTM:
            return ConvertQuantizedLstm(operation, model, data);
        case V1_2::OperationType::RELU:
            return ConvertReLu(operation, model, data);
        case V1_2::OperationType::RELU1:
            return ConvertReLu1(operation, model, data);
        case V1_2::OperationType::RELU6:
            return ConvertReLu6(operation, model, data);
        case V1_2::OperationType::RESHAPE:
            return ConvertReshape(operation, model, data);
        // RESIZE_BILINEAR and RESIZE_NEAREST_NEIGHBOR share one handler parameterised by ResizeMethod
        case V1_2::OperationType::RESIZE_BILINEAR:
            return ConvertResize(operation, model, data, ResizeMethod::Bilinear);
        case V1_2::OperationType::RESIZE_NEAREST_NEIGHBOR:
            return ConvertResize(operation, model, data, ResizeMethod::NearestNeighbor);
        case V1_2::OperationType::RSQRT:
            return ConvertElementwiseUnary(operation, model, data, UnaryOperation::Rsqrt);
        case V1_2::OperationType::SQRT:
            return ConvertSqrt(operation, model, data);
        case V1_2::OperationType::SQUEEZE:
            return ConvertSqueeze(operation, model, data);
        case V1_2::OperationType::STRIDED_SLICE:
            return ConvertStridedSlice(operation, model, data);
        case V1_2::OperationType::TRANSPOSE:
            return ConvertTranspose(operation, model, data);
        case V1_2::OperationType::TRANSPOSE_CONV_2D:
            return ConvertTransposeConv2d(operation, model, data);
        case V1_2::OperationType::SOFTMAX:
            return ConvertSoftmax(operation, model, data);
        case V1_2::OperationType::SPACE_TO_BATCH_ND :
            return ConvertSpaceToBatchNd(operation, model, data);
        case V1_2::OperationType::SPACE_TO_DEPTH:
            return ConvertSpaceToDepth(operation, model, data);
        case V1_2::OperationType::SUB:
            return ConvertSub(operation, model, data);
        case V1_2::OperationType::TANH:
            return ConvertTanH(operation, model, data);
        default:
            return Fail("%s: Operation type %s not supported in ArmnnDriver",
                        __func__, toString(operation.type).c_str());
    }
}
204
// Converts a HAL ADD operation by forwarding to the HAL-version-agnostic
// ::ConvertAdd implementation shared with the other HalPolicy versions.
bool HalPolicy::ConvertAdd(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertAdd()");
    return ::ConvertAdd<hal_1_2::HalPolicy>(operation, model, data);
}
210
// Converts a HAL ARGMAX/ARGMIN operation; argMinMaxFunction selects which of
// the two is built. Forwards to the shared ::ConvertArgMinMax implementation.
bool HalPolicy::ConvertArgMinMax(const V1_2::Operation& operation,
                                 const V1_2::Model& model,
                                 ConversionData& data,
                                 armnn::ArgMinMaxFunction argMinMaxFunction)
{
    ALOGV("hal_1_2::HalPolicy::ConvertArgMinMax()");
    return ::ConvertArgMinMax<hal_1_2::HalPolicy>(operation, model, data, argMinMaxFunction);
}
219
// Converts a HAL AVERAGE_POOL_2D operation via the shared pooling handler,
// selecting the Average pooling algorithm.
bool HalPolicy::ConvertAveragePool2d(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertAveragePool2d()");
    return ConvertPooling2d<hal_1_2::HalPolicy>(operation, __func__, PoolingAlgorithm::Average, model, data);
}
225
// Converts a HAL BATCH_TO_SPACE_ND operation by forwarding to the shared
// ::ConvertBatchToSpaceNd implementation.
bool HalPolicy::ConvertBatchToSpaceNd(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertBatchToSpaceNd()");
    return ::ConvertBatchToSpaceNd<hal_1_2::HalPolicy>(operation, model, data);
}
231
Aron Virginas-Tar3e0982b2019-10-29 14:25:09 +0000232bool HalPolicy::ConvertComparison(const Operation& operation,
233 const Model& model,
234 ConversionData& data,
235 ComparisonOperation comparisonOperation)
236{
237 ALOGV("hal_1_2::HalPolicy::ConvertComparison()");
238 ALOGV("comparisonOperation = %s", GetComparisonOperationAsCString(comparisonOperation));
239
240 LayerInputHandle input0 = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
241 LayerInputHandle input1 = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 1, model, data);
242
243 if (!(input0.IsValid() && input1.IsValid()))
244 {
245 return Fail("%s: Operation has invalid inputs", __func__);
246 }
247
248 const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
249 if (!output)
250 {
251 return Fail("%s: Could not read output 0", __func__);
252 }
253
254 const TensorInfo& inputInfo0 = input0.GetTensorInfo();
255 const TensorInfo& inputInfo1 = input1.GetTensorInfo();
256 const TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
257
258 if (IsDynamicTensor(outputInfo))
259 {
260 return Fail("%s: Dynamic output tensors are not supported", __func__);
261 }
262
263 ComparisonDescriptor descriptor(comparisonOperation);
264
265 bool isSupported = false;
266 FORWARD_LAYER_SUPPORT_FUNC(__func__,
267 IsComparisonSupported,
268 data.m_Backends,
269 isSupported,
270 inputInfo0,
271 inputInfo1,
272 outputInfo,
273 descriptor);
274
275 if (!isSupported)
276 {
277 return false;
278 }
279
280 IConnectableLayer* layer = data.m_Network->AddComparisonLayer(descriptor);
281 assert(layer != nullptr);
282
283 input0.Connect(layer->GetInputSlot(0));
284 input1.Connect(layer->GetInputSlot(1));
285
286 return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
287}
288
// Converts a HAL CONCATENATION operation by forwarding to the shared
// ::ConvertConcatenation implementation.
bool HalPolicy::ConvertConcatenation(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertConcatenation()");
    return ::ConvertConcatenation<hal_1_2::HalPolicy>(operation, model, data);
}
294
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100295bool HalPolicy::ConvertConv2d(const Operation& operation, const Model& model, ConversionData& data)
296{
Aron Virginas-Tar29404fb2019-07-24 13:55:31 +0100297 ALOGV("hal_1_2::HalPolicy::ConvertConv2d()");
298
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100299 LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
300 if (!input.IsValid())
301 {
302 return Fail("%s: Operation has invalid inputs", __func__);
303 }
304
305 const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
306 if (!output)
307 {
308 return Fail("%s: Could not read output 0", __func__);
309 }
310
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100311 const TensorInfo& inputInfo = input.GetTensorInfo();
312 const TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +0100313
314 if (IsDynamicTensor(outputInfo))
315 {
316 return Fail("%s: Dynamic output tensors are not supported", __func__);
317 }
Aron Virginas-Tar366e0a62019-07-10 13:01:41 +0100318
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100319 Convolution2dDescriptor desc;
320 desc.m_DataLayout = DataLayout::NHWC;
Mike Kellye1d60bb2019-07-11 11:44:52 +0100321
322 // Determine whether padding is implicit or explicit
323 bool implicitPadding = operation.inputs.size() == 7 ||
324 (operation.inputs.size() >= 8 &&
325 GetInputOperand<hal_1_2::HalPolicy>(operation, 7, model)->type == OperandType::BOOL);
326
327 if (implicitPadding)
328 {
329 desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 7, model, data);
330 }
331 else if (operation.inputs.size() >= 10)
332 {
333 desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 10, model, data);
334 }
335
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100336 const PermutationVector OHWIToOIHW = {0, 2, 3, 1};
Mike Kellye1d60bb2019-07-11 11:44:52 +0100337
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100338 // ArmNN does not currently support non-fixed weights or bias
Mike Kellye1d60bb2019-07-11 11:44:52 +0100339 // The NNAPI filter is always OHWI [depth_out, filter_height, filter_width, depth_in] but ArmNN expects the
340 // filter's height and width indices to match the input's height and width indices so we permute it to OIHW if
341 // the DataLayout is NCHW
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100342 const ConstTensorPin weightsPin = (desc.m_DataLayout == DataLayout::NCHW) ?
Mike Kellye1d60bb2019-07-11 11:44:52 +0100343 ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data, OHWIToOIHW) :
344 ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data);
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100345 const ConstTensorPin biasPin =
Mike Kellye1d60bb2019-07-11 11:44:52 +0100346 ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 2, model, data);
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100347
348 if (!weightsPin.IsValid())
349 {
350 return Fail("%s: Operation has invalid weights", __func__);
351 }
352
353 if (!biasPin.IsValid())
354 {
355 return Fail("%s: Operation has invalid biases", __func__);
356 }
357
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100358 ConstTensor weights = weightsPin.GetConstTensor();
359 ConstTensor bias = biasPin.GetConstTensor();
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100360 SanitizeBiasQuantizationScale(bias.GetInfo(), weights.GetInfo(), inputInfo);
361
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100362 ActivationFn activation;
363
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100364 if (implicitPadding)
365 {
366 android::nn::PaddingScheme paddingScheme;
367 if (!GetInputPaddingScheme<hal_1_2::HalPolicy>(operation, 3, paddingScheme, model, data) ||
368 !GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_StrideX, model, data) ||
369 !GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_StrideY, model, data) ||
370 !GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 6, activation, model, data) ||
371 !GetOptionalConvolutionDilationParams<hal_1_2::HalPolicy>(operation, 8, desc, model, data))
372 {
373 return Fail("%s: Operation has invalid inputs (implicit padding)", __func__);
374 }
375
Mike Kellye1d60bb2019-07-11 11:44:52 +0100376 armnnUtils::DataLayoutIndexed dataLayoutIndexed(desc.m_DataLayout);
377 unsigned int widthIndex = dataLayoutIndexed.GetWidthIndex();
378 unsigned int heightIndex = dataLayoutIndexed.GetHeightIndex();
379 const uint32_t kernelX = weights.GetShape()[widthIndex];
380 const uint32_t kernelY = weights.GetShape()[heightIndex];
381 const uint32_t inputX = inputInfo.GetShape()[widthIndex];
382 const uint32_t inputY = inputInfo.GetShape()[heightIndex];
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100383
Mike Kelly86b36d42019-07-12 16:39:33 +0100384 CalcPadding(inputX, kernelX, desc.m_StrideX, desc.m_DilationX, desc.m_PadLeft, desc.m_PadRight, paddingScheme);
385 CalcPadding(inputY, kernelY, desc.m_StrideY, desc.m_DilationY, desc.m_PadTop, desc.m_PadBottom, paddingScheme);
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100386
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100387 }
388 else if (operation.inputs.size() >= 10)
389 {
390 // explicit padding
391 if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 3, OperandType::INT32, desc.m_PadLeft, model, data) ||
392 !GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_PadRight, model, data) ||
393 !GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_PadTop, model, data) ||
394 !GetInputScalar<hal_1_2::HalPolicy>(operation, 6, OperandType::INT32, desc.m_PadBottom, model, data) ||
395 !GetInputScalar<hal_1_2::HalPolicy>(operation, 7, OperandType::INT32, desc.m_StrideX, model, data) ||
396 !GetInputScalar<hal_1_2::HalPolicy>(operation, 8, OperandType::INT32, desc.m_StrideY, model, data) ||
397 !GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 9, activation, model, data) ||
398 !GetOptionalConvolutionDilationParams<hal_1_2::HalPolicy>(operation, 11, desc, model, data))
399 {
400 return Fail("%s: Operation has invalid inputs (explicit padding)", __func__);
401 }
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100402 }
403 else
404 {
405 return Fail("%s: Unsupported number of operation inputs", __func__);
406 }
407
408 desc.m_BiasEnabled = true;
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100409 Optional<TensorInfo> biases(bias.GetInfo());
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100410
Ferran Balaguerd30093c2019-07-09 17:04:47 +0100411 bool isSupported = false;
412 FORWARD_LAYER_SUPPORT_FUNC(__func__,
413 IsConvolution2dSupported,
414 data.m_Backends,
415 isSupported,
416 inputInfo,
417 outputInfo,
418 desc,
419 weights.GetInfo(),
420 biases);
Aron Virginas-Tar2b173122019-07-15 14:29:09 +0100421
Ferran Balaguerd30093c2019-07-09 17:04:47 +0100422 if (!isSupported)
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100423 {
424 return false;
425 }
426
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100427 IConnectableLayer* startLayer =
428 data.m_Network->AddConvolution2dLayer(desc, weights, Optional<ConstTensor>(bias));
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100429
430 if (!startLayer)
431 {
432 return Fail("%s: AddConvolution2dLayer failed", __func__);
433 }
434
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100435 IConnectableLayer* endLayer = ProcessActivation(outputInfo, activation, startLayer, data);
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100436
437 if (!endLayer)
438 {
439 return Fail("%s: ProcessActivation failed", __func__);
440 }
441
442 input.Connect(startLayer->GetInputSlot(0));
443
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +0100444 return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *endLayer, model, data);
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100445}
446
// Converts a HAL DEPTH_TO_SPACE operation by forwarding to the shared
// ::ConvertDepthToSpace implementation.
bool HalPolicy::ConvertDepthToSpace(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertDepthToSpace()");
    return ::ConvertDepthToSpace<hal_1_2::HalPolicy>(operation, model, data);
}
452
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100453bool HalPolicy::ConvertDepthwiseConv2d(const Operation& operation, const Model& model, ConversionData& data)
454{
Aron Virginas-Tar29404fb2019-07-24 13:55:31 +0100455 ALOGV("hal_1_2::HalPolicy::ConvertDepthwiseConv2d()");
456
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100457 LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
458
459 if (!input.IsValid())
460 {
461 return Fail("%s: Operation has invalid inputs", __func__);
462 }
463
464 const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
465
466 if (!output)
467 {
468 return Fail("%s: Could not read output 0", __func__);
469 }
470
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100471 const TensorInfo& inputInfo = input.GetTensorInfo();
472 const TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +0100473
474 if (IsDynamicTensor(outputInfo))
475 {
476 return Fail("%s: Dynamic output tensors are not supported", __func__);
477 }
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100478
479 // ArmNN does not currently support non-fixed weights or bias
480 // Find the shape of the weights tensor. In AndroidNN this will be [ 1, H, W, I * M ]
481 const Operand* weightsOperand = GetInputOperand<hal_1_2::HalPolicy>(operation, 1, model);
482
483 if (weightsOperand == nullptr)
484 {
485 return Fail("%s: Operand is invalid", __func__);
486 }
Teresa Charlin3b959602019-10-31 17:05:47 +0000487 if ( weightsOperand->dimensions[0] != 1)
488 {
489 return Fail("%s: Invalid weights; for depthwise convolution, dimension 0 must be 1 but it is %i",
490 __func__, weightsOperand->dimensions[0] );
491 }
492
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100493 DepthwiseConvolution2dDescriptor desc;
494 desc.m_DataLayout = DataLayout::NHWC;
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100495
496 // Determine whether padding is implicit or explicit
497 bool implicitPadding = operation.inputs.size() == 8 ||
498 (operation.inputs.size() >= 9 &&
499 GetInputOperand<hal_1_2::HalPolicy>(operation, 8, model)->type == OperandType::BOOL);
500
501 // Look ahead to find the optional DataLayout, if present
502 const uint32_t dataLayoutFlagIndex = implicitPadding ? 8 : 11;
503 desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, dataLayoutFlagIndex, model, data);
504
505 armnnUtils::DataLayoutIndexed dataLayoutIndexed(desc.m_DataLayout);
506 unsigned int channelsIndex = dataLayoutIndexed.GetChannelsIndex();
507 unsigned int widthIndex = dataLayoutIndexed.GetWidthIndex();
508 unsigned int heightIndex = dataLayoutIndexed.GetHeightIndex();
509
510 // Reinterpret weight data as [ H, W, I, M ]
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100511 TensorShape weightsShape({ weightsOperand->dimensions[1],
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100512 weightsOperand->dimensions[2],
513 inputInfo.GetShape()[channelsIndex],
514 weightsOperand->dimensions[3] / inputInfo.GetShape()[channelsIndex] });
515
516 // Swizzle weight data [ H, W, I, M ] -> [ M, I, H, W ]
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100517 const PermutationVector HWIMToMIHW = { 2U, 3U, 1U, 0U };
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100518
519 const ConstTensorPin weightsPin =
520 ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
521 1,
522 model,
523 data,
524 HWIMToMIHW,
525 &weightsShape);
526
527 // Bias is a 1D tensor
528 const ConstTensorPin biasPin =
529 ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 2, model, data);
530
531 if (!weightsPin.IsValid())
532 {
533 return Fail("%s: Operation has invalid weights", __func__);
534 }
535
536 if (!biasPin.IsValid())
537 {
538 return Fail("%s: Operation has invalid biases", __func__);
539 }
540
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100541 ConstTensor weights = weightsPin.GetConstTensor();
542 ConstTensor bias = biasPin.GetConstTensor();
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100543 SanitizeBiasQuantizationScale(bias.GetInfo(), weights.GetInfo(), inputInfo);
544
545 ActivationFn activation;
546
547 if (implicitPadding)
548 {
549 android::nn::PaddingScheme paddingScheme;
550 if (!GetInputPaddingScheme<hal_1_2::HalPolicy>(operation, 3, paddingScheme, model, data) ||
551 !GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_StrideX, model, data) ||
552 !GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_StrideY, model, data) ||
553 !GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 7, activation, model, data) ||
554 !GetOptionalConvolutionDilationParams<hal_1_2::HalPolicy>(operation, 9, desc, model, data))
555 {
556 return Fail("%s: Operation has invalid inputs (implicit padding)", __func__);
557 }
558
559 const uint32_t kernelX = weights.GetShape()[3];
560 const uint32_t kernelY = weights.GetShape()[2];
561 const uint32_t inputX = inputInfo.GetShape()[widthIndex];
562 const uint32_t inputY = inputInfo.GetShape()[heightIndex];
563
Mike Kelly86b36d42019-07-12 16:39:33 +0100564 CalcPadding(inputX, kernelX, desc.m_StrideX, desc.m_DilationX, desc.m_PadLeft, desc.m_PadRight, paddingScheme);
565 CalcPadding(inputY, kernelY, desc.m_StrideY, desc.m_DilationY, desc.m_PadTop, desc.m_PadBottom, paddingScheme);
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100566 }
567 else if (operation.inputs.size() >= 11)
568 {
569 // explicit padding
570 if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 3, OperandType::INT32, desc.m_PadLeft, model, data) ||
571 !GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_PadRight, model, data) ||
572 !GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_PadTop, model, data) ||
573 !GetInputScalar<hal_1_2::HalPolicy>(operation, 6, OperandType::INT32, desc.m_PadBottom, model, data) ||
574 !GetInputScalar<hal_1_2::HalPolicy>(operation, 7, OperandType::INT32, desc.m_StrideX, model, data) ||
575 !GetInputScalar<hal_1_2::HalPolicy>(operation, 8, OperandType::INT32, desc.m_StrideY, model, data) ||
576 !GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 10, activation, model, data) ||
577 !GetOptionalConvolutionDilationParams<hal_1_2::HalPolicy>(operation, 12, desc, model, data))
578 {
579 return Fail("%s: Operation has invalid inputs (explicit padding)", __func__);
580 }
581 }
582 else
583 {
584 return Fail("%s: Unsupported number of operation inputs", __func__);
585 }
586
587 desc.m_BiasEnabled = true;
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100588 Optional<TensorInfo> biases(bias.GetInfo());
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100589
Ferran Balaguerd30093c2019-07-09 17:04:47 +0100590 bool isSupported = false;
591 FORWARD_LAYER_SUPPORT_FUNC(__func__,
592 IsDepthwiseConvolutionSupported,
593 data.m_Backends,
594 isSupported,
595 inputInfo,
596 outputInfo,
597 desc,
598 weights.GetInfo(),
599 biases);
Aron Virginas-Tar9fd37392019-07-15 18:04:32 +0100600
Ferran Balaguerd30093c2019-07-09 17:04:47 +0100601 if (!isSupported)
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100602 {
603 return false;
604 }
605
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100606 IConnectableLayer* startLayer =
607 data.m_Network->AddDepthwiseConvolution2dLayer(desc, weights, Optional<ConstTensor>(bias));
Aron Virginas-Tar9fd37392019-07-15 18:04:32 +0100608
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100609 if (!startLayer)
610 {
611 return Fail("%s: AddDepthwiseConvolution2dLayer failed", __func__);
612 }
613
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100614 IConnectableLayer* endLayer = ProcessActivation(outputInfo, activation, startLayer, data);
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100615 if (!endLayer)
616 {
617 return Fail("%s: ProcessActivation failed", __func__);
618 }
619
620 input.Connect(startLayer->GetInputSlot(0));
621
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +0100622 return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *endLayer, model, data);
Aron Virginas-Tar24e699d2019-06-17 14:47:46 +0100623}
624
// Converts a HAL DEQUANTIZE operation. A Dequantize that only feeds QSymm8
// weights into FULLY_CONNECTED/LSTM is accepted without adding any layers;
// everything else is forwarded to the shared ::ConvertDequantize implementation.
bool HalPolicy::ConvertDequantize(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertDequantize()");

    if (IsQSymmDequantizeForWeights(operation, model))
    {
        // NOTE: QSymm8 weights are dequantized internally by the driver,
        // therefore this type of Dequantize is implicitly supported
        return true;
    }

    return ::ConvertDequantize<hal_1_2::HalPolicy>(operation, model, data);
}
638
// Converts a HAL DIV operation by forwarding to the shared ::ConvertDiv
// implementation.
bool HalPolicy::ConvertDiv(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertDiv()");
    return ::ConvertDiv<hal_1_2::HalPolicy>(operation, model, data);
}
644
josh minor00a963b2020-01-08 11:55:35 -0600645bool HalPolicy::ConvertElementwiseUnary(const Operation& operation,
646 const Model& model,
647 ConversionData& data,
648 UnaryOperation unaryOperation)
649{
650 ALOGV("hal_1_2::HalPolicy::ConvertElementwiseUnary()");
651 ALOGV("unaryOperation = %s", GetUnaryOperationAsCString(unaryOperation));
652
653 LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
654
655 if (!input.IsValid())
656 {
657 return Fail("%s: Operation has invalid input", __func__);
658 }
659
660 const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
661 if (!output)
662 {
663 return Fail("%s: Could not read output 0", __func__);
664 }
665
666 const TensorInfo& inputInfo = input.GetTensorInfo();
667 const TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
668
669 if (IsDynamicTensor(outputInfo))
670 {
671 return Fail("%s: Dynamic output tensors are not supported", __func__);
672 }
673
674 ElementwiseUnaryDescriptor descriptor(unaryOperation);
675
676 bool isSupported = false;
677 FORWARD_LAYER_SUPPORT_FUNC(__func__,
678 IsElementwiseUnarySupported,
679 data.m_Backends,
680 isSupported,
681 inputInfo,
682 outputInfo,
683 descriptor);
684
685 if (!isSupported)
686 {
687 return false;
688 }
689
690 IConnectableLayer* layer = data.m_Network->AddElementwiseUnaryLayer(descriptor);
691 assert(layer != nullptr);
692
693 input.Connect(layer->GetInputSlot(0));
694
695 return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
696}
697
Narumol Prangnawarat85f96542019-09-12 16:26:29 +0100698bool HalPolicy::ConvertExpandDims(const Operation& operation, const Model& model, ConversionData& data)
699{
700 ALOGV("hal_1_2::HalPolicy::ConvertExpandDims()");
701
702 LayerInputHandle input = ConvertToLayerInputHandle<HalPolicy>(operation, 0, model, data);
703
704 if (!input.IsValid())
705 {
706 return Fail("%s: Operation has invalid input", __func__);
707 }
708
709 const Operand* output = GetOutputOperand<HalPolicy>(operation, 0, model);
710 if (!output)
711 {
712 return Fail("%s: Operation has invalid output", __func__);
713 }
714
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100715 const TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
Narumol Prangnawarat85f96542019-09-12 16:26:29 +0100716 if (IsDynamicTensor(outputInfo))
717 {
718 return Fail("%s: Dynamic output tensors are not supported", __func__);
719 }
720
721 int32_t axis;
722 if (!GetInputScalar<HalPolicy>(operation, 1, OperandType::INT32, axis, model, data))
723 {
724 return Fail("%s: failed to get axis input value", __func__);
725 }
726
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100727 TensorShape targetShape;
Narumol Prangnawarat85f96542019-09-12 16:26:29 +0100728
729 try
730 {
731 targetShape = armnnUtils::ExpandDims(input.GetTensorInfo().GetShape(), axis);
732 }
733 catch (const std::exception &e)
734 {
735 return Fail("%s: %s", __func__, e.what());
736 }
737
738 if (targetShape != outputInfo.GetShape())
739 {
740 return Fail("%s: Shape of the output operand does not match the resolved expanded shape", __func__);
741 }
742
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100743 ReshapeDescriptor reshapeDescriptor;
Narumol Prangnawarat85f96542019-09-12 16:26:29 +0100744 reshapeDescriptor.m_TargetShape = targetShape;
745
746 bool isSupported = false;
747 FORWARD_LAYER_SUPPORT_FUNC(__func__,
748 IsReshapeSupported,
749 data.m_Backends,
750 isSupported,
751 input.GetTensorInfo(),
752 reshapeDescriptor);
753
754 if (!isSupported)
755 {
756 return false;
757 }
758
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100759 IConnectableLayer* layer = data.m_Network->AddReshapeLayer(reshapeDescriptor);
Narumol Prangnawarat85f96542019-09-12 16:26:29 +0100760 assert(layer != nullptr);
761 input.Connect(layer->GetInputSlot(0));
762
763 return SetupAndTrackLayerOutputSlot<HalPolicy>(operation, 0, *layer, model, data);
764}
765
Mike Kelly46272802019-08-14 17:00:48 +0100766bool HalPolicy::ConvertFloor(const Operation& operation, const Model& model, ConversionData& data)
767{
768 ALOGV("hal_1_2::HalPolicy::ConvertFloor()");
769 return ::ConvertFloor<hal_1_2::HalPolicy>(operation, model, data);
770}
771
772bool HalPolicy::ConvertFullyConnected(const Operation& operation, const Model& model, ConversionData& data)
773{
774 ALOGV("hal_1_2::HalPolicy::ConvertFullyConnected()");
775 return ::ConvertFullyConnected<hal_1_2::HalPolicy>(operation, model, data);
776}
777
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100778bool HalPolicy::ConvertGroupedConv2d(const Operation& operation, const Model& model, ConversionData& data)
779{
780 ALOGV("hal_1_2::HalPolicy::ConvertGroupedConv2d()");
781
782 //
783 // Parse data
784 //
785 LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
786 if (!input.IsValid())
787 {
788 return Fail("%s: Operation has invalid inputs", __func__);
789 }
790 const TensorInfo& inputInfo = input.GetTensorInfo();
791
792 const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
793 if (!output)
794 {
795 return Fail("%s: Could not read output 0", __func__);
796 }
797 const TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
798 if (IsDynamicTensor(outputInfo))
799 {
800 return Fail("%s: Dynamic output tensors are not supported", __func__);
801 }
802
803 // Look ahead to determine data layout
804 DataLayout dataLayout = DataLayout::NHWC;
805 if (operation.inputs.size() == 12)
806 {
807 dataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 11, model, data);
808 }
809 else
810 {
811 dataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 8, model, data);
812 }
813
814 // NOTE:
815 // NNAPI weights are always OHWI, i.e. [depth_out, filter_height, filter_width, depth_group],
816 // but Arm NN expects the filter's height and width indices to match the input's height and
817 // width indices so when the DataLayout is NCHW, we need to permute the weights to OIHW
818 const PermutationVector ohwiToOihw = { 0u, 2u, 3u, 1u };
819 const ConstTensorPin weightsPin = (dataLayout == DataLayout::NCHW) ?
820 ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data, ohwiToOihw) :
821 ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data);
822 const ConstTensorPin biasesPin =
823 ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 2, model, data);
824 if (!weightsPin.IsValid() || !biasesPin.IsValid())
825 {
826 return Fail("%s: Operation has invalid inputs", __func__);
827 }
828
829 ConstTensor weights = weightsPin.GetConstTensor();
Aron Virginas-Tar60a346b2019-11-07 14:49:26 +0000830 ConstTensor biases = biasesPin.GetConstTensor();
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100831 SanitizeBiasQuantizationScale(biases.GetInfo(), weights.GetInfo(), inputInfo);
832
833 const TensorShape& inputShape = inputInfo.GetShape();
834 const TensorShape& outputShape = outputInfo.GetShape();
835 const TensorShape& weightsShape = weights.GetShape();
836 const TensorShape& biasesShape = biases.GetShape();
837
838 armnnUtils::DataLayoutIndexed dataLayoutIndexed(dataLayout);
839 const unsigned int channelsIndex = dataLayoutIndexed.GetChannelsIndex();
840 const unsigned int heightIndex = dataLayoutIndexed.GetHeightIndex();
841 const unsigned int widthIndex = dataLayoutIndexed.GetWidthIndex();
842
843 Convolution2dDescriptor desc;
844 desc.m_DataLayout = dataLayout;
845 desc.m_BiasEnabled = true;
846
847 int numGroups;
848 ActivationFn activation;
849
850 if (operation.inputs.size() == 12)
851 {
852 if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 3, OperandType::INT32, desc.m_PadLeft, model, data) ||
853 !GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_PadRight, model, data) ||
854 !GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_PadTop, model, data) ||
855 !GetInputScalar<hal_1_2::HalPolicy>(operation, 6, OperandType::INT32, desc.m_PadBottom, model, data) ||
856 !GetInputScalar<hal_1_2::HalPolicy>(operation, 7, OperandType::INT32, desc.m_StrideX, model, data) ||
857 !GetInputScalar<hal_1_2::HalPolicy>(operation, 8, OperandType::INT32, desc.m_StrideY, model, data) ||
858 !GetInputScalar<hal_1_2::HalPolicy>(operation, 9, OperandType::INT32, numGroups, model, data) ||
859 !GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 10, activation, model, data))
860 {
861 return Fail("%s: Operation has invalid inputs (explicit padding)", __func__);
862 }
863
864 }
865 else if (operation.inputs.size() == 9)
866 {
867 android::nn::PaddingScheme paddingScheme;
868 if (!GetInputPaddingScheme<hal_1_2::HalPolicy>(operation, 3, paddingScheme, model, data) ||
869 !GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_StrideX, model, data) ||
870 !GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_StrideY, model, data) ||
871 !GetInputScalar<hal_1_2::HalPolicy>(operation, 6, OperandType::INT32, numGroups, model, data) ||
872 !GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 7, activation, model, data))
873 {
874 return Fail("%s: Operation has invalid inputs (implicit padding)", __func__);
875 }
876
877 const uint32_t inputX = inputInfo.GetShape()[widthIndex];
878 const uint32_t inputY = inputInfo.GetShape()[heightIndex];
879
880 const uint32_t kernelX = weightsShape[widthIndex];
881 const uint32_t kernelY = weightsShape[heightIndex];
882
883 CalcPadding(inputX, kernelX, desc.m_StrideX, desc.m_PadLeft, desc.m_PadRight, paddingScheme);
884 CalcPadding(inputY, kernelY, desc.m_StrideY, desc.m_PadTop, desc.m_PadBottom, paddingScheme);
885 }
886 else
887 {
888 return Fail("%s: Unsupported number of operation inputs", __func__);
889 }
890
891 const unsigned int outputChannels = outputShape[channelsIndex];
892
893 const unsigned int channelsPerGroup = weightsShape[channelsIndex];
894 const unsigned int channelMultiplier = outputChannels / numGroups;
895
896 //
897 // Validate all relevant inputs
898 //
899 if (numGroups <= 0)
900 {
901 return Fail("%s: Number of groups must be greater than 0. Got: %d", __func__, numGroups);
902 }
903
904 if (outputChannels % numGroups != 0u)
905 {
906 return Fail("%s: Output channels must be divisible by the number of groups", __func__);
907 }
908
909 //
910 // Set up Splitter layer
911 //
912 unsigned int splitterDimSizes[4] = { inputShape[0], inputShape[1], inputShape[2], inputShape[3] };
913 splitterDimSizes[channelsIndex] /= numGroups; // split in depth
914
915 TensorInfo splitterOutputInfo(4,
916 splitterDimSizes,
917 inputInfo.GetDataType(),
918 inputInfo.GetQuantizationScale(),
919 inputInfo.GetQuantizationOffset());
920
921 std::vector<std::reference_wrapper<TensorInfo>> splitterOutputInfos(numGroups, std::ref(splitterOutputInfo));
922
923 ViewsDescriptor splitterDesc(numGroups);
924 for (unsigned int group = 0u; group < numGroups; ++group)
925 {
926 splitterDesc.SetViewOriginCoord(group, channelsIndex, splitterDimSizes[channelsIndex] * group);
927 for (unsigned int dimIdx = 0u; dimIdx < 4u; dimIdx++)
928 {
929 splitterDesc.SetViewSize(group, dimIdx, splitterDimSizes[dimIdx]);
930 }
931 }
932
933 bool isSupported = false;
934 FORWARD_LAYER_SUPPORT_FUNC(__func__,
935 IsSplitterSupported,
936 data.m_Backends,
937 isSupported,
938 inputInfo,
939 splitterOutputInfos,
940 splitterDesc);
941 if (!isSupported)
942 {
943 return false;
944 }
945
946 IConnectableLayer* splitterLayer = data.m_Network->AddSplitterLayer(splitterDesc);
947 if (!splitterLayer)
948 {
949 return Fail("%s: Failed to add SplitterLayer", __func__);
950 }
951
952 input.Connect(splitterLayer->GetInputSlot(0));
953 for (unsigned int group = 0u; group < splitterLayer->GetNumOutputSlots(); ++group)
954 {
955 splitterLayer->GetOutputSlot(group).SetTensorInfo(splitterOutputInfo);
956 }
957
958 //
959 // Set up Convolution2d layers for each group
960 //
Aron Virginas-Tar60a346b2019-11-07 14:49:26 +0000961
962 // Set up group tensor shapes
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100963 TensorShape groupInputShape(inputShape);
964 groupInputShape[channelsIndex] = channelsPerGroup;
965
966 TensorShape groupOutputShape(outputShape);
967 groupOutputShape[channelsIndex] = 1;
968
969 TensorShape groupWeightsShape(weightsShape);
970 groupWeightsShape[0] /= channelMultiplier * numGroups;
971
972 TensorShape groupBiasesShape({ 1 });
973
Aron Virginas-Tar60a346b2019-11-07 14:49:26 +0000974 // Set up group tensor infos
975 TensorInfo groupInputInfo(inputInfo);
976 groupInputInfo.SetShape(groupInputShape);
977
978 const TensorInfo& weightsInfo = weights.GetInfo();
979 TensorInfo groupWeightsInfo(weightsInfo);
980 groupWeightsInfo.SetShape(groupWeightsShape);
981
982 const TensorInfo& biasesInfo = biases.GetInfo();
983 TensorInfo groupBiasesInfo(biasesInfo);
984 groupBiasesInfo.SetShape(groupBiasesShape);
985
986 TensorInfo groupOutputInfo(outputInfo);
987 groupOutputInfo.SetShape(groupOutputShape);
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100988
989 const unsigned int weightsDataTypeSize = GetDataTypeSize(groupWeightsInfo.GetDataType());
990 const unsigned int biasesDataTypeSize = GetDataTypeSize(groupBiasesInfo.GetDataType());
991
Aron Virginas-Tar60a346b2019-11-07 14:49:26 +0000992 std::vector<IConnectableLayer*> convLayers(numGroups * channelMultiplier, nullptr);
Teresa Charlin8f6429d2019-10-01 13:10:15 +0100993 for (unsigned int group = 0u; group < numGroups; ++group)
994 {
995 for (unsigned int m = 0u; m < channelMultiplier; ++m)
996 {
997 auto index = group * channelMultiplier + m;
998
999 const unsigned int weightsDataOffset = groupWeightsShape.GetNumElements() * index * weightsDataTypeSize;
1000 const unsigned int biasesDataOffset = groupBiasesShape.GetNumElements() * index * biasesDataTypeSize;
1001
Aron Virginas-Tar60a346b2019-11-07 14:49:26 +00001002 if (weightsInfo.HasPerAxisQuantization())
1003 {
1004 // Extract per-axis quantization scales for group weights
1005 const std::vector<float>& weightsQuantScales = weightsInfo.GetQuantizationScales();
1006 groupWeightsInfo.SetQuantizationScales(
1007 std::vector<float>(weightsQuantScales.begin() + index,
1008 weightsQuantScales.begin() + index + groupWeightsShape[0]));
1009
1010 // Extract per-axis quantization scales for group biases
1011 const std::vector<float>& biasesQuantScales = biasesInfo.GetQuantizationScales();
1012 groupBiasesInfo.SetQuantizationScales(
1013 std::vector<float>(biasesQuantScales.begin() + index,
1014 biasesQuantScales.begin() + index + groupWeightsShape[0]));
1015 }
1016
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001017 // Extract weights and biases data for current group convolution
1018 ConstTensor groupWeights(groupWeightsInfo,
1019 static_cast<const void *>(reinterpret_cast<const char *>(weights.GetMemoryArea()) +
1020 weightsDataOffset));
1021 ConstTensor groupBiases(groupBiasesInfo,
1022 static_cast<const void *>(reinterpret_cast<const char *>(biases.GetMemoryArea()) +
1023 biasesDataOffset));
1024
1025 isSupported = false;
1026 FORWARD_LAYER_SUPPORT_FUNC(__func__,
1027 IsConvolution2dSupported,
1028 data.m_Backends,
1029 isSupported,
1030 groupInputInfo,
1031 groupOutputInfo,
1032 desc,
1033 groupWeightsInfo,
1034 Optional<TensorInfo>(groupBiasesInfo));
1035 if (!isSupported)
1036 {
1037 return false;
1038 }
1039
1040 IConnectableLayer *convLayer =
1041 data.m_Network->AddConvolution2dLayer(desc, groupWeights, Optional<ConstTensor>(groupBiases));
1042 if (!convLayer)
1043 {
1044 return Fail("%s: AddConvolution2dLayer failed", __func__);
1045 }
1046
1047 splitterLayer->GetOutputSlot(group).Connect(convLayer->GetInputSlot(0));
1048 convLayer->GetOutputSlot(0).SetTensorInfo(groupOutputInfo);
1049
1050 convLayers[index] = convLayer;
1051 }
1052 }
1053
1054 //
1055 // Set up Concat layer
1056 //
1057 ConcatDescriptor concatDescriptor(outputInfo.GetShape()[channelsIndex]);
1058 for (unsigned int group = 0u; group < numGroups; ++group)
1059 {
1060 for (unsigned int m = 0u; m < channelMultiplier; ++m)
1061 {
1062 auto index = group * channelMultiplier + m;
1063 concatDescriptor.SetViewOriginCoord(index, channelsIndex, index);
1064 concatDescriptor.SetConcatAxis(channelsIndex);
1065 }
1066 }
1067
1068 isSupported = false;
1069 FORWARD_LAYER_SUPPORT_FUNC(__func__,
1070 IsConcatSupported,
1071 data.m_Backends,
1072 isSupported,
1073 std::vector<const TensorInfo*>(numGroups * channelMultiplier, &groupOutputInfo),
1074 outputInfo,
1075 concatDescriptor);
1076 if (!isSupported)
1077 {
1078 return false;
1079 }
1080
1081 IConnectableLayer* concatLayer = data.m_Network->AddConcatLayer(concatDescriptor);
1082 if (!concatLayer)
1083 {
1084 return Fail("%s: AddConcatLayer failed", __func__);
1085 }
1086
1087 for (unsigned int group = 0u; group < numGroups; ++group)
1088 {
1089 for (unsigned int m = 0u; m < channelMultiplier; ++m)
1090 {
1091 auto index = group * channelMultiplier + m;
1092 convLayers[index]->GetOutputSlot(0).Connect(concatLayer->GetInputSlot(index));
1093 }
1094 }
1095 concatLayer->GetOutputSlot(0).SetTensorInfo(outputInfo);
1096
1097 //
1098 // Set up Activation layer (if it is set)
1099 //
1100 IConnectableLayer* endLayer = ProcessActivation(outputInfo, activation, concatLayer, data);
1101 if (!endLayer)
1102 {
1103 return Fail("%s: ProcessActivation failed", __func__);
1104 }
1105
1106 return SetupAndTrackLayerOutputSlot<HalPolicy>(operation, 0, *endLayer, model, data);
1107}
1108
Aron Virginas-Tara2a73802019-10-09 15:30:40 +01001109bool HalPolicy::ConvertInstanceNormalization(const Operation& operation, const Model& model, ConversionData& data)
1110{
1111 ALOGV("hal_1_2::HalPolicy::ConvertInstanceNormalization()");
1112
1113 LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
1114 if (!input.IsValid())
1115 {
1116 return Fail("%s: Operation has an invalid input 0", __func__);
1117 }
1118
1119 const Operand* output = GetOutputOperand<HalPolicy>(operation, 0, model);
1120 if (!output)
1121 {
1122 return Fail("%s: Operation has an invalid output", __func__);
1123 }
1124
1125 const TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
1126 if (IsDynamicTensor(outputInfo))
1127 {
1128 return Fail("%s: Dynamic output tensors are not supported", __func__);
1129 }
1130
1131 // Determine data type of input tensor
1132 OperandType inputType;
1133 if (!GetOperandType<hal_1_2::HalPolicy>(operation, 0, model, inputType))
1134 {
1135 return Fail("%s: Operation has invalid inputs", __func__);
1136 }
1137
1138 InstanceNormalizationDescriptor desc;
1139
1140 // Read gamma, beta & epsilon
1141 if (inputType == OperandType::TENSOR_FLOAT16)
1142 {
1143 Half fp16Gamma;
1144 Half fp16Beta;
1145 Half fp16Epsilon;
1146
1147 if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 1, OperandType::FLOAT16, fp16Gamma, model, data) ||
1148 !GetInputScalar<hal_1_2::HalPolicy>(operation, 2, OperandType::FLOAT16, fp16Beta, model, data) ||
1149 !GetInputScalar<hal_1_2::HalPolicy>(operation, 3, OperandType::FLOAT16, fp16Epsilon, model, data))
1150 {
1151 return Fail("%s: Operation has invalid inputs (FLOAT16)", __func__);
1152 }
1153
1154 desc.m_Gamma = static_cast<float>(fp16Gamma);
1155 desc.m_Beta = static_cast<float>(fp16Beta);
1156 desc.m_Eps = static_cast<float>(fp16Epsilon);
1157 }
1158 else if (inputType == OperandType::TENSOR_FLOAT32)
1159 {
1160 if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 1, OperandType::FLOAT32, desc.m_Gamma, model, data) ||
1161 !GetInputScalar<hal_1_2::HalPolicy>(operation, 2, OperandType::FLOAT32, desc.m_Beta, model, data) ||
1162 !GetInputScalar<hal_1_2::HalPolicy>(operation, 3, OperandType::FLOAT32, desc.m_Eps, model, data))
1163 {
1164 return Fail("%s: Operation has invalid inputs (FLOAT32)", __func__);
1165 }
1166 }
1167 else
1168 {
1169 return Fail("%s: Unsupported input tensor type: %d", __func__, inputType);
1170 }
1171
1172 desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 4, model, data);
1173
1174 bool isSupported = false;
1175 FORWARD_LAYER_SUPPORT_FUNC(__func__,
1176 IsInstanceNormalizationSupported,
1177 data.m_Backends,
1178 isSupported,
1179 input.GetTensorInfo(),
1180 outputInfo,
1181 desc);
1182 if (!isSupported)
1183 {
1184 return false;
1185 }
1186
1187 IConnectableLayer* layer = data.m_Network->AddInstanceNormalizationLayer(desc);
1188 input.Connect(layer->GetInputSlot(0));
1189
1190 return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
1191}
1192
Mike Kelly46272802019-08-14 17:00:48 +01001193bool HalPolicy::ConvertL2Normalization(const Operation& operation, const Model& model, ConversionData& data)
1194{
1195 ALOGV("hal_1_2::HalPolicy::ConvertL2Normalization()");
1196 return ::ConvertL2Normalization<hal_1_2::HalPolicy>(operation, model, data);
1197}
1198
Sadik Armagan15d63e22019-07-26 16:59:35 +01001199bool HalPolicy::ConvertL2Pool2d(const Operation& operation, const Model& model, ConversionData& data)
1200{
1201 ALOGV("hal_1_2::HalPolicy::ConvertL2Pool2d()");
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001202 return ConvertPooling2d<hal_1_2::HalPolicy>(operation, __func__, PoolingAlgorithm::L2, model, data);
Sadik Armagan15d63e22019-07-26 16:59:35 +01001203}
1204
Mike Kelly46272802019-08-14 17:00:48 +01001205bool HalPolicy::ConvertLocalResponseNormalization(const Operation& operation,
1206 const Model& model,
1207 ConversionData& data)
1208{
1209 ALOGV("hal_1_2::HalPolicy::ConvertLocalResponseNormalization()");
1210 return ::ConvertLocalResponseNormalization<hal_1_2::HalPolicy>(operation, model, data);
1211}
1212
1213bool HalPolicy::ConvertLogistic(const Operation& operation, const Model& model, ConversionData& data)
1214{
1215 ALOGV("hal_1_2::HalPolicy::ConvertLogistic()");
1216 return ::ConvertLogistic<hal_1_2::HalPolicy>(operation, model, data);
1217}
1218
Aron Virginas-Tar75e67792019-10-15 13:33:03 +01001219bool HalPolicy::ConvertLogSoftmax(const Operation& operation, const Model& model, ConversionData& data)
1220{
1221 ALOGV("hal_1_2::HalPolicy::ConvertLogSoftmax()");
1222
1223 LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
1224 if (!input.IsValid())
1225 {
1226 return Fail("%s: Failed to read input 0", __func__);
1227 }
1228
1229 const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
1230 if (!output)
1231 {
1232 return Fail("%s: Failed to read output", __func__);
1233 }
1234
1235 const TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
1236 if (IsDynamicTensor(outputInfo))
1237 {
1238 return Fail("%s: Dynamic output tensors are not supported", __func__);
1239 }
1240
1241 // Determine data type of input tensor
1242 OperandType inputType;
1243 if (!GetOperandType<hal_1_2::HalPolicy>(operation, 0, model, inputType))
1244 {
1245 return Fail("%s: Operation has invalid inputs", __func__);
1246 }
1247
1248 LogSoftmaxDescriptor descriptor;
1249
1250 // Read beta
1251 if (inputType == OperandType::TENSOR_FLOAT16)
1252 {
1253 Half fp16Beta;
1254 if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 1, OperandType::FLOAT16, fp16Beta, model, data))
1255 {
1256 return Fail("%s: Failed to read input 1 (FLOAT16)", __func__);
1257 }
1258
1259 descriptor.m_Beta = static_cast<float>(fp16Beta);
1260 }
1261 else if (inputType == OperandType::TENSOR_FLOAT32)
1262 {
1263 if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 1, OperandType::FLOAT32, descriptor.m_Beta, model, data))
1264 {
1265 return Fail("%s: Failed to read input 1 (FLOAT32)", __func__);
1266 }
1267 }
1268 else
1269 {
1270 return Fail("%s: Unsupported input tensor type: %d", __func__, inputType);
1271 }
1272
1273 // Read axis
1274 if (!GetInputInt32<hal_1_2::HalPolicy>(operation, 2, descriptor.m_Axis, model, data))
1275 {
1276 return Fail("%s: Failed to read input 2", __func__);
1277 }
1278
1279 bool isSupported = false;
1280 FORWARD_LAYER_SUPPORT_FUNC(__func__,
1281 IsLogSoftmaxSupported,
1282 data.m_Backends,
1283 isSupported,
1284 input.GetTensorInfo(),
1285 outputInfo,
1286 descriptor);
1287 if (!isSupported)
1288 {
1289 return false;
1290 }
1291
Aron Virginas-Tar3e0982b2019-10-29 14:25:09 +00001292 IConnectableLayer* layer = data.m_Network->AddLogSoftmaxLayer(descriptor);
Aron Virginas-Tar75e67792019-10-15 13:33:03 +01001293 if (!layer)
1294 {
1295 return Fail("%s: AddLogSoftmaxLayer() returned nullptr", __func__);
1296 }
1297
1298 input.Connect(layer->GetInputSlot(0));
1299
1300 return SetupAndTrackLayerOutputSlot<HalPolicy>(operation, 0, *layer, model, data);
1301}
1302
Sadik Armagan15d63e22019-07-26 16:59:35 +01001303bool HalPolicy::ConvertMaxPool2d(const Operation& operation, const Model& model, ConversionData& data)
1304{
1305 ALOGV("hal_1_2::HalPolicy::ConvertMaxPool2d()");
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001306 return ConvertPooling2d<hal_1_2::HalPolicy>(operation, __func__, PoolingAlgorithm::Max, model, data);
Sadik Armagan15d63e22019-07-26 16:59:35 +01001307}
1308
Narumol Prangnawarat95b1ef62019-07-15 12:02:20 +01001309bool HalPolicy::ConvertMaximum(const Operation& operation, const Model& model, ConversionData& data)
1310{
Aron Virginas-Tar29404fb2019-07-24 13:55:31 +01001311 ALOGV("hal_1_2::HalPolicy::ConvertMaximum()");
1312
Narumol Prangnawarat95b1ef62019-07-15 12:02:20 +01001313 LayerInputHandle input0 = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
1314 LayerInputHandle input1 = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 1, model, data);
1315
1316 if (!input0.IsValid() || !input1.IsValid())
1317 {
1318 return Fail("%s: Operation has invalid inputs", __func__);
1319 }
1320
1321 const Operand* outputOperand = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
1322 if (!outputOperand)
1323 {
1324 return Fail("%s: Could not read output", __func__);
1325 }
1326
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001327 const TensorInfo& outInfo = GetTensorInfoForOperand(*outputOperand);
Aron Virginas-Tar573a8fa2019-07-23 14:01:37 +01001328 if (IsDynamicTensor(outInfo))
Narumol Prangnawarat95b1ef62019-07-15 12:02:20 +01001329 {
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +01001330 return Fail("%s: Dynamic output tensors are not supported", __func__);
Narumol Prangnawarat95b1ef62019-07-15 12:02:20 +01001331 }
1332
Aron Virginas-Tard7593232019-07-16 13:17:06 +01001333 bool isSupported = false;
1334 FORWARD_LAYER_SUPPORT_FUNC(__func__,
1335 IsMaximumSupported,
1336 data.m_Backends,
1337 isSupported,
1338 input0.GetTensorInfo(),
1339 input1.GetTensorInfo(),
1340 outInfo);
1341
1342 if (!isSupported)
Narumol Prangnawarat95b1ef62019-07-15 12:02:20 +01001343 {
1344 return false;
1345 }
1346
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001347 IConnectableLayer* layer = data.m_Network->AddMaximumLayer();
Narumol Prangnawarat95b1ef62019-07-15 12:02:20 +01001348 assert(layer != nullptr);
Sadik Armagan64b19b52019-08-19 09:49:58 +01001349 bool isReshapeSupported = BroadcastTensor(input0, input1, layer, data);
1350 if (!isReshapeSupported)
1351 {
1352 return false;
1353 }
Narumol Prangnawarat95b1ef62019-07-15 12:02:20 +01001354
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +01001355 return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
Narumol Prangnawarat95b1ef62019-07-15 12:02:20 +01001356}
1357
Mike Kelly46272802019-08-14 17:00:48 +01001358bool HalPolicy::ConvertMean(const Operation& operation, const Model& model, ConversionData& data)
1359{
1360 ALOGV("hal_1_2::HalPolicy::ConvertMean()");
1361 return ::ConvertMean<hal_1_2::HalPolicy>(operation, model, data);
1362}
1363
Ellen Norris-Thompson1cb29aa2019-07-11 17:27:37 +01001364bool HalPolicy::ConvertMinimum(const Operation& operation, const Model& model, ConversionData& data)
1365{
Aron Virginas-Tar29404fb2019-07-24 13:55:31 +01001366 ALOGV("hal_1_2::HalPolicy::ConvertMinimum()");
1367
Ellen Norris-Thompson1cb29aa2019-07-11 17:27:37 +01001368 LayerInputHandle input0 = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
1369 LayerInputHandle input1 = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 1, model, data);
1370
1371 if (!input0.IsValid() || !input1.IsValid())
1372 {
1373 return Fail("%s: Operation has invalid inputs", __func__);
1374 }
1375
1376 const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
1377 if (!output)
1378 {
1379 return Fail("%s: Could not read output 0", __func__);
1380 }
1381
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001382 const TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
Aron Virginas-Tar573a8fa2019-07-23 14:01:37 +01001383 if (IsDynamicTensor(outputInfo))
Ellen Norris-Thompson1cb29aa2019-07-11 17:27:37 +01001384 {
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +01001385 return Fail("%s: Dynamic output tensors are not supported", __func__);
Ellen Norris-Thompson1cb29aa2019-07-11 17:27:37 +01001386 }
1387
1388 bool isSupported = false;
1389 FORWARD_LAYER_SUPPORT_FUNC(__func__,
1390 IsMinimumSupported,
1391 data.m_Backends,
1392 isSupported,
1393 input0.GetTensorInfo(),
1394 input1.GetTensorInfo(),
1395 outputInfo);
1396
1397 if (!isSupported)
1398 {
1399 return false;
1400 }
1401
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001402 IConnectableLayer* const layer = data.m_Network->AddMinimumLayer();
Ellen Norris-Thompson1cb29aa2019-07-11 17:27:37 +01001403 assert(layer != nullptr);
Sadik Armagan64b19b52019-08-19 09:49:58 +01001404 bool isReshapeSupported = BroadcastTensor(input0, input1, layer, data);
1405 if (!isReshapeSupported)
1406 {
1407 return false;
1408 }
Ellen Norris-Thompson1cb29aa2019-07-11 17:27:37 +01001409
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +01001410 return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
Ellen Norris-Thompson1cb29aa2019-07-11 17:27:37 +01001411}
1412
Mike Kelly46272802019-08-14 17:00:48 +01001413bool HalPolicy::ConvertMul(const Operation& operation, const Model& model, ConversionData& data)
1414{
1415 ALOGV("hal_1_2::HalPolicy::ConvertMul()");
1416 return ::ConvertMul<hal_1_2::HalPolicy>(operation, model, data);
1417}
1418
Aron Virginas-Tarc921f6b2019-07-25 10:14:33 +01001419bool HalPolicy::ConvertPad(const Operation& operation, const Model& model, ConversionData& data)
1420{
1421 ALOGV("hal_1_2::HalPolicy::ConvertPad()");
1422 return ::ConvertPad<hal_1_2::HalPolicy>(operation, model, data);
1423}
1424
Aron Virginas-Tarcb8ac842019-07-05 15:47:07 +01001425bool HalPolicy::ConvertPadV2(const Operation& operation, const Model& model, ConversionData& data)
1426{
Aron Virginas-Tar29404fb2019-07-24 13:55:31 +01001427 ALOGV("hal_1_2::HalPolicy::ConvertPadV2()");
1428
Aron Virginas-Tarcb8ac842019-07-05 15:47:07 +01001429 LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
1430 if (!input.IsValid())
1431 {
1432 return Fail("%s: Could not read input 0", __func__);
1433 }
1434
Aron Virginas-Tar366e0a62019-07-10 13:01:41 +01001435 const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
1436 if (!output)
1437 {
1438 return Fail("%s: Could not read output", __func__);
1439 }
1440
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001441 const TensorInfo& inputInfo = input.GetTensorInfo();
Aron Virginas-Tarcb8ac842019-07-05 15:47:07 +01001442 unsigned int rank = inputInfo.GetNumDimensions();
1443
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001444 PadDescriptor descriptor;
Aron Virginas-Tarcb8ac842019-07-05 15:47:07 +01001445 if (!ConvertPaddings<hal_1_2::HalPolicy>(operation, model, data, rank, descriptor))
1446 {
1447 return Fail("%s: Could not convert paddings", __func__);
1448 }
1449
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001450 const TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
Aron Virginas-Tar573a8fa2019-07-23 14:01:37 +01001451 if (IsDynamicTensor(outputInfo))
Sadik Armagan310d8ff2019-07-11 10:53:38 +01001452 {
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +01001453 return Fail("%s: Dynamic output tensors are not supported", __func__);
Sadik Armagan310d8ff2019-07-11 10:53:38 +01001454 }
1455
Aron Virginas-Tarcb8ac842019-07-05 15:47:07 +01001456 // Determine type of padding value
1457 OperandType operandType0;
1458 OperandType operandType2;
1459
1460 if (!GetOperandType<hal_1_2::HalPolicy>(operation, 0, model, operandType0) ||
1461 !GetOperandType<hal_1_2::HalPolicy>(operation, 2, model, operandType2))
1462 {
1463 return Fail("%s: Operation has invalid inputs", __func__);
1464 }
1465
1466 // Read value to use for padding
1467 if (operandType0 == OperandType::TENSOR_FLOAT16 && operandType2 == OperandType::FLOAT16)
1468 {
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001469 Half f16PadValue;
Aron Virginas-Tarcb8ac842019-07-05 15:47:07 +01001470 if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 2, operandType2, f16PadValue, model, data))
1471 {
1472 return Fail("%s: Could not read input 2 (FLOAT16)", __func__);
1473 }
1474
1475 descriptor.m_PadValue = f16PadValue;
1476 }
1477 else if (operandType0 == OperandType::TENSOR_FLOAT32 && operandType2 == OperandType::FLOAT32)
1478 {
1479 if (!GetInputFloat32<hal_1_2::HalPolicy>(operation, 2, descriptor.m_PadValue, model, data))
1480 {
1481 return Fail("%s: Could not read input 2 (FLOAT32)", __func__);
1482 }
1483 }
1484 else if (operandType0 == OperandType::TENSOR_QUANT8_ASYMM && operandType2 == OperandType::INT32)
1485 {
Mike Kelly3c673942019-07-25 09:26:06 +01001486 int32_t intPadValue = 0;
1487 if (!GetInputInt32<hal_1_2::HalPolicy>(operation, 2, intPadValue, model, data))
Aron Virginas-Tarcb8ac842019-07-05 15:47:07 +01001488 {
1489 return Fail("%s: Could not read input 2 (INT32)", __func__);
1490 }
Mike Kelly3c673942019-07-25 09:26:06 +01001491 descriptor.m_PadValue = intPadValue;
Aron Virginas-Tarcb8ac842019-07-05 15:47:07 +01001492 }
1493 else
1494 {
1495 return Fail("%s: Operation has invalid inputs: type mismatch", __func__);
1496 }
1497
Ferran Balaguerd30093c2019-07-09 17:04:47 +01001498 bool isSupported = false;
1499 FORWARD_LAYER_SUPPORT_FUNC(__func__,
1500 IsPadSupported,
1501 data.m_Backends,
1502 isSupported,
1503 inputInfo,
1504 outputInfo,
1505 descriptor);
1506 if (!isSupported)
Aron Virginas-Tarcb8ac842019-07-05 15:47:07 +01001507 {
1508 return false;
1509 }
1510
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001511 IConnectableLayer* const layer = data.m_Network->AddPadLayer(descriptor);
Aron Virginas-Tarcb8ac842019-07-05 15:47:07 +01001512 assert(layer != nullptr);
1513 input.Connect(layer->GetInputSlot(0));
1514 layer->GetOutputSlot(0).SetTensorInfo(outputInfo);
1515
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +01001516 return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
Aron Virginas-Tarcb8ac842019-07-05 15:47:07 +01001517}
1518
Matteo Martincigh17ffff32019-06-27 14:12:55 +01001519bool HalPolicy::ConvertPrelu(const Operation& operation, const Model& model, ConversionData& data)
1520{
Aron Virginas-Tar29404fb2019-07-24 13:55:31 +01001521 ALOGV("hal_1_2::HalPolicy::ConvertPrelu()");
1522
Matteo Martincigh17ffff32019-06-27 14:12:55 +01001523 LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
1524 LayerInputHandle alpha = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 1, model, data);
1525
1526 if (!input.IsValid() || !alpha.IsValid())
1527 {
1528 return Fail("%s: Operation has invalid inputs", __func__);
1529 }
1530
1531 const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
1532
1533 if (!output)
1534 {
Matteo Martincigh0bd89a82019-07-02 16:53:10 +01001535 return Fail("%s: Could not read output", __func__);
Matteo Martincigh17ffff32019-06-27 14:12:55 +01001536 }
1537
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001538 const TensorInfo& inputInfo = input.GetTensorInfo();
1539 const TensorInfo& alphaInfo = alpha.GetTensorInfo();
1540 const TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
Aron Virginas-Tarf03fcf02019-07-09 17:44:24 +01001541
Aron Virginas-Tar573a8fa2019-07-23 14:01:37 +01001542 if (IsDynamicTensor(outputInfo))
Aron Virginas-Tarf03fcf02019-07-09 17:44:24 +01001543 {
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +01001544 return Fail("%s: Dynamic output tensors are not supported", __func__);
Aron Virginas-Tarf03fcf02019-07-09 17:44:24 +01001545 }
Matteo Martincigh17ffff32019-06-27 14:12:55 +01001546
Ferran Balaguerd30093c2019-07-09 17:04:47 +01001547 bool isSupported = false;
1548 FORWARD_LAYER_SUPPORT_FUNC(__func__,
1549 IsPreluSupported,
1550 data.m_Backends,
1551 isSupported,
1552 inputInfo,
1553 alphaInfo,
1554 outputInfo);
1555 if (!isSupported)
Matteo Martincigh17ffff32019-06-27 14:12:55 +01001556 {
1557 return false;
1558 }
1559
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001560 IConnectableLayer* const layer = data.m_Network->AddPreluLayer();
Matteo Martincigh17ffff32019-06-27 14:12:55 +01001561
1562 if (!layer)
1563 {
1564 return Fail("%s: AddPreluLayer failed", __func__);
1565 }
1566
Sadik Armagan64b19b52019-08-19 09:49:58 +01001567 bool isReshapeSupported = BroadcastTensor(input, alpha, layer, data);
1568 if (!isReshapeSupported)
1569 {
1570 return false;
1571 }
Matteo Martincigh17ffff32019-06-27 14:12:55 +01001572
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +01001573 return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
Matteo Martincigh17ffff32019-06-27 14:12:55 +01001574}
1575
Sadik Armagan5a476a82019-07-30 09:43:18 +01001576bool HalPolicy::ConvertQuantize(const Operation& operation, const Model& model, ConversionData& data)
1577{
1578 ALOGV("hal_1_2::HalPolicy::ConvertQuantize()");
1579
1580 LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
1581 if (!input.IsValid())
1582 {
1583 return Fail("%s: Operation has invalid input", __func__);
1584 }
1585
1586 const Operand* const outputOperand = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
1587 if (!outputOperand)
1588 {
1589 return Fail("%s: Operation has invalid outputs", __func__);
1590 }
1591
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001592 const TensorInfo& outputInfo = GetTensorInfoForOperand(*outputOperand);
Sadik Armagan5a476a82019-07-30 09:43:18 +01001593 if (IsDynamicTensor(outputInfo))
1594 {
1595 return Fail("%s: Dynamic output tensors are not supported", __func__);
1596 }
1597
1598 bool isSupported = false;
1599 FORWARD_LAYER_SUPPORT_FUNC(__func__,
1600 IsQuantizeSupported,
1601 data.m_Backends,
1602 isSupported,
1603 input.GetTensorInfo(),
1604 outputInfo);
1605 if (!isSupported)
1606 {
1607 return false;
1608 }
1609
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001610 IConnectableLayer* const layer = data.m_Network->AddQuantizeLayer();
Sadik Armagan5a476a82019-07-30 09:43:18 +01001611 assert(layer != nullptr);
1612 input.Connect(layer->GetInputSlot(0));
1613
1614 return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
1615}
1616
// Converts an ANEURALNETWORKS_QUANTIZED_16BIT_LSTM operation into an ArmNN
// QuantizedLstm layer. Reads the three runtime inputs (input, previous cell
// state, previous output), the twelve constant weight/bias tensors, validates
// backend support, then wires the layer and registers both outputs.
// NOTE: all weight/bias operands must be constants; slot numbers follow the
// NNAPI operand ordering documented inline below.
bool HalPolicy::ConvertQuantizedLstm(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertQuantizedLstm()");

    //Inputs:
    // 0: The input: A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape [numBatches, inputSize]
    //    specifying the input to the LSTM cell. Tensor is quantized with a fixed quantization range of -1, 127/128.
    LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
    if (!input.IsValid())
    {
        return Fail("%s: Could not read input 0: input", __func__);
    }

    //13: The previous cell state: A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT16_SYMM and shape
    //    [numBatches, outputSize] specifying the cell state from the previous time step of the LSTM cell.
    //    It is quantized using a quantization range of -2^4, 2^4 * 32767/32768.
    LayerInputHandle previousCellStateIn = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 13, model, data);
    if (!previousCellStateIn.IsValid())
    {
        return Fail("%s: Could not read input 13: previousCellStateIn", __func__);
    }

    // 14: The previous output state: A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //     [numBathes, outputSize] specifying the output of the LSTM cell from previous time-step. Tensor
    //     is quantized with a fixed quantization range of -1, 127/128.
    LayerInputHandle previousOutputIn = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 14, model, data);
    if (!previousOutputIn.IsValid())
    {
        return Fail("%s: Could not read input 14: previousOutputIn", __func__);
    }

    // Get the input tensors:
    // 1: The input-to-input weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //    [outputSize, inputSize] specifying input-to-input part of weights for fully-connected layer inside the
    //    LSTM cell. Quantization zero point and scale must be the same across all the weights.
    const ConstTensorPin inputToInputWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data);

    // 2: The input-to-forget weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //    [outputSize, inputSize] specifying input-to-forget part of weights for fully-connected layer inside the
    //    LSTM cell. Quantization zero point and scale must be the same across all the weights.
    const ConstTensorPin inputToForgetWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 2, model, data);

    // 3: The input-to-cell weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //    [outputSize, inputSize] specifying input-to-cell part of weights for fully-connected layer inside the
    //    LSTM cell. Quantization zero point and scale must be the same across all the weights.
    const ConstTensorPin inputToCellWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 3, model, data);

    // 4: The input-to-output weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //    [outputSize, inputSize] specifying input-to-output part of weights for fully-connected layer inside the
    //    LSTM cell. Quantization zero point and scale must be the same across all the weights.
    const ConstTensorPin inputToOutputWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 4, model, data);

    // 5: The recurrent-to-input weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //    [outputSize, outputSize] specifying recurrent-to-input part of weights for fully-connected layer inside
    //    the LSTM cell. Quantization zero point and scale must be the same across all the weights.
    const ConstTensorPin recurrentToInputWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 5, model, data);

    // 6: The recurrent-to-forget weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //    [outputSize, outputSize] specifying recurrent-to-forget part of weights for fully-connected layer inside
    //    the LSTM cell. Quantization zero point and scale must be the same across all the weights.
    const ConstTensorPin recurrentToForgetWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 6, model, data);

    // 7: The recurrent-to-cell weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //    [outputSize, outputSize] specifying recurrent-to-cell part of weights for fully-connected layer inside
    //    the LSTM cell. Quantization zero point and scale must be the same across all the weights.
    const ConstTensorPin recurrentToCellWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 7, model, data);

    // 8: The recurrent-to-output weights. A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape
    //    [outputSize, outputSize] specifying recurrent-to-output part of weights for fully-connected layer inside
    //    the LSTM cell. Quantization zero point and scale must be the same across all the weights.
    const ConstTensorPin recurrentToOutputWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 8, model, data);

    // 9: The input gate bias. A 1-D tensor of type ANEURALNETWORKS_TENSOR_INT32 and shape [outputSize] specifying the
    //    bias for the fully-connected layer inside the LSTM cell. Bias is quantized with scale being a product
    //    of input and weights scales and zeroPoint equal to 0.
    const ConstTensorPin inputGateBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 9, model, data);

    // 10: The forget gate bias. A 1-D tensor of type ANEURALNETWORKS_TENSOR_INT32 and shape [outputSize] specifying
    //     the bias for the fully-connected layer inside the LSTM cell. Bias is quantized with scale being a product
    //     of input and weights scales and zeroPoint equal to 0.
    const ConstTensorPin forgetGateBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 10, model, data);

    // 11:The cell bias. A 1-D tensor of type ANEURALNETWORKS_TENSOR_INT32 and shape [outputSize] specifying the bias
    //    for the fully-connected layer inside the LSTM cell. Bias is quantized with scale being a product of input
    //    and weights scales and zeroPoint equal to 0.
    const ConstTensorPin cellBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 11, model, data);

    // 12:The output gate bias. A 1-D tensor of type ANEURALNETWORKS_TENSOR_INT32 and shape [outputSize] specifying
    //    the bias for the fully-connected layer inside the LSTM cell. Bias is quantized with scale being a product
    //    of input and weights scales and zeroPoint equal to 0.
    const ConstTensorPin outputGateBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 12, model, data);

    // A pin is invalid if the operand could not be read or is not constant
    if (!inputToInputWeightsPin.IsValid() ||
        !inputToForgetWeightsPin.IsValid() ||
        !inputToCellWeightsPin.IsValid() ||
        !inputToOutputWeightsPin.IsValid() ||
        !recurrentToInputWeightsPin.IsValid() ||
        !recurrentToForgetWeightsPin.IsValid() ||
        !recurrentToCellWeightsPin.IsValid() ||
        !recurrentToOutputWeightsPin.IsValid() ||
        !inputGateBiasPin.IsValid() ||
        !forgetGateBiasPin.IsValid() ||
        !cellBiasPin.IsValid() ||
        !outputGateBiasPin.IsValid())
    {
        return Fail("%s: Operation has invalid tensor inputs", __func__);
    }

    // Outputs:
    // 0: The cell state: A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT16_SYMM and shape [numBatches, outputSize]
    //    which contains a cell state from the current time step. Tensor is quantized using a quantization range
    //    of -2^4, 2^4 * 32767/32768.
    const Operand* cellStateOut = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
    if (!cellStateOut)
    {
        return Fail("%s: Could not read output 0: cellStateOut", __func__);
    }

    // 1: The output: A 2-D tensor of type ANEURALNETWORKS_TENSOR_QUANT8_ASYMM and shape [numBathes, outputSize] which
    //    contains the output value. Tensor is quantized with a fixed quantization range of -1, 127/128.
    const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 1, model);
    if (!output)
    {
        return Fail("%s: Could not read output 1: output", __func__);
    }

    // Inputs
    const TensorInfo& inputInfo               = input.GetTensorInfo();
    const TensorInfo& previousCellStateInInfo = previousCellStateIn.GetTensorInfo();
    const TensorInfo& previousOutputInInfo    = previousOutputIn.GetTensorInfo();

    // Outputs
    const TensorInfo& cellStateOutInfo = GetTensorInfoForOperand(*cellStateOut);
    const TensorInfo& outputInfo = GetTensorInfoForOperand(*output);

    // Dynamic tensors currently not supported
    if (IsDynamicTensor(cellStateOutInfo) || IsDynamicTensor(outputInfo))
    {
        return Fail("%s: Dynamic output tensors are not supported", __func__);
    }

    // Collect the constant tensors; the pins own the data, params holds raw pointers into them
    QuantizedLstmInputParams params;

    params.m_InputToInputWeights = inputToInputWeightsPin.GetConstTensorPtr();
    params.m_InputToForgetWeights = inputToForgetWeightsPin.GetConstTensorPtr();
    params.m_InputToCellWeights = inputToCellWeightsPin.GetConstTensorPtr();
    params.m_InputToOutputWeights = inputToOutputWeightsPin.GetConstTensorPtr();
    params.m_RecurrentToInputWeights = recurrentToInputWeightsPin.GetConstTensorPtr();
    params.m_RecurrentToForgetWeights = recurrentToForgetWeightsPin.GetConstTensorPtr();
    params.m_RecurrentToCellWeights = recurrentToCellWeightsPin.GetConstTensorPtr();
    params.m_RecurrentToOutputWeights = recurrentToOutputWeightsPin.GetConstTensorPtr();
    params.m_InputGateBias = inputGateBiasPin.GetConstTensorPtr();
    params.m_ForgetGateBias = forgetGateBiasPin.GetConstTensorPtr();
    params.m_CellBias = cellBiasPin.GetConstTensorPtr();
    params.m_OutputGateBias = outputGateBiasPin.GetConstTensorPtr();

    // Mirror of params carrying only the TensorInfos, used for the support query below
    QuantizedLstmInputParamsInfo paramsInfo;
    paramsInfo.m_InputToInputWeights = &(params.m_InputToInputWeights->GetInfo());
    paramsInfo.m_InputToForgetWeights = &(params.m_InputToForgetWeights->GetInfo());
    paramsInfo.m_InputToCellWeights = &(params.m_InputToCellWeights->GetInfo());
    paramsInfo.m_InputToOutputWeights = &(params.m_InputToOutputWeights->GetInfo());
    paramsInfo.m_RecurrentToInputWeights = &(params.m_RecurrentToInputWeights->GetInfo());
    paramsInfo.m_RecurrentToForgetWeights = &(params.m_RecurrentToForgetWeights->GetInfo());
    paramsInfo.m_RecurrentToCellWeights = &(params.m_RecurrentToCellWeights->GetInfo());
    paramsInfo.m_RecurrentToOutputWeights = &(params.m_RecurrentToOutputWeights->GetInfo());
    paramsInfo.m_InputGateBias = &(params.m_InputGateBias->GetInfo());
    paramsInfo.m_ForgetGateBias = &(params.m_ForgetGateBias->GetInfo());
    paramsInfo.m_CellBias = &(params.m_CellBias->GetInfo());
    paramsInfo.m_OutputGateBias = &(params.m_OutputGateBias->GetInfo());

    bool isSupported = false;
    FORWARD_LAYER_SUPPORT_FUNC(__func__,
                               IsQuantizedLstmSupported,
                               data.m_Backends,
                               isSupported,
                               inputInfo,
                               previousCellStateInInfo,
                               previousOutputInInfo,
                               cellStateOutInfo,
                               outputInfo,
                               paramsInfo);

    if (!isSupported)
    {
        return false;
    }

    // Input slot order is fixed by the QuantizedLstm layer: input, cell state, output state
    IConnectableLayer* const layer = data.m_Network->AddQuantizedLstmLayer(params, "QuantizedLstm");
    input.Connect(layer->GetInputSlot(0));
    previousCellStateIn.Connect(layer->GetInputSlot(1));
    previousOutputIn.Connect(layer->GetInputSlot(2));

    // Register both outputs: operation output 0 -> layer slot 0 (cell state),
    // operation output 1 -> layer slot 1 (output)
    return (SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, 0, model, data) &&
            SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 1, *layer, 1, model, data));
}
1824
// ANEURALNETWORKS_RELU: delegates to the free-function template ::ConvertReLu
// instantiated for this HAL 1.2 policy.
bool HalPolicy::ConvertReLu(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertReLu()");
    return ::ConvertReLu<hal_1_2::HalPolicy>(operation, model, data);
}
1830
// ANEURALNETWORKS_RELU1: delegates to the free-function template ::ConvertReLu1
// instantiated for this HAL 1.2 policy.
bool HalPolicy::ConvertReLu1(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertReLu1()");
    return ::ConvertReLu1<hal_1_2::HalPolicy>(operation, model, data);
}
1836
// ANEURALNETWORKS_RELU6: delegates to the free-function template ::ConvertReLu6
// instantiated for this HAL 1.2 policy.
bool HalPolicy::ConvertReLu6(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertReLu6()");
    return ::ConvertReLu6<hal_1_2::HalPolicy>(operation, model, data);
}
1842
// ANEURALNETWORKS_RESHAPE: delegates to the free-function template
// ::ConvertReshape instantiated for this HAL 1.2 policy.
bool HalPolicy::ConvertReshape(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertReshape()");
    return ::ConvertReshape<hal_1_2::HalPolicy>(operation, model, data);
}
1848
Aron Virginas-Tarfb2fa292019-07-04 11:59:48 +01001849bool HalPolicy::ConvertResize(const Operation& operation,
1850 const Model& model,
1851 ConversionData& data,
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001852 ResizeMethod resizeMethod)
Aron Virginas-Tar7a6d11b2019-07-03 15:27:08 +01001853{
Aron Virginas-Tar29404fb2019-07-24 13:55:31 +01001854 ALOGV("hal_1_2::HalPolicy::ConvertResize()");
Aron Virginas-Tar7d2ccfd2019-10-29 14:03:51 +00001855 ALOGV("resizeMethod = %s", GetResizeMethodAsCString(resizeMethod));
Aron Virginas-Tar29404fb2019-07-24 13:55:31 +01001856
1857 LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
Aron Virginas-Tar7a6d11b2019-07-03 15:27:08 +01001858 if (!input.IsValid())
1859 {
1860 return Fail("%s: Could not read input 0", __func__);
1861 }
1862
1863 const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
1864 if (!output)
1865 {
1866 return Fail("%s: Could not read output 0", __func__);
1867 }
1868
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001869 const TensorInfo& inputInfo = input.GetTensorInfo();
1870 const TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +01001871
1872 if (IsDynamicTensor(outputInfo))
1873 {
1874 return Fail("%s: Dynamic output tensors are not supported", __func__);
1875 }
Aron Virginas-Tar7a6d11b2019-07-03 15:27:08 +01001876
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001877 ResizeDescriptor descriptor;
Aron Virginas-Tarfb2fa292019-07-04 11:59:48 +01001878 descriptor.m_Method = resizeMethod;
Aron Virginas-Tar7a6d11b2019-07-03 15:27:08 +01001879 descriptor.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 3, model, data);
1880
1881 OperandType operandType1;
1882 OperandType operandType2;
1883
1884 if (!GetOperandType<hal_1_2::HalPolicy>(operation, 1, model, operandType1) ||
1885 !GetOperandType<hal_1_2::HalPolicy>(operation, 2, model, operandType2))
1886 {
1887 return Fail("%s: Operation has invalid inputs", __func__);
1888 }
1889
1890 if (operandType1 != operandType2)
1891 {
1892 return Fail("%s: Operation has invalid inputs. Type of input 1 and 2 should be the same", __func__);
1893 }
1894
1895 if (operandType1 == OperandType::INT32)
1896 {
1897 // Case 1: resizing by shape
1898 int32_t targetWidth = 0;
1899 int32_t targetHeight = 0;
1900
1901 if (!GetInputInt32<hal_1_2::HalPolicy>(operation, 1, targetWidth, model, data) ||
1902 !GetInputInt32<hal_1_2::HalPolicy>(operation, 2, targetHeight, model, data))
1903 {
1904 return Fail("%s: Operation has invalid inputs for resizing by shape", __func__);
1905 }
1906
1907 if (targetWidth < 0 || targetHeight < 0)
1908 {
1909 return Fail("%s: Operation has invalid inputs for resizing by shape. "
1910 "Target width/height cannot be < 0", __func__);
1911 }
1912
1913 descriptor.m_TargetWidth = static_cast<uint32_t>(targetWidth);
Teresa Charlin9843c012019-07-19 12:18:35 +01001914 descriptor.m_TargetHeight = static_cast<uint32_t>(targetHeight);
Aron Virginas-Tar7a6d11b2019-07-03 15:27:08 +01001915 }
1916 else if (operandType1 == OperandType::FLOAT32)
1917 {
1918 // Case 2: resizing by scale
1919 float widthScale = 1.0f;
1920 float heightScale = 1.0f;
1921
1922 if (!GetInputFloat32<hal_1_2::HalPolicy>(operation, 1, widthScale, model, data) ||
1923 !GetInputFloat32<hal_1_2::HalPolicy>(operation, 2, heightScale, model, data))
1924 {
1925 return Fail("%s: Operation has invalid inputs for resizing by scale", __func__);
1926 }
1927
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001928 const TensorShape& inputShape = inputInfo.GetShape();
Aron Virginas-Tar7a6d11b2019-07-03 15:27:08 +01001929 armnnUtils::DataLayoutIndexed dataLayoutIndexed(descriptor.m_DataLayout);
1930
1931 float width = inputShape[dataLayoutIndexed.GetWidthIndex()];
1932 float height = inputShape[dataLayoutIndexed.GetHeightIndex()];
1933
1934 descriptor.m_TargetWidth = std::floor(width * widthScale);
1935 descriptor.m_TargetHeight = std::floor(height * heightScale);
1936 }
Keith Davisd410b602019-12-19 12:31:30 +00001937 else if (operandType1 == OperandType::FLOAT16)
1938 {
1939 Half widthScale;
1940 Half heightScale;
1941
1942 if (!GetInputScalar<HalPolicy>(operation, 1, HalPolicy::OperandType::FLOAT16, widthScale, model, data) ||
1943 !GetInputScalar<HalPolicy>(operation, 2, HalPolicy::OperandType::FLOAT16, heightScale, model, data))
1944 {
1945 return Fail("%s: Operation has invalid inputs for resizing by scale", __func__);
1946 }
1947
1948 const TensorShape& inputShape = inputInfo.GetShape();
1949 armnnUtils::DataLayoutIndexed dataLayoutIndexed(descriptor.m_DataLayout);
1950
1951 Half width = static_cast<Half>(inputShape[dataLayoutIndexed.GetWidthIndex()]);
1952 Half height = static_cast<Half>(inputShape[dataLayoutIndexed.GetHeightIndex()]);
1953
1954 descriptor.m_TargetWidth = std::floor(width * widthScale);
1955 descriptor.m_TargetHeight = std::floor(height * heightScale);
1956 }
Aron Virginas-Tar7a6d11b2019-07-03 15:27:08 +01001957 else
1958 {
Keith Davisd410b602019-12-19 12:31:30 +00001959 return Fail("%s: Operand has invalid data type for resizing by scale", __func__);
Aron Virginas-Tar7a6d11b2019-07-03 15:27:08 +01001960 }
1961
Ferran Balaguerd30093c2019-07-09 17:04:47 +01001962 bool isSupported = false;
1963 FORWARD_LAYER_SUPPORT_FUNC(__func__,
1964 IsResizeSupported,
1965 data.m_Backends,
1966 isSupported,
1967 inputInfo,
1968 outputInfo,
1969 descriptor);
Aron Virginas-Tarbe5d3562019-07-16 11:32:29 +01001970
Ferran Balaguerd30093c2019-07-09 17:04:47 +01001971 if (!isSupported)
Aron Virginas-Tar7a6d11b2019-07-03 15:27:08 +01001972 {
1973 return false;
1974 }
1975
Teresa Charlin8f6429d2019-10-01 13:10:15 +01001976 IConnectableLayer* layer = data.m_Network->AddResizeLayer(descriptor);
Aron Virginas-Tar7a6d11b2019-07-03 15:27:08 +01001977
1978 assert(layer != nullptr);
1979
Aron Virginas-Tar7a6d11b2019-07-03 15:27:08 +01001980 input.Connect(layer->GetInputSlot(0));
1981
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +01001982 return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
Aron Virginas-Tar7a6d11b2019-07-03 15:27:08 +01001983}
1984
// ANEURALNETWORKS_SPACE_TO_BATCH_ND: delegates to the free-function template
// ::ConvertSpaceToBatchNd instantiated for this HAL 1.2 policy.
bool HalPolicy::ConvertSpaceToBatchNd(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertSpaceToBatchNd()");
    return ::ConvertSpaceToBatchNd<hal_1_2::HalPolicy>(operation, model, data);
}
1990
Keith Davisa6bc52f2019-06-26 09:39:49 +01001991bool HalPolicy::ConvertSpaceToDepth(const Operation& operation, const Model& model, ConversionData& data)
1992{
Aron Virginas-Tar29404fb2019-07-24 13:55:31 +01001993 ALOGV("hal_1_2::HalPolicy::ConvertSpaceToDepth()");
Keith Davisa6bc52f2019-06-26 09:39:49 +01001994
Aron Virginas-Tar29404fb2019-07-24 13:55:31 +01001995 LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
Keith Davisa6bc52f2019-06-26 09:39:49 +01001996 if (!input.IsValid() )
1997 {
1998 return Fail("%s: Operation has invalid inputs", __func__);
1999 }
2000
Teresa Charlin8f6429d2019-10-01 13:10:15 +01002001 const TensorInfo& inputInfo = input.GetTensorInfo();
Keith Davisa6bc52f2019-06-26 09:39:49 +01002002 unsigned int rank = inputInfo.GetNumDimensions();
Keith Davisa6bc52f2019-06-26 09:39:49 +01002003 if (rank != 4)
2004 {
2005 return Fail("%s: Only inputs with rank 4 are supported", __func__);
2006 }
2007
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +01002008 const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
2009 if (!output)
2010 {
2011 return Fail("%s: Could not read output 0", __func__);
2012 }
2013
Teresa Charlin8f6429d2019-10-01 13:10:15 +01002014 const TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +01002015 if (IsDynamicTensor(outputInfo))
2016 {
2017 return Fail("%s: Dynamic output tensors are not supported", __func__);
2018 }
2019
Teresa Charlin8f6429d2019-10-01 13:10:15 +01002020 SpaceToDepthDescriptor desc;
Keith Davisa6bc52f2019-06-26 09:39:49 +01002021
2022 GetInputScalar<hal_1_2::HalPolicy>(operation, 1, OperandType::INT32, desc.m_BlockSize, model, data);
2023
2024 if (desc.m_BlockSize <= 1)
2025 {
2026 return Fail("%s: Block size must be at least 1 in all dimensions");
2027 }
2028
2029 desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 2, model, data);
2030
Ferran Balaguerd30093c2019-07-09 17:04:47 +01002031 bool isSupported = false;
2032 FORWARD_LAYER_SUPPORT_FUNC(__func__,
2033 IsSpaceToDepthSupported,
2034 data.m_Backends,
2035 isSupported,
2036 inputInfo,
2037 outputInfo,
2038 desc);
2039 if (!isSupported)
Keith Davisa6bc52f2019-06-26 09:39:49 +01002040 {
2041 return false;
2042 }
2043
Teresa Charlin8f6429d2019-10-01 13:10:15 +01002044 IConnectableLayer* const layer = data.m_Network->AddSpaceToDepthLayer(desc);
Keith Davisa6bc52f2019-06-26 09:39:49 +01002045 assert(layer != nullptr);
2046 input.Connect(layer->GetInputSlot(0));
2047
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +01002048 return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
Keith Davisa6bc52f2019-06-26 09:39:49 +01002049}
2050
Francis Murtagh074c25a2019-07-22 16:40:57 +01002051bool HalPolicy::ConvertSoftmax(const Operation& operation, const Model& model, ConversionData& data)
2052{
Aron Virginas-Tar29404fb2019-07-24 13:55:31 +01002053 ALOGV("hal_1_2::HalPolicy::ConvertSoftmax()");
2054
Francis Murtagh074c25a2019-07-22 16:40:57 +01002055 LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
2056 if (!input.IsValid())
2057 {
2058 return Fail("%s: Operation has invalid inputs", __func__);
2059 }
2060
2061 const Operand* outputOperand = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
2062 if (!outputOperand)
2063 {
2064 return Fail("%s: Operation has no outputs", __func__);
2065 }
2066
Teresa Charlin8f6429d2019-10-01 13:10:15 +01002067 const TensorInfo& outputInfo = GetTensorInfoForOperand(*outputOperand);
Aron Virginas-Tar573a8fa2019-07-23 14:01:37 +01002068 if (IsDynamicTensor(outputInfo))
Francis Murtagh074c25a2019-07-22 16:40:57 +01002069 {
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +01002070 return Fail("%s: Dynamic output tensors are not supported", __func__);
Francis Murtagh074c25a2019-07-22 16:40:57 +01002071 }
2072
Teresa Charlin8f6429d2019-10-01 13:10:15 +01002073 SoftmaxDescriptor desc;
Francis Murtagh074c25a2019-07-22 16:40:57 +01002074 if (!GetInputFloat32<hal_1_2::HalPolicy>(operation, 1, desc.m_Beta, model, data))
2075 {
2076 return Fail("%s: Operation has invalid inputs", __func__);
2077 }
2078
2079 if (operation.inputs.size() > 2 && !GetInputScalar<hal_1_2::HalPolicy>(operation,
2080 2,
2081 HalPolicy::OperandType::INT32,
2082 desc.m_Axis,
2083 model,
2084 data))
2085 {
2086 return Fail("%s: Operation has invalid inputs", __func__);
2087 }
2088
Narumol Prangnawarat52dc5272019-08-06 17:34:26 +01002089 if (input.GetTensorInfo().GetNumDimensions() > 2 ||
2090 !(desc.m_Axis == 1 ||
2091 (desc.m_Axis < 0 && static_cast<int>(input.GetTensorInfo().GetNumDimensions()) + desc.m_Axis == 1)))
2092 {
2093 return Fail("%s: Unsupported input greater than 2D or axis != 1", __func__);
2094 }
2095
Francis Murtagh074c25a2019-07-22 16:40:57 +01002096 bool isSupported = false;
2097 FORWARD_LAYER_SUPPORT_FUNC(__func__,
2098 IsSoftmaxSupported,
2099 data.m_Backends,
2100 isSupported,
2101 input.GetTensorInfo(),
2102 outputInfo,
2103 desc);
2104 if (!isSupported)
2105 {
2106 return false;
2107 }
2108
Teresa Charlin8f6429d2019-10-01 13:10:15 +01002109 IConnectableLayer* layer = data.m_Network->AddSoftmaxLayer(desc);
Francis Murtagh074c25a2019-07-22 16:40:57 +01002110 assert(layer != nullptr);
2111 input.Connect(layer->GetInputSlot(0));
2112
Aron Virginas-Tarb7421e52019-07-26 13:14:39 +01002113 return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *layer, model, data);
Francis Murtagh074c25a2019-07-22 16:40:57 +01002114}
2115
// Converts an ANEURALNETWORKS_SUB operation by delegating to the HAL-version-agnostic
// ::ConvertSub implementation shared with the other HalPolicy versions.
bool HalPolicy::ConvertSub(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertSub()");
    return ::ConvertSub<hal_1_2::HalPolicy>(operation, model, data);
}
2121
// Converts an ANEURALNETWORKS_TANH operation by delegating to the HAL-version-agnostic
// ::ConvertTanH implementation shared with the other HalPolicy versions.
bool HalPolicy::ConvertTanH(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertTanH()");
    return ::ConvertTanH<hal_1_2::HalPolicy>(operation, model, data);
}
2127
Pablo Tello972603f2019-11-28 15:21:41 +00002128template<typename HalPolicy,
2129 typename HalOperation = typename HalPolicy::Operation,
2130 typename HalModel = typename HalPolicy::Model>
2131bool SetupAndTrackLayerOutputSlotAndOverrideTensorInfo(const HalOperation& operation,
2132 uint32_t operationOutputIndex,
2133 armnn::IConnectableLayer& layer,
2134 uint32_t layerOutputIndex,
2135 const HalModel& model,
2136 ConversionData& data,
2137 const armnn::TensorInfo tensor_info)
2138{
2139 using HalOperand = typename HalPolicy::Operand;
2140
2141 const HalOperand* outputOperand = GetOutputOperand<HalPolicy>(operation, operationOutputIndex, model);
2142 if ((outputOperand == nullptr) || (operationOutputIndex >= layer.GetNumOutputSlots()))
2143 {
2144 return false;
2145 }
2146
2147 armnn::IOutputSlot& outputSlot = layer.GetOutputSlot(layerOutputIndex);
2148
2149 const uint32_t operandIndex = operation.outputs[operationOutputIndex];
2150 data.m_OutputSlotForOperand[operandIndex] = &outputSlot;
2151
2152 outputSlot.SetTensorInfo(tensor_info);
2153
2154 return true;
2155}
2156
2157
// Converts an ANEURALNETWORKS_LSTM operation (HAL 1.2) into an ArmNN LSTM layer.
//
// Reads the three runtime inputs (input, output state, cell state), the mandatory and
// optional constant tensors (CIFG, peephole, projection and layer-normalisation groups),
// and the three scalar settings (activation, cell clip, projection clip); validates the
// optional groups for internal consistency; queries backend support; then adds the layer
// and wires up its four outputs. Returns false (via Fail) on any invalid or unsupported
// configuration.
bool HalPolicy::ConvertLstm(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertLstm()");

    // Inputs:
    // 00: The input: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, input_size], where
    //     “batch_size” corresponds to the batching dimension, and “input_size” is the size of the input.
    LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
    if (!input.IsValid())
    {
        return Fail("%s: Could not read input 0: input", __func__);
    }
    // 18: The output state: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, output_size].
    LayerInputHandle outputStateIn = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 18, model, data);
    if (!outputStateIn.IsValid())
    {
        return Fail("%s: Could not read input 18: outputStateIn", __func__);
    }
    // 19: The cell state: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, num_units].
    LayerInputHandle cellStateIn = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 19, model, data);
    if (!cellStateIn.IsValid())
    {
        return Fail("%s: Could not read input 19: cellStateIn", __func__);
    }

    // Get the mandatory input tensors:
    // NOTE: DequantizeAndMakeConstTensorPin is used (rather than
    // ConvertOperationInputToConstTensorPin) so that QSymm8 weights fed through a
    // DEQUANTIZE operation can be resolved to constants on the fly.
    // 02: The input-to-forget weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [num_units, input_size].
    const ConstTensorPin inputToForgetWeightsPin =
        (DequantizeAndMakeConstTensorPin<hal_1_2::HalPolicy>(operation, model, data, 2));
    // 03: The input-to-cell weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [num_units, input_size].
    const ConstTensorPin inputToCellWeightsPin =
        (DequantizeAndMakeConstTensorPin<hal_1_2::HalPolicy>(operation, model, data, 3));
    // 04: The input-to-output weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [num_units, input_size].
    const ConstTensorPin inputToOutputWeightsPin =
        (DequantizeAndMakeConstTensorPin<hal_1_2::HalPolicy>(operation, model, data, 4));
    // 06: The recurrent-to-forget weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [num_units, output_size].
    const ConstTensorPin recurrentToForgetWeightsPin =
        (DequantizeAndMakeConstTensorPin<hal_1_2::HalPolicy>(operation, model, data, 6));
    // 07: The recurrent-to-cell weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [num_units, output_size].
    const ConstTensorPin recurrentToCellWeightsPin =
        (DequantizeAndMakeConstTensorPin<hal_1_2::HalPolicy>(operation, model, data, 7));
    // 08: The recurrent-to-output weights: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [num_units, output_size].
    const ConstTensorPin recurrentToOutputWeightsPin =
        (DequantizeAndMakeConstTensorPin<hal_1_2::HalPolicy>(operation, model, data, 8));
    // 13: The forget gate bias: A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].
    const ConstTensorPin forgetGateBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 13, model, data);
    // 14: The cell bias: A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].
    const ConstTensorPin cellBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 14, model, data);
    // 15: The output gate bias: A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].
    const ConstTensorPin outputGateBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 15, model, data);

    if (!inputToForgetWeightsPin.IsValid() ||
        !inputToCellWeightsPin.IsValid() ||
        !inputToOutputWeightsPin.IsValid() ||
        !recurrentToForgetWeightsPin.IsValid() ||
        !recurrentToCellWeightsPin.IsValid() ||
        !recurrentToOutputWeightsPin.IsValid() ||
        !forgetGateBiasPin.IsValid() ||
        !cellBiasPin.IsValid() ||
        !outputGateBiasPin.IsValid())
    {
        return Fail("%s: Operation has invalid tensor inputs", __func__);
    }

    // Get the optional input tensors (the trailing 'true' marks them optional: an
    // absent operand yields a valid-but-empty pin rather than a failure):
    // 01: The input-to-input weights: Optional. A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [num_units, input_size], where “num_units” corresponds to the number of cell units.
    const ConstTensorPin inputToInputWeightsPin =
        (DequantizeAndMakeConstTensorPin<hal_1_2::HalPolicy>(operation, model, data, 1, true));
    // 05: The recurrent-to-input weights: Optional. A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [num_units, output_size], where “output_size” corresponds to either the number of cell units (i.e.,
    //     “num_units”), or the second dimension of the “projection_weights”, if defined.
    const ConstTensorPin recurrentToInputWeightsPin =
        (DequantizeAndMakeConstTensorPin<hal_1_2::HalPolicy>(operation, model, data, 5, true));
    // 09: The cell-to-input weights: Optional. A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].
    const ConstTensorPin cellToInputWeightsPin =
        (DequantizeAndMakeConstTensorPin<hal_1_2::HalPolicy>(operation, model, data, 9, true));
    // 10: The cell-to-forget weights: Optional. A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].
    const ConstTensorPin cellToForgetWeightsPin =
        (DequantizeAndMakeConstTensorPin<hal_1_2::HalPolicy>(operation, model, data, 10, true));
    // 11: The cell-to-output weights: Optional. A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].
    const ConstTensorPin cellToOutputWeightsPin =
        (DequantizeAndMakeConstTensorPin<hal_1_2::HalPolicy>(operation, model, data, 11, true));
    // 12: The input gate bias: Optional. A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [num_units].
    const ConstTensorPin inputGateBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  12,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    // 16: The projection weights: Optional. A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape
    //     [output_size, num_units].
    const ConstTensorPin projectionWeightsPin =
        (DequantizeAndMakeConstTensorPin<hal_1_2::HalPolicy>(operation, model, data, 16, true));
    // 17: The projection bias: Optional. A 1-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [output_size].
    const ConstTensorPin projectionBiasPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  17,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    // An optional pin may be invalid only if the operand was present but unreadable.
    if ((!inputToInputWeightsPin.IsValid() && !inputToInputWeightsPin.IsOptional()) ||
        (!recurrentToInputWeightsPin.IsValid() && !recurrentToInputWeightsPin.IsOptional()) ||
        (!cellToInputWeightsPin.IsValid() && !cellToInputWeightsPin.IsOptional()) ||
        (!cellToForgetWeightsPin.IsValid() && !cellToForgetWeightsPin.IsOptional()) ||
        (!cellToOutputWeightsPin.IsValid() && !cellToOutputWeightsPin.IsOptional()) ||
        (!inputGateBiasPin.IsValid() && !inputGateBiasPin.IsOptional()) ||
        (!projectionWeightsPin.IsValid() && !projectionWeightsPin.IsOptional()) ||
        (!projectionBiasPin.IsValid() && !projectionBiasPin.IsOptional()))
    {
        return Fail("%s: Operation has invalid tensor inputs", __func__);
    }

    // Get the mandatory input scalars (actually 1-D tensors of size 1):
    // 20: The activation function: A value indicating the activation function:
    //     0: None; 1: Relu; 3: Relu6; 4: Tanh; 6: Sigmoid.
    // 21: The clipping threshold: for the cell state, such that values are bound within [-cell_clip, cell_clip].
    //     If set to 0.0 then clipping is disabled.
    // 22: The clipping threshold: for the output from the projection layer, such that values are bound within
    //     [-proj_clip, proj_clip]. If set to 0.0 then clipping is disabled.
    ActivationFn activation;
    float cellClip;
    float projClip;
    if (!GetInputActivationFunctionFromTensor<hal_1_2::HalPolicy>(operation, 20, activation, model, data) ||
        !GetInputScalar<hal_1_2::HalPolicy>(operation, 21, OperandType::FLOAT32, cellClip, model, data) ||
        !GetInputScalar<hal_1_2::HalPolicy>(operation, 22, OperandType::FLOAT32, projClip, model, data))
    {
        return Fail("%s: Operation has invalid scalar inputs", __func__);
    }

    // Get the normalization tensors
    // 23: The input layer normalization weights. A 1-D tensor of shape [num_units].
    //     Used to rescale normalized inputs to activation at input gate.
    const ConstTensorPin inputLayerNormWeightsPin
        (DequantizeAndMakeConstTensorPin<hal_1_2::HalPolicy>(operation, model, data, 23, true));

    // 24: The forget layer normalization weights. A 1-D tensor of shape [num_units].
    //     Used to rescale normalized inputs to activation at forget gate.
    const ConstTensorPin forgetLayerNormWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  24,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    // 25: The cell layer normalization weights. A 1-D tensor of shape [num_units].
    //     Used to rescale normalized inputs to activation at cell gate.
    const ConstTensorPin cellLayerNormWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  25,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    // 26: The output layer normalization weights. A 1-D tensor of shape [num_units].
    //     Used to rescale normalized inputs to activation at output gate.
    const ConstTensorPin outputLayerNormWeightsPin =
        ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation,
                                                                  26,
                                                                  model,
                                                                  data,
                                                                  g_DontPermute,
                                                                  nullptr,
                                                                  true);

    // Outputs:
    // 00: The scratch buffer: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, num_units * 4]
    //     with CIFG, or [batch_size, num_units * 3] without CIFG.
    const Operand* scratchBuffer = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
    if (!scratchBuffer)
    {
        return Fail("%s: Could not read output 0: scratchBuffer", __func__);
    }
    // 01: The output state (out): A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, output_size].
    const Operand* outputStateOut = GetOutputOperand<hal_1_2::HalPolicy>(operation, 1, model);
    if (!outputStateOut)
    {
        return Fail("%s: Could not read output 1: outputStateOut", __func__);
    }
    // 02: The cell state (out): A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, num_units].
    const Operand* cellStateOut = GetOutputOperand<hal_1_2::HalPolicy>(operation, 2, model);
    if (!cellStateOut)
    {
        return Fail("%s: Could not read output 2: cellStateOut", __func__);
    }
    // 03: The output: A 2-D tensor of ANEURALNETWORKS_TENSOR_FLOAT32, of shape [batch_size, output_size]. This is
    //     effectively the same as the current “output state (out)” value.
    const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 3, model);
    if (!output)
    {
        return Fail("%s: Could not read output 3: output", __func__);
    }

    // set the params structure for the AddLstmLayer call
    // (pins for absent optional tensors yield nullptr here)
    LstmInputParams params;
    params.m_InputToInputWeights = inputToInputWeightsPin.GetConstTensorPtr();
    params.m_InputToForgetWeights = inputToForgetWeightsPin.GetConstTensorPtr();
    params.m_InputToCellWeights = inputToCellWeightsPin.GetConstTensorPtr();
    params.m_InputToOutputWeights = inputToOutputWeightsPin.GetConstTensorPtr();
    params.m_RecurrentToInputWeights = recurrentToInputWeightsPin.GetConstTensorPtr();
    params.m_RecurrentToForgetWeights = recurrentToForgetWeightsPin.GetConstTensorPtr();
    params.m_RecurrentToCellWeights = recurrentToCellWeightsPin.GetConstTensorPtr();
    params.m_RecurrentToOutputWeights = recurrentToOutputWeightsPin.GetConstTensorPtr();
    params.m_CellToInputWeights = cellToInputWeightsPin.GetConstTensorPtr();
    params.m_CellToForgetWeights = cellToForgetWeightsPin.GetConstTensorPtr();
    params.m_CellToOutputWeights = cellToOutputWeightsPin.GetConstTensorPtr();
    params.m_InputGateBias = inputGateBiasPin.GetConstTensorPtr();
    params.m_ForgetGateBias = forgetGateBiasPin.GetConstTensorPtr();
    params.m_CellBias = cellBiasPin.GetConstTensorPtr();
    params.m_OutputGateBias = outputGateBiasPin.GetConstTensorPtr();
    params.m_ProjectionWeights = projectionWeightsPin.GetConstTensorPtr();
    params.m_ProjectionBias = projectionBiasPin.GetConstTensorPtr();
    params.m_InputLayerNormWeights = inputLayerNormWeightsPin.GetConstTensorPtr();
    params.m_ForgetLayerNormWeights = forgetLayerNormWeightsPin.GetConstTensorPtr();
    params.m_CellLayerNormWeights = cellLayerNormWeightsPin.GetConstTensorPtr();
    params.m_OutputLayerNormWeights = outputLayerNormWeightsPin.GetConstTensorPtr();

    // set the layer descriptor
    // The enabled/disabled features are inferred from which optional tensors were supplied.
    LstmDescriptor desc;
    desc.m_ActivationFunc = activation;
    desc.m_ClippingThresCell = cellClip;
    desc.m_ClippingThresProj = projClip;
    desc.m_CifgEnabled = (params.m_InputToInputWeights == nullptr ||
                          params.m_RecurrentToInputWeights == nullptr ||
                          params.m_InputGateBias == nullptr);
    desc.m_PeepholeEnabled = (params.m_CellToForgetWeights != nullptr ||
                              params.m_CellToOutputWeights != nullptr);
    desc.m_ProjectionEnabled = (params.m_ProjectionWeights != nullptr);
    desc.m_LayerNormEnabled = (params.m_InputLayerNormWeights != nullptr ||
                               params.m_ForgetLayerNormWeights != nullptr ||
                               params.m_CellLayerNormWeights != nullptr ||
                               params.m_OutputLayerNormWeights != nullptr);

    // validate the optional input groups
    if (desc.m_CifgEnabled &&
        (params.m_InputToInputWeights != nullptr ||
         params.m_RecurrentToInputWeights != nullptr ||
         params.m_InputGateBias != nullptr))
    {
        return Fail("%s: All, or none, of input-to-input weights, recurrent-to-input weights,"
                    " and input gate bias must be provided", __func__);
    }

    if (!desc.m_ProjectionEnabled && params.m_ProjectionBias != nullptr)
    {
        return Fail("%s: projection bias should not be provided without projection weights", __func__);
    }

    if (desc.m_PeepholeEnabled &&
        (params.m_CellToForgetWeights == nullptr ||
         params.m_CellToOutputWeights == nullptr ||
         (!desc.m_CifgEnabled && params.m_CellToInputWeights == nullptr)))
    {
        return Fail("%s: All, or none, of cell-to-forget weights and cell-to-output weights must be provided"
                    " and, if CIFG is not enabled, cell-to-input weights must also be provided", __func__);
    }

    if (desc.m_LayerNormEnabled &&
        (params.m_ForgetLayerNormWeights == nullptr ||
         params.m_CellLayerNormWeights == nullptr ||
         params.m_OutputLayerNormWeights == nullptr ||
         (!desc.m_CifgEnabled && params.m_InputLayerNormWeights == nullptr)))
    {
        return Fail("%s: All, or none, of forget-norm weights, cell-norm weights and output-norm weights must be"
                    " provided and, if CIFG is not enabled, input-norm weights must also be provided", __func__);
    }

    // Check if the layer is supported
    // Inputs
    const TensorInfo& inputInfo         = input.GetTensorInfo();
    const TensorInfo& outputStateInInfo = outputStateIn.GetTensorInfo();
    const TensorInfo& cellStateInInfo   = cellStateIn.GetTensorInfo();

    // Outputs
    const TensorInfo& scratchBufferInfo  = GetTensorInfoForOperand(*scratchBuffer);
    const TensorInfo& outputStateOutInfo = GetTensorInfoForOperand(*outputStateOut);
    const TensorInfo& cellStateOutInfo   = GetTensorInfoForOperand(*cellStateOut);
    const TensorInfo& outputInfo         = GetTensorInfoForOperand(*output);

    // Check if the scratch buffer shape was initialized,
    // In some cases the shape could be (0,0) which requires the driver
    // to infer the shape and set it up accordingly.
    // The code below does that.
    TensorInfo fixSbInfo = scratchBufferInfo;
    if (IsDynamicTensor(scratchBufferInfo))
    {
        auto & s = fixSbInfo.GetShape();
        s[0] = outputStateInInfo.GetShape()[0];
        if (desc.m_CifgEnabled)
        {
            // 2D tensor with dimensions [batch_size, num_units * 3] with CIFG
            s[1] = cellStateOutInfo.GetShape()[1]*3;
        }
        else
        {
            // scratch_buffer [batch_size, num_units * 4] without CIFG
            s[1] = cellStateOutInfo.GetShape()[1]*4;
        }
    }

    // Only the scratch buffer may be dynamic (handled above); the remaining outputs must be static.
    if (IsDynamicTensor(outputStateOutInfo) ||
        IsDynamicTensor(cellStateOutInfo) ||
        IsDynamicTensor(outputInfo))
    {
        return Fail("%s: Dynamic output tensors are not supported %d %d %d %d", __func__,
                    IsDynamicTensor(scratchBufferInfo), IsDynamicTensor(outputStateOutInfo),
                    IsDynamicTensor(cellStateOutInfo), IsDynamicTensor(outputInfo));
    }

    // Basic parameters
    LstmInputParamsInfo paramsInfo;
    paramsInfo.m_InputToForgetWeights     = &(params.m_InputToForgetWeights->GetInfo());
    paramsInfo.m_InputToCellWeights       = &(params.m_InputToCellWeights->GetInfo());
    paramsInfo.m_InputToOutputWeights     = &(params.m_InputToOutputWeights->GetInfo());
    paramsInfo.m_RecurrentToForgetWeights = &(params.m_RecurrentToForgetWeights->GetInfo());
    paramsInfo.m_RecurrentToCellWeights   = &(params.m_RecurrentToCellWeights->GetInfo());
    paramsInfo.m_RecurrentToOutputWeights = &(params.m_RecurrentToOutputWeights->GetInfo());
    paramsInfo.m_ForgetGateBias           = &(params.m_ForgetGateBias->GetInfo());
    paramsInfo.m_CellBias                 = &(params.m_CellBias->GetInfo());
    paramsInfo.m_OutputGateBias           = &(params.m_OutputGateBias->GetInfo());

    // Optional parameters
    if(!desc.m_CifgEnabled)
    {
        paramsInfo.m_InputToInputWeights = &(params.m_InputToInputWeights->GetInfo());
        paramsInfo.m_RecurrentToInputWeights = &(params.m_RecurrentToInputWeights->GetInfo());
        if (params.m_CellToInputWeights != nullptr)
        {
            paramsInfo.m_CellToInputWeights = &(params.m_CellToInputWeights->GetInfo());
        }
        paramsInfo.m_InputGateBias = &(params.m_InputGateBias->GetInfo());
    }

    if(desc.m_ProjectionEnabled)
    {
        paramsInfo.m_ProjectionWeights = &(params.m_ProjectionWeights->GetInfo());
        if (params.m_ProjectionBias != nullptr)
        {
            paramsInfo.m_ProjectionBias = &(params.m_ProjectionBias->GetInfo());
        }
    }

    if(desc.m_PeepholeEnabled)
    {
        paramsInfo.m_CellToForgetWeights = &(params.m_CellToForgetWeights->GetInfo());
        paramsInfo.m_CellToOutputWeights = &(params.m_CellToOutputWeights->GetInfo());
    }

    if (desc.m_LayerNormEnabled)
    {
        if(!desc.m_CifgEnabled)
        {
            paramsInfo.m_InputLayerNormWeights = &(params.m_InputLayerNormWeights->GetInfo());
        }
        paramsInfo.m_ForgetLayerNormWeights = &(params.m_ForgetLayerNormWeights->GetInfo());
        paramsInfo.m_CellLayerNormWeights = &(params.m_CellLayerNormWeights->GetInfo());
        paramsInfo.m_OutputLayerNormWeights = &(params.m_OutputLayerNormWeights->GetInfo());
    }

    bool isSupported = false;
    FORWARD_LAYER_SUPPORT_FUNC(__func__,
                               IsLstmSupported,
                               data.m_Backends,
                               isSupported,
                               inputInfo,
                               outputStateInInfo,
                               cellStateInInfo,
                               fixSbInfo,
                               outputStateOutInfo,
                               cellStateOutInfo,
                               outputInfo,
                               desc,
                               paramsInfo);
    if (!isSupported)
    {
        return false;
    }

    // Add the layer
    IConnectableLayer* layer = data.m_Network->AddLstmLayer(desc, params, "Lstm");

    input.Connect(layer->GetInputSlot(0));
    outputStateIn.Connect(layer->GetInputSlot(1));
    cellStateIn.Connect(layer->GetInputSlot(2));

    // If the scratch buffer shape had to be inferred, bind output 0 with the
    // overridden TensorInfo; otherwise track it normally. Outputs 1-3 are static.
    return (
         (IsDynamicTensor(scratchBufferInfo)?
          SetupAndTrackLayerOutputSlotAndOverrideTensorInfo<hal_1_2::HalPolicy>(
              operation, 0, *layer, 0, model, data,fixSbInfo):
          SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(
              operation, 0, *layer, 0, model, data)) &&
         SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 1, *layer, 1, model, data) &&
         SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 2, *layer, 2, model, data) &&
         SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 3, *layer, 3, model, data));
}
2573
Sadik Armagan701d9a02019-09-04 15:16:18 +01002574bool HalPolicy::ConvertSqrt(const Operation& operation, const Model& model, ConversionData& data)
2575{
2576 ALOGV("hal_1_2::HalPolicy::ConvertSqrt()");
Teresa Charlin8f6429d2019-10-01 13:10:15 +01002577 ActivationDescriptor desc;
2578 desc.m_Function = ActivationFunction::Sqrt;
Sadik Armagan701d9a02019-09-04 15:16:18 +01002579
2580 return ::ConvertToActivation<hal_1_2::HalPolicy>(operation, __func__, desc, model, data);
2581}
2582
// Converts an ANEURALNETWORKS_SQUEEZE operation by delegating to the HAL-version-agnostic
// ::ConvertSqueeze implementation shared with the other HalPolicy versions.
bool HalPolicy::ConvertSqueeze(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertSqueeze()");
    return ::ConvertSqueeze<hal_1_2::HalPolicy>(operation, model, data);
}
2588
// Converts an ANEURALNETWORKS_STRIDED_SLICE operation by delegating to the
// HAL-version-agnostic ::ConvertStridedSlice implementation.
bool HalPolicy::ConvertStridedSlice(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertStridedSlice()");
    return ::ConvertStridedSlice<hal_1_2::HalPolicy>(operation, model, data);
}
2594
// Converts an ANEURALNETWORKS_TRANSPOSE operation by delegating to the
// HAL-version-agnostic ::ConvertTranspose implementation.
bool HalPolicy::ConvertTranspose(const Operation& operation, const Model& model, ConversionData& data)
{
    ALOGV("hal_1_2::HalPolicy::ConvertTranspose()");
    return ::ConvertTranspose<hal_1_2::HalPolicy>(operation, model, data);
}
2600
Aron Virginas-Tar8b991682019-07-31 12:54:59 +01002601bool HalPolicy::ConvertTransposeConv2d(const Operation& operation, const Model& model, ConversionData& data)
David Monahan613b49c2019-06-27 11:37:47 +01002602{
2603 LayerInputHandle input = ConvertToLayerInputHandle<hal_1_2::HalPolicy>(operation, 0, model, data);
2604
2605 if (!input.IsValid())
2606 {
2607 return Fail("%s: Operation has invalid inputs", __func__);
2608 }
2609
2610 const Operand* output = GetOutputOperand<hal_1_2::HalPolicy>(operation, 0, model);
2611
2612 if (!output)
2613 {
2614 return Fail("%s: Could not read output 0", __func__);
2615 }
2616
Teresa Charlin8f6429d2019-10-01 13:10:15 +01002617 const TensorInfo& inputInfo = input.GetTensorInfo();
2618 const TensorInfo& outputInfo = GetTensorInfoForOperand(*output);
David Monahan613b49c2019-06-27 11:37:47 +01002619 if (IsDynamicTensor(outputInfo))
2620 {
2621 return Fail("%s: Dynamic output tensors are not supported", __func__);
2622 }
2623
2624 // ArmNN does not currently support non-fixed weights or bias
2625 // Find the shape of the weights tensor. In AndroidNN this will be [ 1, H, W, I * M ]
2626 const Operand* weightsOperand = GetInputOperand<hal_1_2::HalPolicy>(operation, 1, model);
2627
2628 if (weightsOperand == nullptr)
2629 {
2630 return Fail("%s: Operand is invalid", __func__);
2631 }
Teresa Charlin8f6429d2019-10-01 13:10:15 +01002632 TransposeConvolution2dDescriptor desc;
2633 desc.m_DataLayout = DataLayout::NHWC;
David Monahan613b49c2019-06-27 11:37:47 +01002634
2635 // Determine whether padding is implicit or explicit
2636 bool implicitPadding = operation.inputs.size() == 9;
2637
2638 if (implicitPadding )
2639 {
2640 desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 8, model, data);
2641 }
2642 else
2643 {
2644 desc.m_DataLayout = OptionalDataLayout<hal_1_2::HalPolicy>(operation, 10, model, data);
2645 }
2646
2647 armnnUtils::DataLayoutIndexed dataLayoutIndexed(desc.m_DataLayout);
2648 unsigned int widthIndex = dataLayoutIndexed.GetWidthIndex();
2649 unsigned int heightIndex = dataLayoutIndexed.GetHeightIndex();
2650
Teresa Charlin8f6429d2019-10-01 13:10:15 +01002651 const PermutationVector OHWIToOIHW = {0, 2, 3, 1};
David Monahan613b49c2019-06-27 11:37:47 +01002652
2653 // The shape of the weight is [depth_out, filter_height, filter_width, depth_in].
2654 // We have to permute it to OIHW if the data layout is NCHW.
Teresa Charlin8f6429d2019-10-01 13:10:15 +01002655 const ConstTensorPin weightsPin = (desc.m_DataLayout == DataLayout::NCHW) ?
David Monahan613b49c2019-06-27 11:37:47 +01002656 ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data, OHWIToOIHW) :
2657 ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 1, model, data);
2658
2659 // Bias is a 1D tensor
2660 const ConstTensorPin biasPin =
2661 ConvertOperationInputToConstTensorPin<hal_1_2::HalPolicy>(operation, 2, model, data);
2662
2663 if (!weightsPin.IsValid())
2664 {
2665 return Fail("%s: Operation has invalid weights", __func__);
2666 }
2667
2668 if (!biasPin.IsValid())
2669 {
2670 return Fail("%s: Operation has invalid biases", __func__);
2671 }
2672
Teresa Charlin8f6429d2019-10-01 13:10:15 +01002673 ConstTensor weights = weightsPin.GetConstTensor();
2674 ConstTensor bias = biasPin.GetConstTensor();
David Monahan613b49c2019-06-27 11:37:47 +01002675 SanitizeBiasQuantizationScale(bias.GetInfo(), weights.GetInfo(), inputInfo);
2676
2677 ActivationFn activation;
2678
2679 if (implicitPadding)
2680 {
Sadik Armagan3e3003e2019-08-13 12:54:34 +01002681 int32_t strideX{0};
2682 int32_t strideY{0};
2683 int32_t padLeft{0};
2684 int32_t padRight{0};
2685 int32_t padTop{0};
2686 int32_t padBottom{0};
2687
David Monahan613b49c2019-06-27 11:37:47 +01002688 android::nn::PaddingScheme paddingScheme;
2689 if (!GetInputPaddingScheme<hal_1_2::HalPolicy>(operation, 4, paddingScheme, model, data) ||
Sadik Armagan3e3003e2019-08-13 12:54:34 +01002690 !GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, strideX, model, data) ||
2691 !GetInputScalar<hal_1_2::HalPolicy>(operation, 6, OperandType::INT32, strideY, model, data) ||
David Monahan613b49c2019-06-27 11:37:47 +01002692 !GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 7, activation, model, data))
2693 {
2694 return Fail("%s: Operation has invalid inputs (implicit padding)", __func__);
2695 }
2696
2697 const uint32_t kernelX = weights.GetShape()[widthIndex];
2698 const uint32_t kernelY = weights.GetShape()[heightIndex];
Narumol Prangnawaratc8bdb392019-08-01 15:51:44 +01002699 const uint32_t outputX = outputInfo.GetShape()[widthIndex];
2700 const uint32_t outputY = outputInfo.GetShape()[heightIndex];
David Monahan613b49c2019-06-27 11:37:47 +01002701
Narumol Prangnawaratc8bdb392019-08-01 15:51:44 +01002702 CalcPaddingTransposeConv(outputX, kernelX, desc.m_StrideX, padLeft, padRight, paddingScheme);
2703 CalcPaddingTransposeConv(outputY, kernelY, desc.m_StrideY, padTop, padBottom, paddingScheme);
2704
2705 // NOTE: The Android NN API allows for negative padding values in TransposeConv2d,
2706 // but Arm NN only supports values >= 0
2707 if (padLeft < 0 || padRight < 0 || padTop < 0 || padBottom < 0)
2708 {
2709 return Fail("%s: Negative padding values are not supported", __func__);
2710 }
2711
Sadik Armagan3e3003e2019-08-13 12:54:34 +01002712 desc.m_StrideX = boost::numeric_cast<uint32_t>(strideX);
2713 desc.m_StrideY = boost::numeric_cast<uint32_t>(strideY);
Narumol Prangnawaratc8bdb392019-08-01 15:51:44 +01002714 desc.m_PadLeft = boost::numeric_cast<uint32_t>(padLeft);
2715 desc.m_PadRight = boost::numeric_cast<uint32_t>(padRight);
2716 desc.m_PadTop = boost::numeric_cast<uint32_t>(padTop);
2717 desc.m_PadBottom = boost::numeric_cast<uint32_t>(padBottom);
David Monahan613b49c2019-06-27 11:37:47 +01002718 }
2719 else if (operation.inputs.size() == 11)
2720 {
2721 // explicit padding
2722 if (!GetInputScalar<hal_1_2::HalPolicy>(operation, 3, OperandType::INT32, desc.m_PadLeft, model, data) ||
2723 !GetInputScalar<hal_1_2::HalPolicy>(operation, 4, OperandType::INT32, desc.m_PadRight, model, data) ||
2724 !GetInputScalar<hal_1_2::HalPolicy>(operation, 5, OperandType::INT32, desc.m_PadTop, model, data) ||
2725 !GetInputScalar<hal_1_2::HalPolicy>(operation, 6, OperandType::INT32, desc.m_PadBottom, model, data) ||
2726 !GetInputScalar<hal_1_2::HalPolicy>(operation, 7, OperandType::INT32, desc.m_StrideX, model, data) ||
2727 !GetInputScalar<hal_1_2::HalPolicy>(operation, 8, OperandType::INT32, desc.m_StrideY, model, data) ||
2728 !GetInputActivationFunction<hal_1_2::HalPolicy>(operation, 9, activation, model, data))
2729 {
2730 return Fail("%s: Operation has invalid inputs (explicit padding)", __func__);
2731 }
2732 }
2733 else
2734 {
2735 return Fail("%s: Unsupported number of operation inputs", __func__);
2736 }
2737
2738 desc.m_BiasEnabled = true;
Teresa Charlin8f6429d2019-10-01 13:10:15 +01002739 Optional<TensorInfo> biases(bias.GetInfo());
David Monahan613b49c2019-06-27 11:37:47 +01002740
2741 bool isSupported = false;
2742 FORWARD_LAYER_SUPPORT_FUNC(__func__,
2743 IsTransposeConvolution2dSupported,
2744 data.m_Backends,
2745 isSupported,
2746 inputInfo,
2747 outputInfo,
2748 desc,
2749 weights.GetInfo(),
2750 biases);
2751 if (!isSupported)
2752 {
2753 return false;
2754 }
2755
Teresa Charlin8f6429d2019-10-01 13:10:15 +01002756 IConnectableLayer* startLayer =
2757 data.m_Network->AddTransposeConvolution2dLayer(desc, weights, Optional<ConstTensor>(bias));
David Monahan613b49c2019-06-27 11:37:47 +01002758 if (!startLayer)
2759 {
2760 return Fail("%s: AddTransposeConvolution2dLayer failed", __func__);
2761 }
2762
Teresa Charlin8f6429d2019-10-01 13:10:15 +01002763 IConnectableLayer* endLayer = ProcessActivation(outputInfo, activation, startLayer, data);
David Monahan613b49c2019-06-27 11:37:47 +01002764 if (!endLayer)
2765 {
2766 return Fail("%s: ProcessActivation failed", __func__);
2767 }
2768
2769 input.Connect(startLayer->GetInputSlot(0));
2770
2771 return SetupAndTrackLayerOutputSlot<hal_1_2::HalPolicy>(operation, 0, *endLayer, model, data);
2772}
2773
Mike Kellyb5fdf382019-06-11 16:35:25 +01002774} // namespace hal_1_2
Matteo Martincigh17ffff32019-06-27 14:12:55 +01002775} // namespace armnn_driver