Blame - 1.3/ArmnnDriverImpl.cpp - ml/android-nn-driver

Kevin May

42477c1

2020-03-26 13:34:14 +0000

[diff] [blame]

1

//

2

3

// SPDX-License-Identifier: MIT

4

//

5

6

#include "ArmnnDriverImpl.hpp"

7

#include "../ArmnnPreparedModel_1_3.hpp"

8

#include "../ModelToINetworkConverter.hpp"

9

#include "../SystemPropertiesUtils.hpp"

#include <log/log.h>

namespace

{

Kevin May

42477c1

2020-03-26 13:34:14 +0000

[diff] [blame]

15

const char *g_RelaxedFloat32toFloat16PerformanceExecTime = "ArmNN.relaxedFloat32toFloat16Performance.execTime";

16

const char *g_RelaxedFloat32toFloat16PerformancePowerUsage = "ArmNN.relaxedFloat32toFloat16Performance.powerUsage";

17

Kevin May

2eaa119

2020-04-15 16:50:57 +0100

[diff] [blame]

18

const char *g_ifPerformanceExecTime = "ArmNN.ifPerformance.execTime";

19

const char *g_ifPerformancePowerUsage = "ArmNN.ifPerformance.powerUsage";

20

21

const char *g_whilePerformanceExecTime = "ArmNN.whilePerformance.execTime";

22

const char *g_whilePerformancePowerUsage = "ArmNN.whilePerformance.powerUsage";

23

Kevin May

42477c1

2020-03-26 13:34:14 +0000

[diff] [blame]

24

const char *g_OperandTypeTensorFloat32PerformanceExecTime = "Armnn.operandTypeTensorFloat32Performance.execTime";

25

const char *g_OperandTypeTensorFloat32PerformancePowerUsage = "Armnn.operandTypeTensorFloat32Performance.powerUsage";

26

27

const char *g_OperandTypeFloat32PerformanceExecTime = "Armnn.operandTypeFloat32Performance.execTime";

28

const char *g_OperandTypeFloat32PerformancePowerUsage = "Armnn.operandTypeFloat32Performance.powerUsage";

29

30

const char *g_OperandTypeTensorFloat16PerformanceExecTime = "Armnn.operandTypeTensorFloat16Performance.execTime";

31

const char *g_OperandTypeTensorFloat16PerformancePowerUsage = "Armnn.operandTypeTensorFloat16Performance.powerUsage";

32

33

const char *g_OperandTypeFloat16PerformanceExecTime = "Armnn.operandTypeFloat16Performance.execTime";

34

const char *g_OperandTypeFloat16PerformancePowerUsage = "Armnn.operandTypeFloat16Performance.powerUsage";

35

36

const char *g_OperandTypeTensorQuant8AsymmPerformanceExecTime =

37

"Armnn.operandTypeTensorQuant8AsymmPerformance.execTime";

38

const char *g_OperandTypeTensorQuant8AsymmPerformancePowerUsage =

39

"Armnn.operandTypeTensorQuant8AsymmPerformance.powerUsage";

40

41

const char *g_OperandTypeTensorQuant8AsymmSignedPerformanceExecTime =

42

"Armnn.operandTypeTensorQuant8AsymmSignedPerformance.execTime";

43

const char *g_OperandTypeTensorQuant8AsymmSignedPerformancePowerUsage =

44

"Armnn.operandTypeTensorQuant8AsymmSignedPerformance.powerUsage";

45

46

const char *g_OperandTypeTensorQuant16SymmPerformanceExecTime =

47

"Armnn.operandTypeTensorQuant16SymmPerformance.execTime";

48

const char *g_OperandTypeTensorQuant16SymmPerformancePowerUsage =

49

"Armnn.operandTypeTensorQuant16SymmPerformance.powerUsage";

50

51

const char *g_OperandTypeTensorQuant8SymmPerformanceExecTime =

52

"Armnn.operandTypeTensorQuant8SymmPerformance.execTime";

53

const char *g_OperandTypeTensorQuant8SymmPerformancePowerUsage =

54

"Armnn.operandTypeTensorQuant8SymmPerformance.powerUsage";

55

56

const char *g_OperandTypeTensorQuant8SymmPerChannelPerformanceExecTime =

57

"Armnn.operandTypeTensorQuant8SymmPerChannelPerformance.execTime";

58

const char *g_OperandTypeTensorQuant8SymmPerChannelPerformancePowerUsage =

59

"Armnn.operandTypeTensorQuant8SymmPerChannelPerformance.powerUsage";

60

61

62

const char *g_OperandTypeTensorInt32PerformanceExecTime = "Armnn.operandTypeTensorInt32Performance.execTime";

63

const char *g_OperandTypeTensorInt32PerformancePowerUsage = "Armnn.operandTypeTensorInt32Performance.powerUsage";

64

65

const char *g_OperandTypeInt32PerformanceExecTime = "Armnn.operandTypeInt32Performance.execTime";

66

const char *g_OperandTypeInt32PerformancePowerUsage = "Armnn.operandTypeInt32Performance.powerUsage";

67

68

69

void NotifyCallbackAndCheck(const sp<V1_3::IPreparedModelCallback>& callback,

70

V1_3::ErrorStatus errorStatus,

71

const sp<V1_3::IPreparedModel>& preparedModelPtr)

72

{

73

Return<void> returned = callback->notify_1_3(errorStatus, preparedModelPtr);

74

// This check is required, if the callback fails and it isn't checked it will bring down the service

75

if (!returned.isOk())

76

{

77

ALOGE("ArmnnDriverImpl::prepareModel: hidl callback failed to return properly: %s ",

78

returned.description().c_str());

}

}

Return<V1_3::ErrorStatus> FailPrepareModel(V1_3::ErrorStatus error,

83

const std::string& message,

84

const sp<V1_3::IPreparedModelCallback>& callback)

85

{

86

ALOGW("ArmnnDriverImpl::prepareModel: %s", message.c_str());

87

NotifyCallbackAndCheck(callback, error, nullptr);

return error;

}

} // anonymous namespace

92

93

namespace armnn_driver

{

namespace hal_1_3

{

Return<V1_3::ErrorStatus> ArmnnDriverImpl::prepareArmnnModel_1_3(

99

const armnn::IRuntimePtr& runtime,

100

const armnn::IGpuAccTunedParametersPtr& clTunedParameters,

101

const DriverOptions& options,

102

const V1_3::Model& model,

103

const sp<V1_3::IPreparedModelCallback>& cb,

Narumol Prangnawarat

cad4e91

2020-06-02 12:07:43 +0100

[diff] [blame]

104

bool float32ToFloat16,

105

V1_3::Priority priority)

Kevin May

42477c1

2020-03-26 13:34:14 +0000

[diff] [blame]

106

{

107

ALOGV("ArmnnDriverImpl::prepareArmnnModel_1_3()");

108

109

if (cb.get() == nullptr)

110

{

111

ALOGW("ArmnnDriverImpl::prepareModel: Invalid callback passed to prepareModel");

112

return V1_3::ErrorStatus::INVALID_ARGUMENT;

}

if (!runtime)

{

return FailPrepareModel(V1_3::ErrorStatus::DEVICE_UNAVAILABLE, "Device unavailable", cb);

118

}

119

120

if (!android::nn::validateModel(model))

121

{

122

return FailPrepareModel(V1_3::ErrorStatus::INVALID_ARGUMENT, "Invalid model passed as input", cb);

123

}

124

125

// Deliberately ignore any unsupported operations requested by the options -

126

// at this point we're being asked to prepare a model that we've already declared support for

127

// and the operation indices may be different to those in getSupportedOperations anyway.

128

std::set<unsigned int> unsupportedOperations;

129

ModelToINetworkConverter<HalPolicy> modelConverter(options.GetBackends(),

130

model,

131

unsupportedOperations);

132

133

if (modelConverter.GetConversionResult() != ConversionResult::Success)

134

{

135

FailPrepareModel(V1_3::ErrorStatus::GENERAL_FAILURE, "ModelToINetworkConverter failed", cb);

136

return V1_3::ErrorStatus::NONE;

137

}

138

Sadik Armagan

b302143

2021-01-13 15:56:51 +0000

[diff] [blame]

139

// Serialize the network graph to a .armnn file if an output directory

140

// has been specified in the drivers' arguments.

141

auto serializedNetworkFileName =

142

SerializeNetwork(*modelConverter.GetINetwork(), options.GetRequestInputsAndOutputsDumpDir());

143

Kevin May

42477c1

2020-03-26 13:34:14 +0000

[diff] [blame]

144

// Optimize the network

145

armnn::IOptimizedNetworkPtr optNet(nullptr, nullptr);

146

armnn::OptimizerOptions OptOptions;

147

OptOptions.m_ReduceFp32ToFp16 = float32ToFloat16;

148

Mike Kelly

7ed56dd

2020-09-30 20:22:56 +0100

[diff] [blame]

149

armnn::BackendOptions gpuAcc("GpuAcc",

150

{

Sadik Armagan

f36e10b

2021-01-11 16:34:01 +0000

[diff] [blame]

151

{ "FastMathEnabled", options.IsFastMathEnabled() },

152

{ "SaveCachedNetwork", options.SaveCachedNetwork() },

153

{ "CachedNetworkFilePath", options.GetCachedNetworkFilePath() }

Mike Kelly

7ed56dd

2020-09-30 20:22:56 +0100

[diff] [blame]

154

});

155

armnn::BackendOptions cpuAcc("CpuAcc",

156

{

157

{ "FastMathEnabled", options.IsFastMathEnabled() }

158

});

159

OptOptions.m_ModelOptions.push_back(gpuAcc);

160

OptOptions.m_ModelOptions.push_back(cpuAcc);

161

Kevin May

42477c1

2020-03-26 13:34:14 +0000

[diff] [blame]

162

std::vector<std::string> errMessages;

163

try

164

{

165

optNet = armnn::Optimize(*modelConverter.GetINetwork(),

166

options.GetBackends(),

167

runtime->GetDeviceSpec(),

OptOptions,

errMessages);

}

catch (std::exception& e)

172

{

173

std::stringstream message;

174

message << "Exception (" << e.what() << ") caught from optimize.";

175

FailPrepareModel(V1_3::ErrorStatus::GENERAL_FAILURE, message.str(), cb);

176

return V1_3::ErrorStatus::NONE;

177

}

178

179

// Check that the optimized network is valid.

180

if (!optNet)

181

{

182

std::stringstream message;

183

message << "Invalid optimized network";

184

for (const std::string& msg : errMessages)

185

{

186

message << "\n" << msg;

187

}

188

FailPrepareModel(V1_3::ErrorStatus::GENERAL_FAILURE, message.str(), cb);

189

return V1_3::ErrorStatus::NONE;

190

}

191

192

// Export the optimized network graph to a dot file if an output dump directory

193

// has been specified in the drivers' arguments.

194

std::string dotGraphFileName = ExportNetworkGraphToDotFile(*optNet,

195

options.GetRequestInputsAndOutputsDumpDir());

196

197

// Load it into the runtime.

198

armnn::NetworkId netId = 0;

199

try

200

{

201

if (runtime->LoadNetwork(netId, move(optNet)) != armnn::Status::Success)

202

{

203

return FailPrepareModel(V1_3::ErrorStatus::GENERAL_FAILURE, "Network could not be loaded", cb);

204

}

205

}

206

catch (std::exception& e)

207

{

208

std::stringstream message;

209

message << "Exception (" << e.what()<< ") caught from LoadNetwork.";

210

FailPrepareModel(V1_3::ErrorStatus::GENERAL_FAILURE, message.str(), cb);

211

return V1_3::ErrorStatus::NONE;

212

}

213

Sadik Armagan

b302143

2021-01-13 15:56:51 +0000

[diff] [blame]

214

// Now that we have a networkId for the graph rename the exported files to use it

215

// so that we can associate the graph file and the input/output tensor exported files

216

RenameExportedFiles(serializedNetworkFileName,

217

dotGraphFileName,

218

options.GetRequestInputsAndOutputsDumpDir(),

219

netId);

Kevin May

42477c1

2020-03-26 13:34:14 +0000

[diff] [blame]

220

221

std::unique_ptr<ArmnnPreparedModel_1_3<hal_1_3::HalPolicy>> preparedModel(

222

new ArmnnPreparedModel_1_3<hal_1_3::HalPolicy>(

netId,

runtime.get(),

model,

options.GetRequestInputsAndOutputsDumpDir(),

Narumol Prangnawarat

cad4e91

2020-06-02 12:07:43 +0100

[diff] [blame]

227

options.IsGpuProfilingEnabled(),

228

priority));

Kevin May

42477c1

2020-03-26 13:34:14 +0000

[diff] [blame]

229

230

// Run a single 'dummy' inference of the model. This means that CL kernels will get compiled (and tuned if

231

// this is enabled) before the first 'real' inference which removes the overhead of the first inference.

232

if (!preparedModel->ExecuteWithDummyInputs())

233

{

234

return FailPrepareModel(V1_3::ErrorStatus::GENERAL_FAILURE, "Network could not be executed", cb);

235

}

236

237

if (clTunedParameters &&

238

options.GetClTunedParametersMode() == armnn::IGpuAccTunedParameters::Mode::UpdateTunedParameters)

239

{

240

// Now that we've done one inference the CL kernel parameters will have been tuned, so save the updated file.

241

try

242

{

243

clTunedParameters->Save(options.GetClTunedParametersFile().c_str());

244

}

245

catch (std::exception& error)

246

{

247

ALOGE("ArmnnDriverImpl::prepareModel: Failed to save CL tuned parameters file '%s': %s",

248

options.GetClTunedParametersFile().c_str(), error.what());

}

}

NotifyCallbackAndCheck(cb, V1_3::ErrorStatus::NONE, preparedModel.release());

253

254

return V1_3::ErrorStatus::NONE;

255

}

256

257

Return<void> ArmnnDriverImpl::getCapabilities_1_3(const armnn::IRuntimePtr& runtime,

258

V1_3::IDevice::getCapabilities_1_3_cb cb)

259

{

260

ALOGV("hal_1_3::ArmnnDriverImpl::getCapabilities()");

261

262

V1_3::Capabilities capabilities;

263

264

float defaultValue = .1f;

if (runtime)

{

capabilities.relaxedFloat32toFloat16PerformanceScalar.execTime =

269

ParseSystemProperty(g_RelaxedFloat32toFloat16PerformanceExecTime, defaultValue);

270

Kevin May

2eaa119

2020-04-15 16:50:57 +0100

[diff] [blame]

271

capabilities.relaxedFloat32toFloat16PerformanceScalar.powerUsage =

272

ParseSystemProperty(g_RelaxedFloat32toFloat16PerformancePowerUsage, defaultValue);

273

274

capabilities.relaxedFloat32toFloat16PerformanceTensor.execTime =

275

ParseSystemProperty(g_RelaxedFloat32toFloat16PerformanceExecTime, defaultValue);

276

Kevin May

42477c1

2020-03-26 13:34:14 +0000

[diff] [blame]

277

capabilities.relaxedFloat32toFloat16PerformanceTensor.powerUsage =

278

ParseSystemProperty(g_RelaxedFloat32toFloat16PerformancePowerUsage, defaultValue);

279

Kevin May

2eaa119

2020-04-15 16:50:57 +0100

[diff] [blame]

280

capabilities.ifPerformance.execTime =

281

ParseSystemProperty(g_ifPerformanceExecTime, defaultValue);

282

283

capabilities.ifPerformance.powerUsage =

284

ParseSystemProperty(g_ifPerformancePowerUsage, defaultValue);

285

286

capabilities.whilePerformance.execTime =

287

ParseSystemProperty(g_whilePerformanceExecTime, defaultValue);

288

289

capabilities.whilePerformance.powerUsage =

290

ParseSystemProperty(g_whilePerformancePowerUsage, defaultValue);

291

Kevin May

42477c1

2020-03-26 13:34:14 +0000

[diff] [blame]

292

// Set the base value for all operand types

293

capabilities.operandPerformance = nonExtensionOperandPerformance<HalVersion::V1_3>({FLT_MAX, FLT_MAX});

294

295

// Load supported operand types

296

update(&capabilities.operandPerformance, V1_3::OperandType::TENSOR_FLOAT32,

297

{

298

.execTime = ParseSystemProperty(g_OperandTypeTensorFloat32PerformanceExecTime, defaultValue),

299

.powerUsage = ParseSystemProperty(g_OperandTypeTensorFloat32PerformancePowerUsage, defaultValue)

300

});

301

302

update(&capabilities.operandPerformance, V1_3::OperandType::FLOAT32,

303

{

304

.execTime = ParseSystemProperty(g_OperandTypeFloat32PerformanceExecTime, defaultValue),

305

.powerUsage = ParseSystemProperty(g_OperandTypeFloat32PerformancePowerUsage, defaultValue)

306

});

307

308

update(&capabilities.operandPerformance, V1_3::OperandType::TENSOR_FLOAT16,

309

{

310

.execTime = ParseSystemProperty(g_OperandTypeTensorFloat16PerformanceExecTime, defaultValue),

311

.powerUsage = ParseSystemProperty(g_OperandTypeTensorFloat16PerformancePowerUsage, defaultValue)

312

});

313

314

update(&capabilities.operandPerformance, V1_3::OperandType::FLOAT16,

315

{

316

.execTime = ParseSystemProperty(g_OperandTypeFloat16PerformanceExecTime, defaultValue),

317

.powerUsage = ParseSystemProperty(g_OperandTypeFloat16PerformancePowerUsage, defaultValue)

318

});

319

320

update(&capabilities.operandPerformance, V1_3::OperandType::TENSOR_QUANT8_ASYMM,

321

{

322

.execTime = ParseSystemProperty(g_OperandTypeTensorQuant8AsymmPerformanceExecTime, defaultValue),

323

.powerUsage = ParseSystemProperty(g_OperandTypeTensorQuant8AsymmPerformancePowerUsage, defaultValue)

324

});

325

326

update(&capabilities.operandPerformance, V1_3::OperandType::TENSOR_QUANT8_SYMM,

327

{

328

.execTime = ParseSystemProperty(g_OperandTypeTensorQuant8SymmPerformanceExecTime, defaultValue),

329

.powerUsage = ParseSystemProperty(g_OperandTypeTensorQuant8SymmPerformancePowerUsage, defaultValue)

330

});

331

update(&capabilities.operandPerformance, V1_3::OperandType::TENSOR_QUANT8_ASYMM_SIGNED,

332

{

333

.execTime = ParseSystemProperty(g_OperandTypeTensorQuant8AsymmSignedPerformanceExecTime,

334

defaultValue),

335

.powerUsage = ParseSystemProperty(g_OperandTypeTensorQuant8AsymmSignedPerformancePowerUsage,

defaultValue)

});

update(&capabilities.operandPerformance, V1_3::OperandType::TENSOR_QUANT16_SYMM,

340

{

341

.execTime = ParseSystemProperty(g_OperandTypeTensorQuant16SymmPerformanceExecTime, defaultValue),

342

.powerUsage = ParseSystemProperty(g_OperandTypeTensorQuant16SymmPerformancePowerUsage, defaultValue)

343

});

344

345

update(&capabilities.operandPerformance, V1_3::OperandType::TENSOR_QUANT8_SYMM_PER_CHANNEL,

346

{

347

.execTime =

348

ParseSystemProperty(g_OperandTypeTensorQuant8SymmPerChannelPerformanceExecTime, defaultValue),

349

.powerUsage =

350

ParseSystemProperty(g_OperandTypeTensorQuant8SymmPerChannelPerformancePowerUsage, defaultValue)

351

});

352

353

update(&capabilities.operandPerformance, V1_3::OperandType::TENSOR_INT32,

354

{

355

.execTime = ParseSystemProperty(g_OperandTypeTensorInt32PerformanceExecTime, defaultValue),

356

.powerUsage = ParseSystemProperty(g_OperandTypeTensorInt32PerformancePowerUsage, defaultValue)

357

});

358

359

update(&capabilities.operandPerformance, V1_3::OperandType::INT32,

360

{

361

.execTime = ParseSystemProperty(g_OperandTypeInt32PerformanceExecTime, defaultValue),

362

.powerUsage = ParseSystemProperty(g_OperandTypeInt32PerformancePowerUsage, defaultValue)

363

});

364

365

cb(V1_3::ErrorStatus::NONE, capabilities);

366

}

367

else

368

{

Kevin May

2eaa119

2020-04-15 16:50:57 +0100

[diff] [blame]

369

capabilities.relaxedFloat32toFloat16PerformanceScalar.execTime = 0;

370

capabilities.relaxedFloat32toFloat16PerformanceScalar.powerUsage = 0;

371

capabilities.relaxedFloat32toFloat16PerformanceTensor.execTime = 0;

372

capabilities.relaxedFloat32toFloat16PerformanceTensor.powerUsage = 0;

373

capabilities.ifPerformance.execTime = 0;

374

capabilities.ifPerformance.powerUsage = 0;

375

capabilities.whilePerformance.execTime = 0;

376

capabilities.whilePerformance.powerUsage = 0;

Kevin May

42477c1

2020-03-26 13:34:14 +0000

[diff] [blame]

377

378

// Set the base value for all operand types

379

capabilities.operandPerformance = nonExtensionOperandPerformance<HalVersion::V1_3>({0.f, 0.0f});

380

381

cb(V1_3::ErrorStatus::DEVICE_UNAVAILABLE, capabilities);

}

return Void();

}

} // namespace hal_1_3

388

} // namespace armnn_driver