Blame - ArmnnPreparedModel.cpp - ml/android-nn-driver

2018-03-09 13:51:08 +0000

[diff] [blame]

1

//

2

David Beck

93e4898

2018-09-05 13:05:09 +0100

[diff] [blame]

3

// SPDX-License-Identifier: MIT

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

4

//

5

6

#define LOG_TAG "ArmnnDriver"

7

8

#include "ArmnnPreparedModel.hpp"

9

#include "Utils.hpp"

10

11

#include <boost/format.hpp>

12

#include <log/log.h>

13

#include <OperationsUtils.h>

14

Mike Kelly

b5fdf38

2019-06-11 16:35:25 +0100

[diff] [blame]

15

#if defined(ARMNN_ANDROID_P) || defined(ARMNN_ANDROID_Q)

surmeh01

deb3bdb

2018-07-05 12:06:04 +0100

[diff] [blame]

16

// The headers of the ML framework have changed between Android O and Android P.

17

// The validation functions have been moved into their own header, ValidateHal.h.

18

#include <ValidateHal.h>

19

#endif

20

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

#include <cassert>

#include <cinttypes>

using namespace android;

namespace

{

using namespace armnn_driver;

29

Matthew Bentham

9e80cd2

2019-05-03 22:54:36 +0100

[diff] [blame]

30

// Sends errorStatus to the HIDL execution callback and logs an error if the notification
// itself does not report success. callingFunction is only used to label that log line.
void NotifyCallbackAndCheck(const ::android::sp<V1_0::IExecutionCallback>& callback, ErrorStatus errorStatus,
                            std::string callingFunction)
{
    Return<void> notifyResult = callback->notify(errorStatus);

    // The result must be inspected: an unchecked failed callback would bring down the service.
    if (notifyResult.isOk())
    {
        return;
    }

    ALOGE("ArmnnDriver::%s: hidl callback failed to return properly: %s",
          callingFunction.c_str(), notifyResult.description().c_str());
}

// Checks that the dimensions carried by a request argument agree with the tensor info
// the network expects for it.
//
// requestArg  Request argument whose `dimensions` are checked.
// tensorInfo  Expected tensor description (rank and shape).
//
// Returns true when the argument specifies no dimensions at all, or when both the number of
// dimensions and every individual dimension match tensorInfo. Returns false (after logging the
// mismatch) otherwise.
bool ValidateRequestArgument(const RequestArgument& requestArg, const armnn::TensorInfo& tensorInfo)
{
    // An argument without explicit dimensions is accepted as-is.
    if (requestArg.dimensions.size() == 0)
    {
        return true;
    }

    const unsigned int expectedNumDimensions = tensorInfo.GetNumDimensions();
    if (requestArg.dimensions.size() != expectedNumDimensions)
    {
        ALOGE("Mismatched dimensions (request argument: %zu, expected: %u)",
              requestArg.dimensions.size(), expectedNumDimensions);
        return false;
    }

    for (unsigned int d = 0; d < expectedNumDimensions; ++d)
    {
        if (requestArg.dimensions[d] != tensorInfo.GetShape()[d])
        {
            // d is unsigned, so it is printed with %u.
            ALOGE("Mismatched size for dimension %u (request argument: %u, expected %u)",
                  d, requestArg.dimensions[d], tensorInfo.GetShape()[d]);
            return false;
        }
    }

    return true;
}

// Builds the armnn::Tensor for one request argument.
//
// When ValidateRequestArgument accepts the argument, the tensor is created from tensorInfo and the
// memory that GetMemoryFromPool resolves for requestArg.location within requestPools. Otherwise a
// default-constructed armnn::Tensor is returned.
armnn::Tensor GetTensorForRequestArgument(const RequestArgument& requestArg,
                                          const armnn::TensorInfo& tensorInfo,
                                          const std::vector<::android::nn::RunTimePoolInfo>& requestPools)
{
    const bool argumentIsValid = ValidateRequestArgument(requestArg, tensorInfo);

    return argumentIsValid
        ? armnn::Tensor(tensorInfo, GetMemoryFromPool(requestArg.location, requestPools))
        : armnn::Tensor();
}

78

79

// Produces a tensor name by appending the decimal representation of index to tensorNamePrefix.
inline std::string BuildTensorName(const char* tensorNamePrefix, std::size_t index)
{
    std::string tensorName(tensorNamePrefix);
    tensorName += std::to_string(index);
    return tensorName;
}

83

Matteo Martincigh

2018-09-03 13:50:50 +0100

[diff] [blame]

84

} // anonymous namespace

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

85

telsoa01

2018-08-31 09:31:35 +0100

[diff] [blame]

86

using namespace android::hardware;

87

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

88

namespace armnn_driver

89

{

Matteo Martincigh

2018-09-03 13:50:50 +0100

[diff] [blame]

90

template<typename HalVersion>

Mike Kelly

2019-07-22 14:06:00 +0100

[diff] [blame]

91

RequestThread<ArmnnPreparedModel, HalVersion, ArmnnCallback_1_0> ArmnnPreparedModel<HalVersion>::m_RequestThread;

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

92

Matteo Martincigh

2018-09-03 13:50:50 +0100

[diff] [blame]

93

template<typename HalVersion>

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

94

template <typename TensorBindingCollection>

Matteo Martincigh

2018-09-03 13:50:50 +0100

[diff] [blame]

95

void ArmnnPreparedModel<HalVersion>::DumpTensorsIfRequired(char const* tensorNamePrefix,

96

const TensorBindingCollection& tensorBindings)

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

97

{

98

if (!m_RequestInputsAndOutputsDumpDir.empty())

99

{

100

const std::string requestName = boost::str(boost::format("%1%_%2%.dump") % m_NetworkId % m_RequestCount);

101

for (std::size_t i = 0u; i < tensorBindings.size(); ++i)

102

{

103

DumpTensor(m_RequestInputsAndOutputsDumpDir,

104

requestName,

105

BuildTensorName(tensorNamePrefix, i),

106

tensorBindings[i].second);

}

}

}

Matteo Martincigh

2018-09-03 13:50:50 +0100

[diff] [blame]

111

template<typename HalVersion>

112

ArmnnPreparedModel<HalVersion>::ArmnnPreparedModel(armnn::NetworkId networkId,

113

armnn::IRuntime* runtime,

114

const HalModel& model,

115

const std::string& requestInputsAndOutputsDumpDir,

116

const bool gpuProfilingEnabled)

telsoa01

2018-08-31 09:31:35 +0100

[diff] [blame]

117

: m_NetworkId(networkId)

, m_Runtime(runtime)

, m_Model(model)

, m_RequestCount(0)

, m_RequestInputsAndOutputsDumpDir(requestInputsAndOutputsDumpDir)

122

, m_GpuProfilingEnabled(gpuProfilingEnabled)

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

123

{

telsoa01

2018-08-31 09:31:35 +0100

[diff] [blame]

124

// Enable profiling if required.

125

m_Runtime->GetProfiler(m_NetworkId)->EnableProfiling(m_GpuProfilingEnabled);

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

126

}

127

Matteo Martincigh

2018-09-03 13:50:50 +0100

[diff] [blame]

128

template<typename HalVersion>

129

ArmnnPreparedModel<HalVersion>::~ArmnnPreparedModel()

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

130

{

telsoa01

2018-08-31 09:31:35 +0100

[diff] [blame]

131

// Get a hold of the profiler used by this model.

132

std::shared_ptr<armnn::IProfiler> profiler = m_Runtime->GetProfiler(m_NetworkId);

133

134

// Unload the network associated with this model.

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

135

m_Runtime->UnloadNetwork(m_NetworkId);

telsoa01

2018-08-31 09:31:35 +0100

[diff] [blame]

136

137

// Dump the profiling info to a file if required.

138

DumpJsonProfilingIfRequired(m_GpuProfilingEnabled, m_RequestInputsAndOutputsDumpDir, m_NetworkId, profiler.get());

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

139

}

140

Matteo Martincigh

2018-09-03 13:50:50 +0100

[diff] [blame]

141

template<typename HalVersion>

142

Return<ErrorStatus> ArmnnPreparedModel<HalVersion>::execute(const Request& request,

Matthew Bentham

9e80cd2

2019-05-03 22:54:36 +0100

[diff] [blame]

143

const ::android::sp<V1_0::IExecutionCallback>& callback)

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

144

{

145

ALOGV("ArmnnPreparedModel::execute(): %s", GetModelSummary(m_Model).c_str());

146

m_RequestCount++;

147

148

if (callback.get() == nullptr) {

149

ALOGE("ArmnnPreparedModel::execute invalid callback passed");

150

return ErrorStatus::INVALID_ARGUMENT;

151

}

152

153

if (!android::nn::validateRequest(request, m_Model))

154

{

155

NotifyCallbackAndCheck(callback, ErrorStatus::INVALID_ARGUMENT, "ArmnnPreparedModel::execute");

156

return ErrorStatus::INVALID_ARGUMENT;

157

}

158

159

if (!m_RequestInputsAndOutputsDumpDir.empty())

160

{

161

ALOGD("Dumping inputs and outputs for request %" PRIuPTR, reinterpret_cast<std::uintptr_t>(callback.get()));

162

}

163

164

// allocate the tensors on the heap, as they are passed to the request thread

165

auto pInputTensors = std::make_shared<armnn::InputTensors>();

166

auto pOutputTensors = std::make_shared<armnn::OutputTensors>();

167

168

// map the memory pool into shared pointers

169

// use a shared memory pools vector on the heap, as it is passed to the request thread

170

auto pMemPools = std::make_shared<std::vector<android::nn::RunTimePoolInfo>>();

171

if (!setRunTimePoolInfosFromHidlMemories(pMemPools.get(), request.pools))

172

{

173

NotifyCallbackAndCheck(callback, ErrorStatus::GENERAL_FAILURE, "ArmnnPreparedModel::execute");

174

return ErrorStatus::GENERAL_FAILURE;

175

}

176

177

// add the inputs and outputs with their data

178

try

179

{

180

pInputTensors->reserve(request.inputs.size());

181

for (unsigned int i = 0; i < request.inputs.size(); i++)

182

{

183

const auto& inputArg = request.inputs[i];

184

185

const armnn::TensorInfo inputTensorInfo = m_Runtime->GetInputTensorInfo(m_NetworkId, i);

186

const armnn::Tensor inputTensor = GetTensorForRequestArgument(inputArg, inputTensorInfo, *pMemPools);

187

if (inputTensor.GetMemoryArea() == nullptr)

188

{

189

ALOGE("Cannot execute request. Error converting request input %u to tensor", i);

190

return ErrorStatus::GENERAL_FAILURE;

191

}

192

193

pInputTensors->emplace_back(i, inputTensor);

194

}

195

196

pOutputTensors->reserve(request.outputs.size());

197

for (unsigned int i = 0; i < request.outputs.size(); i++)

198

{

199

const auto& outputArg = request.outputs[i];

200

201

const armnn::TensorInfo outputTensorInfo = m_Runtime->GetOutputTensorInfo(m_NetworkId, i);

202

const armnn::Tensor outputTensor = GetTensorForRequestArgument(outputArg, outputTensorInfo, *pMemPools);

203

if (outputTensor.GetMemoryArea() == nullptr)

204

{

205

ALOGE("Cannot execute request. Error converting request output %u to tensor", i);

206

return ErrorStatus::GENERAL_FAILURE;

207

}

208

209

pOutputTensors->emplace_back(i, outputTensor);

210

}

211

}

Mike Kelly

2019-12-11 19:27:11 +0000

[diff] [blame]

212

catch (std::exception& e)

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

213

{

Mike Kelly

2019-12-11 19:27:11 +0000

[diff] [blame]

214

ALOGW("Exception caught while preparing for EnqueueWorkload: %s", e.what());

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

215

NotifyCallbackAndCheck(callback, ErrorStatus::GENERAL_FAILURE, "ArmnnPreparedModel::execute");

216

return ErrorStatus::GENERAL_FAILURE;

217

}

218

219

ALOGV("ArmnnPreparedModel::execute(...) before PostMsg");

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

220

Mike Kelly

2019-07-22 14:06:00 +0100

[diff] [blame]

221

auto cb = [callback](ErrorStatus errorStatus, std::string callingFunction)

222

{

223

NotifyCallbackAndCheck(callback, errorStatus, callingFunction);

224

};

225

226

ArmnnCallback_1_0 armnnCb;

227

armnnCb.callback = cb;

228

// post the request for asynchronous execution

229

m_RequestThread.PostMsg(this, pMemPools, pInputTensors, pOutputTensors, armnnCb);

230

ALOGV("ArmnnPreparedModel::execute(...) after PostMsg");

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

231

return ErrorStatus::NONE; // successfully queued

232

}

233

Matteo Martincigh

2018-09-03 13:50:50 +0100

[diff] [blame]

234

template<typename HalVersion>

235

void ArmnnPreparedModel<HalVersion>::ExecuteGraph(

236

std::shared_ptr<std::vector<::android::nn::RunTimePoolInfo>>& pMemPools,

237

std::shared_ptr<armnn::InputTensors>& pInputTensors,

238

std::shared_ptr<armnn::OutputTensors>& pOutputTensors,

Mike Kelly

2019-07-22 14:06:00 +0100

[diff] [blame]

239

ArmnnCallback_1_0 cb)

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

240

{

241

ALOGV("ArmnnPreparedModel::ExecuteGraph(...)");

242

243

DumpTensorsIfRequired("Input", *pInputTensors);

// run it

try

{

Matthew Bentham

2019-04-01 17:17:58 +0100

[diff] [blame]

248

armnn::Status status = m_Runtime->EnqueueWorkload(m_NetworkId, *pInputTensors, *pOutputTensors);

249

if (status != armnn::Status::Success)

250

{

251

ALOGW("EnqueueWorkload failed");

Mike Kelly

2019-07-22 14:06:00 +0100

[diff] [blame]

252

cb.callback(ErrorStatus::GENERAL_FAILURE, "ArmnnPreparedModel::ExecuteGraph");

Matthew Bentham

2019-04-01 17:17:58 +0100

[diff] [blame]

253

return;

254

}

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

255

}

Mike Kelly

2019-12-11 19:27:11 +0000

[diff] [blame]

256

catch (std::exception& e)

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

257

{

Mike Kelly

2019-12-11 19:27:11 +0000

[diff] [blame]

258

ALOGW("Exception caught from EnqueueWorkload: %s", e.what());

Mike Kelly

2019-07-22 14:06:00 +0100

[diff] [blame]

259

cb.callback(ErrorStatus::GENERAL_FAILURE, "ArmnnPreparedModel::ExecuteGraph");

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

return;

}

DumpTensorsIfRequired("Output", *pOutputTensors);

264

265

// Commit output buffers.

266

// Note that we update *all* pools, even if they aren't actually used as outputs -

267

// this is simpler and is what the CpuExecutor does.

268

for (android::nn::RunTimePoolInfo& pool : *pMemPools)

{

pool.update();

}

Mike Kelly

2019-07-22 14:06:00 +0100

[diff] [blame]

273

cb.callback(ErrorStatus::NONE, "ExecuteGraph");

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

274

}

275

Matteo Martincigh

2018-09-03 13:50:50 +0100

[diff] [blame]

276

template<typename HalVersion>

Matthew Bentham

2019-04-01 17:17:58 +0100

[diff] [blame]

277

bool ArmnnPreparedModel<HalVersion>::ExecuteWithDummyInputs()

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

278

{

279

std::vector<std::vector<char>> storage;

280

armnn::InputTensors inputTensors;

281

for (unsigned int i = 0; i < m_Model.inputIndexes.size(); i++)

282

{

283

const armnn::TensorInfo inputTensorInfo = m_Runtime->GetInputTensorInfo(m_NetworkId, i);

284

storage.emplace_back(inputTensorInfo.GetNumBytes());

285

const armnn::ConstTensor inputTensor(inputTensorInfo, storage.back().data());

286

287

inputTensors.emplace_back(i, inputTensor);

288

}

289

290

armnn::OutputTensors outputTensors;

291

for (unsigned int i = 0; i < m_Model.outputIndexes.size(); i++)

292

{

293

const armnn::TensorInfo outputTensorInfo = m_Runtime->GetOutputTensorInfo(m_NetworkId, i);

294

storage.emplace_back(outputTensorInfo.GetNumBytes());

295

const armnn::Tensor outputTensor(outputTensorInfo, storage.back().data());

296

297

outputTensors.emplace_back(i, outputTensor);

}

try

{

Matthew Bentham

2019-04-01 17:17:58 +0100

[diff] [blame]

302

armnn::Status status = m_Runtime->EnqueueWorkload(m_NetworkId, inputTensors, outputTensors);

303

if (status != armnn::Status::Success)

304

{

305

ALOGW("ExecuteWithDummyInputs: EnqueueWorkload failed");

306

return false;

307

}

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

308

}

Mike Kelly

2019-12-11 19:27:11 +0000

[diff] [blame]

309

catch (std::exception& e)

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

310

{

Mike Kelly

2019-12-11 19:27:11 +0000

[diff] [blame]

311

ALOGW("ExecuteWithDummyInputs: Exception caught from EnqueueWorkload: %s", e.what());

Matthew Bentham

2019-04-01 17:17:58 +0100

[diff] [blame]

312

return false;

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

313

}

Matthew Bentham

2019-04-01 17:17:58 +0100

[diff] [blame]

314

return true;

telsoa01

2018-03-09 13:51:08 +0000

[diff] [blame]

315

}

316

arovir01

b0717b5

2018-09-05 17:03:25 +0100

[diff] [blame]

317

///

318

/// Explicit class template instantiations

319

///

Matteo Martincigh

2018-09-03 13:50:50 +0100

[diff] [blame]

320

arovir01

b0717b5

2018-09-05 17:03:25 +0100

[diff] [blame]

321

// Explicitly instantiate ArmnnPreparedModel for the HAL 1.0 policy.
template class ArmnnPreparedModel<hal_1_0::HalPolicy>;

322

Matteo Martincigh

8b287c2

2018-09-07 09:25:10 +0100

[diff] [blame]

323

#ifdef ARMNN_ANDROID_NN_V1_1

arovir01

b0717b5

2018-09-05 17:03:25 +0100

[diff] [blame]

324

template class ArmnnPreparedModel<hal_1_1::HalPolicy>;

Matteo Martincigh