//
// Copyright © 2017 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//

#include "NetworkExecutionUtils/NetworkExecutionUtils.hpp"
#include "ExecuteNetworkProgramOptions.hpp"
#include <armnn/IAsyncExecutionCallback.hpp>
#include <AsyncExecutionCallback.hpp>

#include <armnn/Logging.hpp>
#include <armnnUtils/Filesystem.hpp>
#include <armnnUtils/TContainer.hpp>
#include <InferenceTest.hpp>
#include <Half.hpp>

#if defined(ARMNN_SERIALIZER)
#include "armnnDeserializer/IDeserializer.hpp"
#endif
#if defined(ARMNN_TF_LITE_PARSER)
#include "armnnTfLiteParser/ITfLiteParser.hpp"
#endif
#if defined(ARMNN_ONNX_PARSER)
#include "armnnOnnxParser/IOnnxParser.hpp"
#endif
#if defined(ARMNN_TFLITE_DELEGATE)
#include <armnn_delegate.hpp>
#include <DelegateOptions.hpp>

#include <tensorflow/lite/builtin_ops.h>
#include <tensorflow/lite/c/builtin_op_data.h>
#include <tensorflow/lite/c/common.h>
#include <tensorflow/lite/optional_debug_tools.h>
#include <tensorflow/lite/kernels/builtin_op_kernels.h>
#include <tensorflow/lite/interpreter.h>
#include <tensorflow/lite/kernels/register.h>
#endif

#include <future>

/**
 * Given a measured duration and a threshold time, tell the user whether we succeeded or not.
 *
 * @param duration the measured inference duration.
 * @param thresholdTime the threshold time in milliseconds.
 * @return false if the measured time exceeded the threshold.
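 *
 * Example: a measured duration of 12.5 ms against a threshold of 10.0 ms logs a fatal
 * message and returns false; with the default threshold of 0.0 the check is skipped.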
 */
bool CheckInferenceTimeThreshold(const std::chrono::duration<double, std::milli>& duration,
                                 const double& thresholdTime)
{
    ARMNN_LOG(info) << "\nInference time: " << std::setprecision(2)
                    << std::fixed << duration.count() << " ms\n";
    // If thresholdTime == 0.0 (default), then it hasn't been supplied at command line
    if (thresholdTime != 0.0)
    {
        ARMNN_LOG(info) << "Threshold time: " << std::setprecision(2)
                        << std::fixed << thresholdTime << " ms";
        auto thresholdMinusInference = thresholdTime - duration.count();
        ARMNN_LOG(info) << "Threshold time - Inference time: " << std::setprecision(2)
                        << std::fixed << thresholdMinusInference << " ms" << "\n";
        if (thresholdMinusInference < 0)
        {
            std::string errorMessage = "Elapsed inference time is greater than provided threshold time.";
            ARMNN_LOG(fatal) << errorMessage;
            return false;
        }
    }
    return true;
}

#if defined(ARMNN_TFLITE_DELEGATE)
int TfLiteDelegateMainImpl(const ExecuteNetworkParams& params, const armnn::IRuntime::CreationOptions runtimeOptions)
{
    using namespace tflite;

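    // Standard TfLite set-up: load the flatbuffer model from disk, build an interpreter
    // around the builtin op resolver, and allocate tensors before any delegate is applied.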
    std::unique_ptr<tflite::FlatBufferModel> model = tflite::FlatBufferModel::BuildFromFile(params.m_ModelPath.c_str());

    auto tfLiteInterpreter = std::make_unique<Interpreter>();
    tflite::ops::builtin::BuiltinOpResolver resolver;

    tflite::InterpreterBuilder builder(*model, resolver);
    builder(&tfLiteInterpreter);
    tfLiteInterpreter->AllocateTensors();

    int status = 0;
    if (params.m_TfLiteExecutor == ExecuteNetworkParams::TfLiteExecutor::ArmNNTfLiteDelegate)
    {
        // Create the Armnn Delegate
        // Populate a DelegateOptions from the ExecuteNetworkParams.
        armnnDelegate::DelegateOptions delegateOptions = params.ToDelegateOptions();
        delegateOptions.SetExternalProfilingParams(runtimeOptions.m_ProfilingOptions);

        std::unique_ptr<TfLiteDelegate, decltype(&armnnDelegate::TfLiteArmnnDelegateDelete)>
            theArmnnDelegate(armnnDelegate::TfLiteArmnnDelegateCreate(delegateOptions),
                             armnnDelegate::TfLiteArmnnDelegateDelete);
        // Register armnn_delegate to TfLiteInterpreter
        status = tfLiteInterpreter->ModifyGraphWithDelegate(std::move(theArmnnDelegate));
        if (status == kTfLiteError)
        {
            ARMNN_LOG(fatal) << "Could not register ArmNN TfLite Delegate to TfLiteInterpreter!";
            return EXIT_FAILURE;
        }
    }
    else
    {
        std::cout << "Running on TfLite without ArmNN delegate\n";
    }

    armnn::Optional<std::string> dataFile = params.m_GenerateTensorData
                                            ? armnn::EmptyOptional()
                                            : armnn::MakeOptional<std::string>(params.m_InputTensorDataFilePaths[0]);

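    // When tensor data generation is requested the inputs are filled with generated
    // values; otherwise the first input-tensor-data file supplies the data for every
    // input of this model.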
    const size_t numInputs = params.m_InputNames.size();

    for (unsigned int inputIndex = 0; inputIndex < numInputs; ++inputIndex)
    {
        int input = tfLiteInterpreter->inputs()[inputIndex];
        TfLiteIntArray* inputDims = tfLiteInterpreter->tensor(input)->dims;

        unsigned int inputSize = 1;
        if (params.m_InputTensorShapes.size() > 0)
        {
            inputSize = params.m_InputTensorShapes[inputIndex]->GetNumElements();
        }
        else
        {
            for (unsigned int dim = 0; dim < static_cast<unsigned int>(inputDims->size); ++dim)
            {
                inputSize *= inputDims->data[dim];
            }
        }

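        // Populate the input tensor according to its declared input type. Each branch
        // fetches the raw buffer via typed_tensor<>() and fills it from the data file
        // (or with generated data) using the matching string-to-value conversion.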
        if (params.m_InputTypes[inputIndex].compare("float") == 0)
        {
            auto inputData = tfLiteInterpreter->typed_tensor<float>(input);

            if (inputData == nullptr)
            {
                ARMNN_LOG(fatal) << "Input tensor is null, input type: "
                                    "\"" << params.m_InputTypes[inputIndex] << "\" may be incorrect.";
                return EXIT_FAILURE;
            }

            std::vector<float> tensorData;
            PopulateTensorWithDataGeneric<float>(tensorData,
                                                 inputSize,
                                                 dataFile,
                                                 [](const std::string& s)
                                                 { return std::stof(s); });

            std::copy(tensorData.begin(), tensorData.end(), inputData);
        }
        else if (params.m_InputTypes[inputIndex].compare("qsymms8") == 0)
        {
            auto inputData = tfLiteInterpreter->typed_tensor<int8_t>(input);

            if (inputData == nullptr)
            {
                ARMNN_LOG(fatal) << "Input tensor is null, input type: "
                                    "\"" << params.m_InputTypes[inputIndex] << "\" may be incorrect.";
                return EXIT_FAILURE;
            }

            std::vector<int8_t> tensorData;
            PopulateTensorWithDataGeneric<int8_t>(tensorData,
                                                  inputSize,
                                                  dataFile,
                                                  [](const std::string& s)
                                                  { return armnn::numeric_cast<int8_t>(std::stoi(s)); });

            std::copy(tensorData.begin(), tensorData.end(), inputData);
        }
        else if (params.m_InputTypes[inputIndex].compare("int") == 0)
        {
            auto inputData = tfLiteInterpreter->typed_tensor<int32_t>(input);

            if (inputData == nullptr)
            {
                ARMNN_LOG(fatal) << "Input tensor is null, input type: "
                                    "\"" << params.m_InputTypes[inputIndex] << "\" may be incorrect.";
                return EXIT_FAILURE;
            }

            std::vector<int32_t> tensorData;
            PopulateTensorWithDataGeneric<int32_t>(tensorData,
                                                   inputSize,
                                                   dataFile,
                                                   [](const std::string& s)
                                                   { return std::stoi(s); });

            std::copy(tensorData.begin(), tensorData.end(), inputData);
        }
        else if (params.m_InputTypes[inputIndex].compare("qasymm8") == 0 ||
                 params.m_InputTypes[inputIndex].compare("qasymmu8") == 0)
        {
            auto inputData = tfLiteInterpreter->typed_tensor<uint8_t>(input);

            if (inputData == nullptr)
            {
                ARMNN_LOG(fatal) << "Input tensor is null, input type: "
                                    "\"" << params.m_InputTypes[inputIndex] << "\" may be incorrect.";
                return EXIT_FAILURE;
            }

            std::vector<uint8_t> tensorData;
            PopulateTensorWithDataGeneric<uint8_t>(tensorData,
                                                   inputSize,
                                                   dataFile,
                                                   [](const std::string& s)
                                                   { return armnn::numeric_cast<uint8_t>(std::stoi(s)); });

            std::copy(tensorData.begin(), tensorData.end(), inputData);
        }
        else if (params.m_InputTypes[inputIndex].compare("qasymms8") == 0)
        {
            auto inputData = tfLiteInterpreter->typed_tensor<int8_t>(input);

            if (inputData == nullptr)
            {
                ARMNN_LOG(fatal) << "Input tensor is null, input type: "
                                    "\"" << params.m_InputTypes[inputIndex] << "\" may be incorrect.";
                return EXIT_FAILURE;
            }

            std::vector<int8_t> tensorData;
            PopulateTensorWithDataGeneric<int8_t>(tensorData,
                                                  inputSize,
                                                  dataFile,
                                                  [](const std::string& s)
                                                  { return armnn::numeric_cast<int8_t>(std::stoi(s)); });

            std::copy(tensorData.begin(), tensorData.end(), inputData);
        }
        else
        {
            ARMNN_LOG(fatal) << "Unsupported input tensor data type \"" << params.m_InputTypes[inputIndex] << "\". ";
            return EXIT_FAILURE;
        }
    }

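    // Execute the interpreter once per requested iteration, timing each Invoke() call
    // and checking it against the optional threshold after the outputs are printed.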
    for (size_t x = 0; x < params.m_Iterations; x++)
    {
        // Start timer to record inference time in milliseconds.
        const auto start_time = armnn::GetTimeNow();
        // Run the inference
        status = tfLiteInterpreter->Invoke();
        const auto duration = armnn::GetTimeDuration(start_time);

        // Print out the output
        for (unsigned int outputIndex = 0; outputIndex < params.m_OutputNames.size(); ++outputIndex)
        {
            auto tfLiteDelegateOutputId = tfLiteInterpreter->outputs()[outputIndex];
            TfLiteIntArray* outputDims = tfLiteInterpreter->tensor(tfLiteDelegateOutputId)->dims;
            // If we've been asked to write to a file then set a file output stream. Otherwise use stdout.
            FILE* outputTensorFile = stdout;
            if (!params.m_OutputTensorFiles.empty())
            {
                outputTensorFile = fopen(params.m_OutputTensorFiles[outputIndex].c_str(), "w");
                if (outputTensorFile == nullptr)
                {
                    ARMNN_LOG(fatal) << "Specified output tensor file, \"" <<
                                     params.m_OutputTensorFiles[outputIndex] <<
                                     "\", cannot be created. Defaulting to stdout. " <<
                                     "Error was: " << std::strerror(errno);
                    outputTensorFile = stdout;
                }
                else
                {
                    ARMNN_LOG(info) << "Writing output " << outputIndex << " of iteration: " << x+1
                                    << " to file: '" << params.m_OutputTensorFiles[outputIndex] << "'";
                }
            }
            long outputSize = 1;
            for (unsigned int dim = 0; dim < static_cast<unsigned int>(outputDims->size); ++dim)
            {
                outputSize *= outputDims->data[dim];
            }

            std::cout << params.m_OutputNames[outputIndex] << ": ";
            if (params.m_OutputTypes[outputIndex].compare("float") == 0)
            {
                auto tfLiteDelegateOutputData = tfLiteInterpreter->typed_tensor<float>(tfLiteDelegateOutputId);
                if (tfLiteDelegateOutputData == nullptr)
                {
                    ARMNN_LOG(fatal) << "Output tensor is null, output type: "
                                        "\"" << params.m_OutputTypes[outputIndex] << "\" may be incorrect.";
                    return EXIT_FAILURE;
                }

                if (!params.m_DontPrintOutputs)
                {
                    for (int i = 0; i < outputSize; ++i)
                    {
                        fprintf(outputTensorFile, "%f ", tfLiteDelegateOutputData[i]);
                    }
                }
            }
            else if (params.m_OutputTypes[outputIndex].compare("int") == 0)
            {
                auto tfLiteDelegateOutputData = tfLiteInterpreter->typed_tensor<int32_t>(tfLiteDelegateOutputId);
                if (tfLiteDelegateOutputData == nullptr)
                {
                    ARMNN_LOG(fatal) << "Output tensor is null, output type: "
                                        "\"" << params.m_OutputTypes[outputIndex] << "\" may be incorrect.";
                    return EXIT_FAILURE;
                }

                if (!params.m_DontPrintOutputs)
                {
                    for (int i = 0; i < outputSize; ++i)
                    {
                        fprintf(outputTensorFile, "%d ", tfLiteDelegateOutputData[i]);
                    }
                }
            }
            else if (params.m_OutputTypes[outputIndex].compare("qsymms8") == 0 ||
                     params.m_OutputTypes[outputIndex].compare("qasymms8") == 0)
            {
                auto tfLiteDelegateOutputData = tfLiteInterpreter->typed_tensor<int8_t>(tfLiteDelegateOutputId);
                if (tfLiteDelegateOutputData == nullptr)
                {
                    ARMNN_LOG(fatal) << "Output tensor is null, output type: "
                                        "\"" << params.m_OutputTypes[outputIndex] << "\" may be incorrect.";
                    return EXIT_FAILURE;
                }

                if (!params.m_DontPrintOutputs)
                {
                    for (int i = 0; i < outputSize; ++i)
                    {
                        fprintf(outputTensorFile, "%d ", tfLiteDelegateOutputData[i]);
                    }
                }
            }
            else if (params.m_OutputTypes[outputIndex].compare("qasymm8") == 0 ||
                     params.m_OutputTypes[outputIndex].compare("qasymmu8") == 0)
            {
                auto tfLiteDelegateOutputData = tfLiteInterpreter->typed_tensor<uint8_t>(tfLiteDelegateOutputId);
                if (tfLiteDelegateOutputData == nullptr)
                {
                    ARMNN_LOG(fatal) << "Output tensor is null, output type: "
                                        "\"" << params.m_OutputTypes[outputIndex] << "\" may be incorrect.";
                    return EXIT_FAILURE;
                }

                if (!params.m_DontPrintOutputs)
                {
                    for (int i = 0; i < outputSize; ++i)
                    {
                        fprintf(outputTensorFile, "%u ", tfLiteDelegateOutputData[i]);
                    }
                }
            }
            else
            {
                ARMNN_LOG(fatal) << "Unsupported output tensor data type \"" << params.m_OutputTypes[outputIndex] <<
                                    "\". Output type can be specified with the -z argument.";
                return EXIT_FAILURE;
            }
            std::cout << std::endl;
        }
        CheckInferenceTimeThreshold(duration, params.m_ThresholdTime);
    }

    return status;
}
#endif
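
// MainImpl builds an InferenceModel from the given model file using TParser (the Arm NN
// deserializer, the TfLite parser or the ONNX parser), populates the input tensors, and
// then runs inference synchronously, via the Arm NN thread pool, or via std::launch::async
// depending on the concurrency options.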
template<typename TParser, typename TDataType>
int MainImpl(const ExecuteNetworkParams& params,
             const std::shared_ptr<armnn::IRuntime>& runtime = nullptr)
{
    using namespace std::chrono;

    std::vector<std::vector<armnnUtils::TContainer>> inputs;
    std::vector<std::vector<armnnUtils::TContainer>> outputs;

    try
    {
        // Creates an InferenceModel, which will parse the model and load it into an IRuntime.
        typename InferenceModel<TParser, TDataType>::Params inferenceModelParams;
        inferenceModelParams.m_ModelPath = params.m_ModelPath;
        inferenceModelParams.m_IsModelBinary = params.m_IsModelBinary;
        inferenceModelParams.m_ComputeDevices = params.m_ComputeDevices;
        inferenceModelParams.m_DynamicBackendsPath = params.m_DynamicBackendsPath;
        inferenceModelParams.m_PrintIntermediateLayers = params.m_PrintIntermediate;
        inferenceModelParams.m_VisualizePostOptimizationModel = params.m_EnableLayerDetails;
        inferenceModelParams.m_ParseUnsupported = params.m_ParseUnsupported;
        inferenceModelParams.m_InferOutputShape = params.m_InferOutputShape;
        inferenceModelParams.m_EnableFastMath = params.m_EnableFastMath;
        inferenceModelParams.m_SaveCachedNetwork = params.m_SaveCachedNetwork;
        inferenceModelParams.m_CachedNetworkFilePath = params.m_CachedNetworkFilePath;
        inferenceModelParams.m_NumberOfThreads = params.m_NumberOfThreads;
        inferenceModelParams.m_MLGOTuningFilePath = params.m_MLGOTuningFilePath;
        inferenceModelParams.m_AsyncEnabled = params.m_Concurrent;
        inferenceModelParams.m_ThreadPoolSize = params.m_ThreadPoolSize;
        inferenceModelParams.m_OutputDetailsToStdOut = params.m_OutputDetailsToStdOut;
        inferenceModelParams.m_OutputDetailsOnlyToStdOut = params.m_OutputDetailsOnlyToStdOut;

        for (const std::string& inputName: params.m_InputNames)
        {
            inferenceModelParams.m_InputBindings.push_back(inputName);
        }

        for (unsigned int i = 0; i < params.m_InputTensorShapes.size(); ++i)
        {
            inferenceModelParams.m_InputShapes.push_back(*params.m_InputTensorShapes[i]);
        }

        for (const std::string& outputName: params.m_OutputNames)
        {
            inferenceModelParams.m_OutputBindings.push_back(outputName);
        }

        inferenceModelParams.m_SubgraphId = params.m_SubgraphId;
        inferenceModelParams.m_EnableFp16TurboMode = params.m_EnableFp16TurboMode;
        inferenceModelParams.m_EnableBf16TurboMode = params.m_EnableBf16TurboMode;

        InferenceModel<TParser, TDataType> model(inferenceModelParams,
                                                 params.m_EnableProfiling,
                                                 params.m_DynamicBackendsPath,
                                                 runtime);

        const size_t numInputs = inferenceModelParams.m_InputBindings.size();

        armnn::Optional<QuantizationParams> qParams = params.m_QuantizeInput ?
                                                      armnn::MakeOptional<QuantizationParams>(
                                                          model.GetInputQuantizationParams()) :
                                                      armnn::EmptyOptional();

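        // When input quantization is requested, the quantization parameters read from the
        // model's input bindings are passed to PopulateTensorWithData so the float input
        // data can be quantized on the fly.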
        if (params.m_InputTensorDataFilePaths.size() > numInputs)
        {
            ARMNN_LOG(info) << "Given network has " << numInputs << " input/s. One input-tensor-data file is required "
                            << "for each input. The user provided "
                            << params.m_InputTensorDataFilePaths.size()
                            << " input-tensor-data file/s which will be used to fill the input/s.\n";
        }

        for (unsigned int j = 0; j < params.m_Iterations; ++j)
        {
            std::vector<armnnUtils::TContainer> inputDataContainers;
            for (unsigned int i = 0; i < numInputs; ++i)
            {
                // If there are fewer input files given than required for the execution of
                // params.m_Iterations we simply start with the first input file again
                size_t inputFileIndex = j * numInputs + i;
                if (!params.m_InputTensorDataFilePaths.empty())
                {
                    inputFileIndex = inputFileIndex % params.m_InputTensorDataFilePaths.size();
                }

                armnn::Optional<std::string> dataFile = params.m_GenerateTensorData ?
                                                        armnn::EmptyOptional() :
                                                        armnn::MakeOptional<std::string>(
                                                            params.m_InputTensorDataFilePaths.at(inputFileIndex));

                unsigned int numElements = model.GetInputSize(i);
                if (params.m_InputTensorShapes.size() > i && params.m_InputTensorShapes[i])
                {
                    // If the user has provided a tensor shape for the current input,
                    // override numElements
                    numElements = params.m_InputTensorShapes[i]->GetNumElements();
                }

                armnnUtils::TContainer tensorData;
                PopulateTensorWithData(tensorData,
                                       numElements,
                                       params.m_InputTypes[i],
                                       qParams,
                                       dataFile);

                inputDataContainers.push_back(tensorData);
            }
            inputs.push_back(inputDataContainers);
        }

        const size_t numOutputs = inferenceModelParams.m_OutputBindings.size();

        // The user is allowed to specify the data type of each output tensor. It is used here to construct the
        // result tensors for each iteration. It is possible for the user to specify a type that does not match
        // the data type of the corresponding model output. It may not make sense, but it is historically allowed.
        // The potential problem here is a buffer overrun when a larger data type is written into the space for a
        // smaller one. Issue a warning to highlight the potential problem.
        for (unsigned int outputIdx = 0; outputIdx < model.GetOutputBindingInfos().size(); ++outputIdx)
        {
            armnn::DataType type = model.GetOutputBindingInfo(outputIdx).second.GetDataType();
            switch (type)
            {
                // --output-type only supports float, float16, int, qasymms8 or qasymmu8.
                case armnn::DataType::Float32:
                    if (params.m_OutputTypes[outputIdx].compare("float") != 0)
                    {
                        ARMNN_LOG(warning) << "Model output index: " << outputIdx << " has data type Float32. The " <<
                                           "corresponding --output-type is " << params.m_OutputTypes[outputIdx] <<
                                           ". This may cause unexpected problems or random failures.";
                    }
                    break;
                case armnn::DataType::Float16:
                    if (params.m_OutputTypes[outputIdx].compare("float16") != 0)
                    {
                        ARMNN_LOG(warning) << "Model output index: " << outputIdx << " has data type Float16. The " <<
                                           "corresponding --output-type is " << params.m_OutputTypes[outputIdx] <<
                                           ". This may cause unexpected problems or random failures.";
                    }
                    break;
                case armnn::DataType::QAsymmU8:
                    if (params.m_OutputTypes[outputIdx].compare("qasymmu8") != 0)
                    {
                        ARMNN_LOG(warning) << "Model output index: " << outputIdx << " has data type QAsymmU8. The " <<
                                           "corresponding --output-type is " << params.m_OutputTypes[outputIdx] <<
                                           ". This may cause unexpected problems or random failures.";
                    }
                    break;
                case armnn::DataType::Signed32:
                    if (params.m_OutputTypes[outputIdx].compare("int") != 0)
                    {
                        ARMNN_LOG(warning) << "Model output index: " << outputIdx << " has data type Signed32. The " <<
                                           "corresponding --output-type is " << params.m_OutputTypes[outputIdx] <<
                                           ". This may cause unexpected problems or random failures.";
                    }
                    break;
                case armnn::DataType::QAsymmS8:
                    if (params.m_OutputTypes[outputIdx].compare("qasymms8") != 0)
                    {
                        ARMNN_LOG(warning) << "Model output index: " << outputIdx << " has data type QAsymmS8. The " <<
                                           "corresponding --output-type is " << params.m_OutputTypes[outputIdx] <<
                                           ". This may cause unexpected problems or random failures.";
                    }
                    break;
                default:
                    break;
            }
        }
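        // Pre-allocate one result container per output per iteration; each container is
        // sized from the model's reported output size and typed from --output-type.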
        for (unsigned int j = 0; j < params.m_Iterations; ++j)
        {
            std::vector<armnnUtils::TContainer> outputDataContainers;
            for (unsigned int i = 0; i < numOutputs; ++i)
            {
                if (params.m_OutputTypes[i].compare("float") == 0)
                {
                    outputDataContainers.push_back(std::vector<float>(model.GetOutputSize(i)));
                }
                else if (params.m_OutputTypes[i].compare("float16") == 0)
                {
                    outputDataContainers.push_back(std::vector<armnn::Half>(model.GetOutputSize(i)));
                }
                else if (params.m_OutputTypes[i].compare("int") == 0)
                {
                    outputDataContainers.push_back(std::vector<int>(model.GetOutputSize(i)));
                }
                else if (params.m_OutputTypes[i].compare("qasymm8") == 0 ||
                         params.m_OutputTypes[i].compare("qasymmu8") == 0)
                {
                    outputDataContainers.push_back(std::vector<uint8_t>(model.GetOutputSize(i)));
                }
                else if (params.m_OutputTypes[i].compare("qasymms8") == 0)
                {
                    outputDataContainers.push_back(std::vector<int8_t>(model.GetOutputSize(i)));
                }
                else
                {
                    ARMNN_LOG(fatal) << "Unsupported tensor data type \"" << params.m_OutputTypes[i] << "\". ";
                    return EXIT_FAILURE;
                }
            }
            outputs.push_back(outputDataContainers);
        }

        if (params.m_Iterations > 1)
        {
            std::stringstream msg;
            msg << "Network will be executed " << params.m_Iterations;
            if (params.m_Concurrent)
            {
                msg << " times in an asynchronous manner. ";
            }
            else
            {
                msg << " times successively. ";
            }
            msg << "The input-tensor-data files will be reused from the beginning if the user didn't provide "
                   "enough to cover each execution.";
            ARMNN_LOG(info) << msg.str();
        }

        // Synchronous execution
        if (!params.m_Concurrent)
        {
            for (size_t x = 0; x < params.m_Iterations; x++)
            {
                // model.Run returns the inference time elapsed in EnqueueWorkload (in milliseconds)
                auto inference_duration = model.Run(inputs[x], outputs[x]);

                if (params.m_GenerateTensorData)
                {
                    ARMNN_LOG(warning) << "The input data was generated, note that the output will not be useful";
                }
                if (params.m_DontPrintOutputs)
                {
                    ARMNN_LOG(info) << "Printing outputs to console is disabled.";
                }

                // Print output tensors
                const auto& infosOut = model.GetOutputBindingInfos();
                for (size_t i = 0; i < numOutputs; i++)
                {
                    const armnn::TensorInfo& infoOut = infosOut[i].second;

                    // We've made sure before that the number of output files either equals numOutputs, in which
                    // case we override those files when processing the results of each iteration (only the result
                    // of the last iteration will be stored), or there are enough output files for each output of
                    // each iteration.
                    size_t outputFileIndex = x * numOutputs + i;
                    if (!params.m_OutputTensorFiles.empty())
                    {
                        outputFileIndex = outputFileIndex % params.m_OutputTensorFiles.size();
                        ARMNN_LOG(info) << "Writing output " << i << " named: '"
                                        << inferenceModelParams.m_OutputBindings[i]
                                        << "' of iteration: " << x+1 << " to file: '"
                                        << params.m_OutputTensorFiles[outputFileIndex] << "'";
                    }
                    auto outputTensorFile = params.m_OutputTensorFiles.empty()
                                            ? ""
                                            : params.m_OutputTensorFiles[outputFileIndex];

                    TensorPrinter printer(inferenceModelParams.m_OutputBindings[i],
                                          infoOut,
                                          outputTensorFile,
                                          params.m_DequantizeOutput,
                                          !params.m_DontPrintOutputs);
                    mapbox::util::apply_visitor(printer, outputs[x][i]);
                }

                ARMNN_LOG(info) << "\nInference time: " << std::setprecision(2)
                                << std::fixed << inference_duration.count() << " ms\n";

                // If thresholdTime == 0.0 (default), then it hasn't been supplied at command line
                if (params.m_ThresholdTime != 0.0)
                {
                    ARMNN_LOG(info) << "Threshold time: " << std::setprecision(2)
                                    << std::fixed << params.m_ThresholdTime << " ms";
                    auto thresholdMinusInference = params.m_ThresholdTime - inference_duration.count();
                    ARMNN_LOG(info) << "Threshold time - Inference time: " << std::setprecision(2)
                                    << std::fixed << thresholdMinusInference << " ms" << "\n";

                    if (thresholdMinusInference < 0)
                    {
                        std::string errorMessage = "Elapsed inference time is greater than provided threshold time.";
                        ARMNN_LOG(fatal) << errorMessage;
                    }
                }
            }
        }
        // Asynchronous execution using the Arm NN thread pool
        else if (params.m_ThreadPoolSize >= 1)
        {
            try
            {
                ARMNN_LOG(info) << "Asynchronous execution with Arm NN thread pool... \n";
                armnn::AsyncCallbackManager callbackManager;
                std::unordered_map<armnn::InferenceId, std::vector<armnnUtils::TContainer>&> inferenceOutputMap;

                // Declare the latest and earliest inference times here to be used when calculating overall time
                std::chrono::high_resolution_clock::time_point earliestStartTime;
                std::chrono::high_resolution_clock::time_point latestEndTime =
                    std::chrono::high_resolution_clock::now();

                // For the asynchronous execution, we are adding a pool of working memory handles (1 per thread) in the
                // LoadedNetwork with each scheduled inference having a specific priority
                for (size_t i = 0; i < params.m_Iterations; ++i)
                {
                    std::shared_ptr<armnn::AsyncExecutionCallback> cb = callbackManager.GetNewCallback();
                    inferenceOutputMap.insert({cb->GetInferenceId(), outputs[i]});
                    model.RunAsync(inputs[i], outputs[i], cb);
                }

                // Check the results
                unsigned int j = 0;
                for (size_t iteration = 0; iteration < params.m_Iterations; ++iteration)
                {
                    auto cb = callbackManager.GetNotifiedCallback();

                    // Get the results
                    auto endTime = time_point_cast<std::chrono::milliseconds>(cb->GetEndTime());
                    auto startTime = time_point_cast<std::chrono::milliseconds>(cb->GetStartTime());
                    auto inferenceDuration = endTime - startTime;

                    if (latestEndTime < cb->GetEndTime())
                    {
                        latestEndTime = cb->GetEndTime();
                    }

                    if (earliestStartTime.time_since_epoch().count() == 0)
                    {
                        earliestStartTime = cb->GetStartTime();
                    }
                    else if (earliestStartTime > cb->GetStartTime())
                    {
                        earliestStartTime = cb->GetStartTime();
                    }

                    if (params.m_GenerateTensorData)
                    {
                        ARMNN_LOG(warning) << "The input data was generated, note that the output will not be useful";
                    }
                    if (params.m_DontPrintOutputs)
                    {
                        ARMNN_LOG(info) << "Printing outputs to console is disabled.";
                    }

                    // Print output tensors
                    const auto& infosOut = model.GetOutputBindingInfos();
                    for (size_t i = 0; i < numOutputs; i++)
                    {
                        // We've made sure before that the number of output files either equals numOutputs, in which
                        // case we override those files when processing the results of each iteration (only the
                        // result of the last iteration will be stored), or there are enough output files for each
                        // output of each iteration.
                        size_t outputFileIndex = iteration * numOutputs + i;
                        if (!params.m_OutputTensorFiles.empty())
                        {
                            outputFileIndex = outputFileIndex % params.m_OutputTensorFiles.size();
                            ARMNN_LOG(info) << "Writing output " << i << " named: '"
                                            << inferenceModelParams.m_OutputBindings[i]
                                            << "' of iteration: " << iteration+1 << " to file: '"
                                            << params.m_OutputTensorFiles[outputFileIndex] << "'";
                        }

                        const armnn::TensorInfo& infoOut = infosOut[i].second;
                        auto outputTensorFile = params.m_OutputTensorFiles.empty()
                                                ? ""
                                                : params.m_OutputTensorFiles[outputFileIndex];

                        TensorPrinter printer(inferenceModelParams.m_OutputBindings[i],
                                              infoOut,
                                              outputTensorFile,
                                              params.m_DequantizeOutput,
                                              !params.m_DontPrintOutputs);
                        mapbox::util::apply_visitor(printer, inferenceOutputMap.at(cb->GetInferenceId())[i]);
                    }

                    CheckInferenceTimeThreshold(inferenceDuration, params.m_ThresholdTime);
                    ++j;
                }
                // Print the duration difference between overallStartTime and overallEndTime
                auto overallEndTime = time_point_cast<std::chrono::milliseconds>(latestEndTime);
                auto overallStartTime = time_point_cast<std::chrono::milliseconds>(earliestStartTime);
                auto totalInferenceDuration = overallEndTime - overallStartTime;
                ARMNN_LOG(info) << "\nOverall Inference time: " << std::setprecision(2)
                                << std::fixed << totalInferenceDuration.count() << " ms\n";
            }
            catch (const armnn::Exception& e)
            {
                ARMNN_LOG(fatal) << "Armnn Error: " << e.what();
                return EXIT_FAILURE;
            }
        }
        // Asynchronous execution using std::launch::async
        else
        {
            try
            {
                ARMNN_LOG(info) << "Asynchronous Execution with std::launch::async... \n";
                std::vector<std::future<std::tuple<unsigned int,
                                                   std::chrono::duration<double, std::milli>>>> inferenceResults;
                inferenceResults.reserve(params.m_Iterations);

                // Create WorkingMemHandles for each inference
                std::vector<std::unique_ptr<armnn::experimental::IWorkingMemHandle>> workingMemHandles;
                workingMemHandles.reserve(params.m_Iterations);
                for (unsigned int i = 0; i < params.m_Iterations; ++i)
                {
                    workingMemHandles.push_back(model.CreateWorkingMemHandle());
                }

                // Run each inference in its own thread
                // start a timer
                const auto start_time = armnn::GetTimeNow();
                for (unsigned int i = 0; i < params.m_Iterations; ++i)
                {
                    armnn::experimental::IWorkingMemHandle& workingMemHandleRef = *workingMemHandles[i].get();

                    inferenceResults.push_back(std::async(
                        std::launch::async, [&model, &workingMemHandleRef, &inputs, &outputs, i]() {
                            return model.RunAsync(workingMemHandleRef, inputs[i], outputs[i], i);
                        }
                    ));
                }

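                // Each future's get() blocks until the corresponding inference has
                // finished, so results are collected in scheduling order rather than
                // completion order.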
                // Check the results
                for (unsigned int j = 0; j < inferenceResults.size(); ++j)
                {
                    // Get the results
                    auto inferenceResult = inferenceResults[j].get();
                    auto inferenceDuration = std::get<1>(inferenceResult);
                    auto inferenceID = std::get<0>(inferenceResult);

                    if (params.m_GenerateTensorData)
                    {
                        ARMNN_LOG(warning) << "The input data was generated, note that the output will not be useful";
                    }
                    if (params.m_DontPrintOutputs)
                    {
                        ARMNN_LOG(info) << "Printing outputs to console is disabled.";
                    }

                    // Print output tensors
                    const auto& infosOut = model.GetOutputBindingInfos();
                    for (size_t i = 0; i < numOutputs; i++)
                    {
                        // We've made sure before that the number of output files either equals numOutputs, in which
                        // case we override those files when processing the results of each iteration (only the
                        // result of the last iteration will be stored), or there are enough output files for each
                        // output of each iteration.
                        size_t outputFileIndex = j * numOutputs + i;
                        if (!params.m_OutputTensorFiles.empty())
                        {
                            outputFileIndex = outputFileIndex % params.m_OutputTensorFiles.size();
                            ARMNN_LOG(info) << "Writing output " << i << " named: '"
                                            << inferenceModelParams.m_OutputBindings[i]
                                            << "' of iteration: " << j+1 << " to file: '"
                                            << params.m_OutputTensorFiles[outputFileIndex] << "'";
                        }
                        const armnn::TensorInfo& infoOut = infosOut[i].second;
                        auto outputTensorFile = params.m_OutputTensorFiles.empty()
                                                ? ""
                                                : params.m_OutputTensorFiles[outputFileIndex];

                        TensorPrinter printer(inferenceModelParams.m_OutputBindings[i],
                                              infoOut,
                                              outputTensorFile,
                                              params.m_DequantizeOutput,
                                              !params.m_DontPrintOutputs);
                        mapbox::util::apply_visitor(printer, outputs[j][i]);
                    }
                    CheckInferenceTimeThreshold(inferenceDuration, params.m_ThresholdTime);
                    ARMNN_LOG(info) << "Asynchronous Execution is finished for Inference ID: " << inferenceID << " \n";
                }
                // Finish the timer
                const auto duration = armnn::GetTimeDuration(start_time);
                ARMNN_LOG(info) << "\nOverall Inference time: " << std::setprecision(2)
                                << std::fixed << duration.count() << " ms\n";
            }
            catch (const armnn::Exception& e)
            {
                ARMNN_LOG(fatal) << "Armnn Error: " << e.what();
                return EXIT_FAILURE;
            }
        }
    }
    catch (const armnn::Exception& e)
    {
        ARMNN_LOG(fatal) << "Armnn Error: " << e.what();
        return EXIT_FAILURE;
    }

    return EXIT_SUCCESS;
}

// MAIN
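// main() configures logging, parses the command line, creates a single IRuntime and
// dispatches on the model format to the matching implementation above.
// Illustrative invocation (the exact flag names are defined in
// ExecuteNetworkProgramOptions.hpp, so treat these as assumptions):
//   ExecuteNetwork -m model.tflite -c CpuAcc -i input_name -o output_name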
int main(int argc, const char* argv[])
{
    // Configures logging for both the ARMNN library and this test program.
    #ifdef NDEBUG
    armnn::LogSeverity level = armnn::LogSeverity::Info;
    #else
    armnn::LogSeverity level = armnn::LogSeverity::Debug;
    #endif
    armnn::ConfigureLogging(true, true, level);

    // Get ExecuteNetwork parameters and runtime options from command line
    // This might throw an InvalidArgumentException if the user provided invalid inputs
    ProgramOptions ProgramOptions;
    try {
        ProgramOptions.ParseOptions(argc, argv);
    } catch (const std::exception &e){
        ARMNN_LOG(fatal) << e.what();
        return EXIT_FAILURE;
    }

    if ((ProgramOptions.m_ExNetParams.m_OutputDetailsToStdOut ||
         ProgramOptions.m_ExNetParams.m_OutputDetailsOnlyToStdOut)
        && !ProgramOptions.m_ExNetParams.m_EnableProfiling)
    {
        ARMNN_LOG(fatal) << "You must enable profiling if you would like to output layer details";
        return EXIT_FAILURE;
    }

    // Create runtime
    std::shared_ptr<armnn::IRuntime> runtime(armnn::IRuntime::Create(ProgramOptions.m_RuntimeOptions));

    std::string modelFormat = ProgramOptions.m_ExNetParams.m_ModelFormat;

    // Forward to implementation based on the parser type
    if (modelFormat.find("armnn") != std::string::npos)
    {
    #if defined(ARMNN_SERIALIZER)
        return MainImpl<armnnDeserializer::IDeserializer, float>(ProgramOptions.m_ExNetParams, runtime);
    #else
        ARMNN_LOG(fatal) << "Not built with serialization support.";
        return EXIT_FAILURE;
    #endif
    }
    else if (modelFormat.find("onnx") != std::string::npos)
    {
    #if defined(ARMNN_ONNX_PARSER)
        return MainImpl<armnnOnnxParser::IOnnxParser, float>(ProgramOptions.m_ExNetParams, runtime);
    #else
        ARMNN_LOG(fatal) << "Not built with Onnx parser support.";
        return EXIT_FAILURE;
    #endif
    }
    else if (modelFormat.find("tflite") != std::string::npos)
    {
        if (ProgramOptions.m_ExNetParams.m_TfLiteExecutor == ExecuteNetworkParams::TfLiteExecutor::ArmNNTfLiteParser)
        {
        #if defined(ARMNN_TF_LITE_PARSER)
            return MainImpl<armnnTfLiteParser::ITfLiteParser, float>(ProgramOptions.m_ExNetParams, runtime);
        #else
            ARMNN_LOG(fatal) << "Not built with Tensorflow-Lite parser support.";
            return EXIT_FAILURE;
        #endif
        }
        else if (ProgramOptions.m_ExNetParams.m_TfLiteExecutor ==
                     ExecuteNetworkParams::TfLiteExecutor::ArmNNTfLiteDelegate ||
                 ProgramOptions.m_ExNetParams.m_TfLiteExecutor ==
                     ExecuteNetworkParams::TfLiteExecutor::TfliteInterpreter)
        {
        #if defined(ARMNN_TF_LITE_DELEGATE)
            return TfLiteDelegateMainImpl(ProgramOptions.m_ExNetParams, ProgramOptions.m_RuntimeOptions);
        #else
            ARMNN_LOG(fatal) << "Not built with Arm NN Tensorflow-Lite delegate support.";
            return EXIT_FAILURE;
        #endif
        }
    }
    else
    {
        ARMNN_LOG(fatal) << "Unknown model format: '" << modelFormat
                         << "'. Please include 'armnn', 'tflite' or 'onnx'";
        return EXIT_FAILURE;
    }
}