//
// Copyright © 2017 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//

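//
// ExecuteNetwork: loads a network from file and runs one or more inferences on
// it, either through one of the Arm NN parsers / the deserializer or through
// the TfLite interpreter (optionally accelerated by the Arm NN TfLite
// delegate), printing or saving the output tensors and timing each run.
//
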
#include "NetworkExecutionUtils/NetworkExecutionUtils.hpp"
#include "ExecuteNetworkProgramOptions.hpp"
#include <armnn/IAsyncExecutionCallback.hpp>
#include <AsyncExecutionCallback.hpp>

#include <armnn/Logging.hpp>
#include <armnnUtils/Filesystem.hpp>
#include <armnnUtils/TContainer.hpp>
#include <InferenceTest.hpp>

#if defined(ARMNN_SERIALIZER)
#include "armnnDeserializer/IDeserializer.hpp"
#endif
#if defined(ARMNN_TF_LITE_PARSER)
#include "armnnTfLiteParser/ITfLiteParser.hpp"
#endif
#if defined(ARMNN_ONNX_PARSER)
#include "armnnOnnxParser/IOnnxParser.hpp"
#endif
#if defined(ARMNN_TFLITE_DELEGATE)
#include <armnn_delegate.hpp>
#include <DelegateOptions.hpp>

#include <tensorflow/lite/builtin_ops.h>
#include <tensorflow/lite/c/builtin_op_data.h>
#include <tensorflow/lite/c/common.h>
#include <tensorflow/lite/optional_debug_tools.h>
#include <tensorflow/lite/kernels/builtin_op_kernels.h>
#include <tensorflow/lite/interpreter.h>
#include <tensorflow/lite/kernels/register.h>
#endif

#include <future>

/**
 * Given a measured duration and a threshold time, tell the user whether the inference succeeded or not.
 *
 * @param duration the measured inference duration.
 * @param thresholdTime the threshold time in milliseconds.
 * @return false if the measured time exceeded the threshold.
 */
bool CheckInferenceTimeThreshold(const std::chrono::duration<double, std::milli>& duration,
                                 const double& thresholdTime)
{
    ARMNN_LOG(info) << "\nInference time: " << std::setprecision(2)
                    << std::fixed << duration.count() << " ms\n";
    // If thresholdTime == 0.0 (default), then it hasn't been supplied at the command line.
    if (thresholdTime != 0.0)
    {
        ARMNN_LOG(info) << "Threshold time: " << std::setprecision(2)
                        << std::fixed << thresholdTime << " ms";
        auto thresholdMinusInference = thresholdTime - duration.count();
        ARMNN_LOG(info) << "Threshold time - Inference time: " << std::setprecision(2)
                        << std::fixed << thresholdMinusInference << " ms" << "\n";
        if (thresholdMinusInference < 0)
        {
            std::string errorMessage = "Elapsed inference time is greater than provided threshold time.";
            ARMNN_LOG(fatal) << errorMessage;
            return false;
        }
    }
    return true;
}

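// Runs the network through the stock TfLite interpreter, optionally handing the
// graph to the Arm NN TfLite delegate first so that supported operators execute
// through Arm NN backends.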
#if defined(ARMNN_TFLITE_DELEGATE)
int TfLiteDelegateMainImpl(const ExecuteNetworkParams& params, const armnn::IRuntime::CreationOptions runtimeOptions)
{
    using namespace tflite;

    std::unique_ptr<tflite::FlatBufferModel> model = tflite::FlatBufferModel::BuildFromFile(params.m_ModelPath.c_str());
    if (model == nullptr)
    {
        // BuildFromFile returns nullptr on failure; guard against a bad model path.
        ARMNN_LOG(fatal) << "Failed to load model from file: " << params.m_ModelPath;
        return EXIT_FAILURE;
    }

    auto tfLiteInterpreter = std::make_unique<Interpreter>();
    tflite::ops::builtin::BuiltinOpResolver resolver;

    tflite::InterpreterBuilder builder(*model, resolver);
    builder(&tfLiteInterpreter);
    tfLiteInterpreter->AllocateTensors();

    int status = 0;
    if (params.m_TfLiteExecutor == ExecuteNetworkParams::TfLiteExecutor::ArmNNTfLiteDelegate)
    {
        // Create the Arm NN delegate, populating its DelegateOptions from the ExecuteNetworkParams.
        armnnDelegate::DelegateOptions delegateOptions = params.ToDelegateOptions();
        delegateOptions.SetExternalProfilingParams(runtimeOptions.m_ProfilingOptions);

        std::unique_ptr<TfLiteDelegate, decltype(&armnnDelegate::TfLiteArmnnDelegateDelete)>
            theArmnnDelegate(armnnDelegate::TfLiteArmnnDelegateCreate(delegateOptions),
                             armnnDelegate::TfLiteArmnnDelegateDelete);
        // Register the Arm NN delegate with the TfLite interpreter.
        status = tfLiteInterpreter->ModifyGraphWithDelegate(std::move(theArmnnDelegate));
        if (status == kTfLiteError)
        {
            ARMNN_LOG(fatal) << "Could not register ArmNN TfLite Delegate to TfLiteInterpreter!";
            return EXIT_FAILURE;
        }
    }
    else
    {
        std::cout << "Running on TfLite without ArmNN delegate\n";
    }

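    // Populate each input tensor, either with values parsed from the supplied
    // data file or with generated data, converted according to the
    // user-specified input type.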
    armnn::Optional<std::string> dataFile = params.m_GenerateTensorData
                                            ? armnn::EmptyOptional()
                                            : armnn::MakeOptional<std::string>(params.m_InputTensorDataFilePaths[0]);

    const size_t numInputs = params.m_InputNames.size();

    for (unsigned int inputIndex = 0; inputIndex < numInputs; ++inputIndex)
    {
        int input = tfLiteInterpreter->inputs()[inputIndex];
        TfLiteIntArray* inputDims = tfLiteInterpreter->tensor(input)->dims;

        unsigned int inputSize = 1;
        if (params.m_InputTensorShapes.size() > 0)
        {
            inputSize = params.m_InputTensorShapes[inputIndex]->GetNumElements();
        }
        else
        {
            for (unsigned int dim = 0; dim < static_cast<unsigned int>(inputDims->size); ++dim)
            {
                inputSize *= inputDims->data[dim];
            }
        }

        if (params.m_InputTypes[inputIndex].compare("float") == 0)
        {
            auto inputData = tfLiteInterpreter->typed_tensor<float>(input);

            if (inputData == nullptr)
            {
                ARMNN_LOG(fatal) << "Input tensor is null, input type: "
                                    "\"" << params.m_InputTypes[inputIndex] << "\" may be incorrect.";
                return EXIT_FAILURE;
            }

            std::vector<float> tensorData;
            PopulateTensorWithDataGeneric<float>(tensorData,
                                                 inputSize,
                                                 dataFile,
                                                 [](const std::string& s)
                                                 { return std::stof(s); });

            std::copy(tensorData.begin(), tensorData.end(), inputData);
        }
        else if (params.m_InputTypes[inputIndex].compare("qsymms8") == 0 ||
                 params.m_InputTypes[inputIndex].compare("qasymms8") == 0)
        {
            auto inputData = tfLiteInterpreter->typed_tensor<int8_t>(input);

            if (inputData == nullptr)
            {
                ARMNN_LOG(fatal) << "Input tensor is null, input type: "
                                    "\"" << params.m_InputTypes[inputIndex] << "\" may be incorrect.";
                return EXIT_FAILURE;
            }

            std::vector<int8_t> tensorData;
            PopulateTensorWithDataGeneric<int8_t>(tensorData,
                                                  inputSize,
                                                  dataFile,
                                                  [](const std::string& s)
                                                  { return armnn::numeric_cast<int8_t>(std::stoi(s)); });

            std::copy(tensorData.begin(), tensorData.end(), inputData);
        }
        else if (params.m_InputTypes[inputIndex].compare("int") == 0)
        {
            auto inputData = tfLiteInterpreter->typed_tensor<int32_t>(input);

            if (inputData == nullptr)
            {
                ARMNN_LOG(fatal) << "Input tensor is null, input type: "
                                    "\"" << params.m_InputTypes[inputIndex] << "\" may be incorrect.";
                return EXIT_FAILURE;
            }

            std::vector<int32_t> tensorData;
            PopulateTensorWithDataGeneric<int32_t>(tensorData,
                                                   inputSize,
                                                   dataFile,
                                                   [](const std::string& s)
                                                   { return std::stoi(s); });

            std::copy(tensorData.begin(), tensorData.end(), inputData);
        }
        else if (params.m_InputTypes[inputIndex].compare("qasymm8") == 0 ||
                 params.m_InputTypes[inputIndex].compare("qasymmu8") == 0)
        {
            auto inputData = tfLiteInterpreter->typed_tensor<uint8_t>(input);

            if (inputData == nullptr)
            {
                ARMNN_LOG(fatal) << "Input tensor is null, input type: "
                                    "\"" << params.m_InputTypes[inputIndex] << "\" may be incorrect.";
                return EXIT_FAILURE;
            }

            std::vector<uint8_t> tensorData;
            PopulateTensorWithDataGeneric<uint8_t>(tensorData,
                                                   inputSize,
                                                   dataFile,
                                                   [](const std::string& s)
                                                   { return armnn::numeric_cast<uint8_t>(std::stoi(s)); });

            std::copy(tensorData.begin(), tensorData.end(), inputData);
        }
        else
        {
            ARMNN_LOG(fatal) << "Unsupported input tensor data type \"" << params.m_InputTypes[inputIndex] << "\". ";
            return EXIT_FAILURE;
        }
    }

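    // Run the requested number of inferences, timing each one and writing every
    // output tensor either to stdout or to the user-supplied output file.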
    for (size_t x = 0; x < params.m_Iterations; x++)
    {
        // Start timer to record inference time in milliseconds.
        const auto start_time = armnn::GetTimeNow();
        // Run the inference.
        status = tfLiteInterpreter->Invoke();
        const auto duration = armnn::GetTimeDuration(start_time);

        // Print out the output.
        for (unsigned int outputIndex = 0; outputIndex < params.m_OutputNames.size(); ++outputIndex)
        {
            auto tfLiteDelegateOutputId = tfLiteInterpreter->outputs()[outputIndex];
            TfLiteIntArray* outputDims = tfLiteInterpreter->tensor(tfLiteDelegateOutputId)->dims;
            // If we've been asked to write to a file then set a file output stream. Otherwise use stdout.
            FILE* outputTensorFile = stdout;
            if (!params.m_OutputTensorFiles.empty())
            {
                outputTensorFile = fopen(params.m_OutputTensorFiles[outputIndex].c_str(), "w");
                if (outputTensorFile == nullptr)
                {
                    ARMNN_LOG(fatal) << "Specified output tensor file, \"" <<
                                     params.m_OutputTensorFiles[outputIndex] <<
                                     "\", cannot be created. Defaulting to stdout. " <<
                                     "Error was: " << std::strerror(errno);
                    outputTensorFile = stdout;
                }
                else
                {
                    ARMNN_LOG(info) << "Writing output " << outputIndex << " of iteration: " << x+1 << " to file: '"
                                    << params.m_OutputTensorFiles[outputIndex] << "'";
                }
            }
            long outputSize = 1;
            for (unsigned int dim = 0; dim < static_cast<unsigned int>(outputDims->size); ++dim)
            {
                outputSize *= outputDims->data[dim];
            }

279 if (params.m_OutputTypes[outputIndex].compare("float") == 0)
280 {
281 auto tfLiteDelageOutputData = tfLiteInterpreter->typed_tensor<float>(tfLiteDelegateOutputId);
Sadik Armagan5d03e312020-11-17 16:43:56 +0000282 if(tfLiteDelageOutputData == NULL)
283 {
284 ARMNN_LOG(fatal) << "Output tensor is null, output type: "
285 "\"" << params.m_OutputTypes[outputIndex] << "\" may be incorrect.";
286 return EXIT_FAILURE;
287 }
288
Jan Eilers284b5d12021-09-07 12:46:15 +0100289 if (!params.m_DontPrintOutputs)
Sadik Armagan5d03e312020-11-17 16:43:56 +0000290 {
Jan Eilers284b5d12021-09-07 12:46:15 +0100291 for (int i = 0; i < outputSize; ++i)
292 {
Colm Donelan3cff15a2021-10-12 15:06:19 +0100293 fprintf(outputTensorFile, "%f ", tfLiteDelageOutputData[i]);
Jan Eilers284b5d12021-09-07 12:46:15 +0100294 }
Sadik Armagan5d03e312020-11-17 16:43:56 +0000295 }
296 }
297 else if (params.m_OutputTypes[outputIndex].compare("int") == 0)
298 {
299 auto tfLiteDelageOutputData = tfLiteInterpreter->typed_tensor<int32_t>(tfLiteDelegateOutputId);
Sadik Armagan5d03e312020-11-17 16:43:56 +0000300 if(tfLiteDelageOutputData == NULL)
301 {
302 ARMNN_LOG(fatal) << "Output tensor is null, output type: "
303 "\"" << params.m_OutputTypes[outputIndex] << "\" may be incorrect.";
304 return EXIT_FAILURE;
305 }
306
Jan Eilers284b5d12021-09-07 12:46:15 +0100307 if (!params.m_DontPrintOutputs)
Sadik Armagan5d03e312020-11-17 16:43:56 +0000308 {
Jan Eilers284b5d12021-09-07 12:46:15 +0100309 for (int i = 0; i < outputSize; ++i)
310 {
Colm Donelan3cff15a2021-10-12 15:06:19 +0100311 fprintf(outputTensorFile, "%d ", tfLiteDelageOutputData[i]);
Jan Eilers284b5d12021-09-07 12:46:15 +0100312 }
Sadik Armagan5d03e312020-11-17 16:43:56 +0000313 }
314 }
Finn Williamsf806c4d2021-02-22 15:13:12 +0000315 else if (params.m_OutputTypes[outputIndex].compare("qsymms8") == 0)
Finn Williams56870182020-11-20 13:57:53 +0000316 {
317 auto tfLiteDelageOutputData = tfLiteInterpreter->typed_tensor<int8_t>(tfLiteDelegateOutputId);
318 if(tfLiteDelageOutputData == NULL)
319 {
320 ARMNN_LOG(fatal) << "Output tensor is null, output type: "
321 "\"" << params.m_OutputTypes[outputIndex] << "\" may be incorrect.";
322 return EXIT_FAILURE;
323 }
324
Jan Eilers284b5d12021-09-07 12:46:15 +0100325 if (!params.m_DontPrintOutputs)
Finn Williams56870182020-11-20 13:57:53 +0000326 {
Jan Eilers284b5d12021-09-07 12:46:15 +0100327 for (int i = 0; i < outputSize; ++i)
328 {
Colm Donelan3cff15a2021-10-12 15:06:19 +0100329 fprintf(outputTensorFile, "%d ", tfLiteDelageOutputData[i]);
Jan Eilers284b5d12021-09-07 12:46:15 +0100330 }
Finn Williams56870182020-11-20 13:57:53 +0000331 }
332 }
Mike Kellyd7ed6d42021-07-21 09:42:43 +0100333 else if (params.m_OutputTypes[outputIndex].compare("qasymm8") == 0 ||
334 params.m_OutputTypes[outputIndex].compare("qasymmu8") == 0)
Sadik Armagan5d03e312020-11-17 16:43:56 +0000335 {
336 auto tfLiteDelageOutputData = tfLiteInterpreter->typed_tensor<uint8_t>(tfLiteDelegateOutputId);
Sadik Armagan5d03e312020-11-17 16:43:56 +0000337 if(tfLiteDelageOutputData == NULL)
338 {
339 ARMNN_LOG(fatal) << "Output tensor is null, output type: "
340 "\"" << params.m_OutputTypes[outputIndex] << "\" may be incorrect.";
341 return EXIT_FAILURE;
342 }
343
Jan Eilers284b5d12021-09-07 12:46:15 +0100344 if (!params.m_DontPrintOutputs)
Sadik Armagan5d03e312020-11-17 16:43:56 +0000345 {
Jan Eilers284b5d12021-09-07 12:46:15 +0100346 for (int i = 0; i < outputSize; ++i)
347 {
Colm Donelan3cff15a2021-10-12 15:06:19 +0100348 fprintf(outputTensorFile, "%u ", tfLiteDelageOutputData[i]);
Jan Eilers284b5d12021-09-07 12:46:15 +0100349 }
Sadik Armagan5d03e312020-11-17 16:43:56 +0000350 }
351 }
352 else
353 {
354 ARMNN_LOG(fatal) << "Output tensor is null, output type: "
355 "\"" << params.m_OutputTypes[outputIndex] <<
356 "\" may be incorrect. Output type can be specified with -z argument";
357 return EXIT_FAILURE;
358 }
            std::cout << std::endl;
            // Close the file stream if we opened one for this output.
            if (outputTensorFile != stdout)
            {
                fclose(outputTensorFile);
            }
        }
        CheckInferenceTimeThreshold(duration, params.m_ThresholdTime);
    }

    return status;
}
#endif
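
// Runs the network through an InferenceModel built from one of the Arm NN
// parsers or the deserializer. Depending on the supplied parameters the
// inferences run synchronously, asynchronously on the Arm NN thread pool, or
// asynchronously via std::launch::async.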
template<typename TParser, typename TDataType>
int MainImpl(const ExecuteNetworkParams& params,
             const std::shared_ptr<armnn::IRuntime>& runtime = nullptr)
{
    using namespace std::chrono;

    std::vector<std::vector<armnnUtils::TContainer>> inputs;
    std::vector<std::vector<armnnUtils::TContainer>> outputs;

    try
    {
        // Creates an InferenceModel, which will parse the model and load it into an IRuntime.
        typename InferenceModel<TParser, TDataType>::Params inferenceModelParams;
        inferenceModelParams.m_ModelPath = params.m_ModelPath;
        inferenceModelParams.m_IsModelBinary = params.m_IsModelBinary;
        inferenceModelParams.m_ComputeDevices = params.m_ComputeDevices;
        inferenceModelParams.m_DynamicBackendsPath = params.m_DynamicBackendsPath;
        inferenceModelParams.m_PrintIntermediateLayers = params.m_PrintIntermediate;
        inferenceModelParams.m_VisualizePostOptimizationModel = params.m_EnableLayerDetails;
        inferenceModelParams.m_ParseUnsupported = params.m_ParseUnsupported;
        inferenceModelParams.m_InferOutputShape = params.m_InferOutputShape;
        inferenceModelParams.m_EnableFastMath = params.m_EnableFastMath;
        inferenceModelParams.m_SaveCachedNetwork = params.m_SaveCachedNetwork;
        inferenceModelParams.m_CachedNetworkFilePath = params.m_CachedNetworkFilePath;
        inferenceModelParams.m_NumberOfThreads = params.m_NumberOfThreads;
        inferenceModelParams.m_MLGOTuningFilePath = params.m_MLGOTuningFilePath;
        inferenceModelParams.m_AsyncEnabled = params.m_Concurrent;
        inferenceModelParams.m_ThreadPoolSize = params.m_ThreadPoolSize;
        inferenceModelParams.m_OutputDetailsToStdOut = params.m_OutputDetailsToStdOut;
        inferenceModelParams.m_OutputDetailsOnlyToStdOut = params.m_OutputDetailsOnlyToStdOut;

        for (const std::string& inputName: params.m_InputNames)
        {
            inferenceModelParams.m_InputBindings.push_back(inputName);
        }

        for (unsigned int i = 0; i < params.m_InputTensorShapes.size(); ++i)
        {
            inferenceModelParams.m_InputShapes.push_back(*params.m_InputTensorShapes[i]);
        }

        for (const std::string& outputName: params.m_OutputNames)
        {
            inferenceModelParams.m_OutputBindings.push_back(outputName);
        }

        inferenceModelParams.m_SubgraphId = params.m_SubgraphId;
        inferenceModelParams.m_EnableFp16TurboMode = params.m_EnableFp16TurboMode;
        inferenceModelParams.m_EnableBf16TurboMode = params.m_EnableBf16TurboMode;

        InferenceModel<TParser, TDataType> model(inferenceModelParams,
                                                 params.m_EnableProfiling,
                                                 params.m_DynamicBackendsPath,
                                                 runtime);

        const size_t numInputs = inferenceModelParams.m_InputBindings.size();

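        // Quantization parameters are only needed when the user has asked for the
        // float input data to be quantized before it is copied into the input tensors.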
        armnn::Optional<QuantizationParams> qParams = params.m_QuantizeInput ?
                                                      armnn::MakeOptional<QuantizationParams>(
                                                          model.GetInputQuantizationParams()) :
                                                      armnn::EmptyOptional();

        if (params.m_InputTensorDataFilePaths.size() > numInputs)
        {
            ARMNN_LOG(info) << "Given network has " << numInputs << " inputs. One input-tensor-data file is "
                            << "required for each input. The user provided "
                            << params.m_InputTensorDataFilePaths.size()
                            << " input-tensor-data files, which will be used to fill the inputs.\n";
        }

        for (unsigned int j = 0; j < params.m_Iterations; ++j)
        {
            std::vector<armnnUtils::TContainer> inputDataContainers;
            for (unsigned int i = 0; i < numInputs; ++i)
            {
                // If there are fewer input files given than required for the execution of
                // params.m_Iterations, we simply start with the first input file again.
                size_t inputFileIndex = j * numInputs + i;
                if (!params.m_InputTensorDataFilePaths.empty())
                {
                    inputFileIndex = inputFileIndex % params.m_InputTensorDataFilePaths.size();
                }

                armnn::Optional<std::string> dataFile = params.m_GenerateTensorData ?
                                                        armnn::EmptyOptional() :
                                                        armnn::MakeOptional<std::string>(
                                                            params.m_InputTensorDataFilePaths.at(inputFileIndex));

                unsigned int numElements = model.GetInputSize(i);
                if (params.m_InputTensorShapes.size() > i && params.m_InputTensorShapes[i])
                {
                    // If the user has provided a tensor shape for the current input,
                    // override numElements.
                    numElements = params.m_InputTensorShapes[i]->GetNumElements();
                }

                armnnUtils::TContainer tensorData;
                PopulateTensorWithData(tensorData,
                                       numElements,
                                       params.m_InputTypes[i],
                                       qParams,
                                       dataFile);

                inputDataContainers.push_back(tensorData);
            }
            inputs.push_back(inputDataContainers);
        }

        const size_t numOutputs = inferenceModelParams.m_OutputBindings.size();

        // The user is allowed to specify the data type of each output tensor. It is used here to construct the
        // result tensors for each iteration. It is possible for the user to specify a type that does not match
        // the data type of the corresponding model output. It may not make sense, but it is historically allowed.
        // The potential problem here is a buffer overrun when a larger data type is written into the space for a
        // smaller one. Issue a warning to highlight the potential problem.
        for (unsigned int outputIdx = 0; outputIdx < model.GetOutputBindingInfos().size(); ++outputIdx)
        {
            armnn::DataType type = model.GetOutputBindingInfo(outputIdx).second.GetDataType();
            switch (type)
            {
                // --output-type only supports float, int, qasymms8 or qasymmu8.
                case armnn::DataType::Float32:
                    if (params.m_OutputTypes[outputIdx].compare("float") != 0)
                    {
                        ARMNN_LOG(warning) << "Model output index: " << outputIdx << " has data type Float32. The " <<
                                              "corresponding --output-type is " << params.m_OutputTypes[outputIdx] <<
                                              ". This may cause unexpected problems or random failures.";
                    }
                    break;
                case armnn::DataType::QAsymmU8:
                    if (params.m_OutputTypes[outputIdx].compare("qasymmu8") != 0)
                    {
                        ARMNN_LOG(warning) << "Model output index: " << outputIdx << " has data type QAsymmU8. The " <<
                                              "corresponding --output-type is " << params.m_OutputTypes[outputIdx] <<
                                              ". This may cause unexpected problems or random failures.";
                    }
                    break;
                case armnn::DataType::Signed32:
                    if (params.m_OutputTypes[outputIdx].compare("int") != 0)
                    {
                        ARMNN_LOG(warning) << "Model output index: " << outputIdx << " has data type Signed32. The " <<
                                              "corresponding --output-type is " << params.m_OutputTypes[outputIdx] <<
                                              ". This may cause unexpected problems or random failures.";
                    }
                    break;
                case armnn::DataType::QAsymmS8:
                    if (params.m_OutputTypes[outputIdx].compare("qasymms8") != 0)
                    {
                        ARMNN_LOG(warning) << "Model output index: " << outputIdx << " has data type QAsymmS8. The " <<
                                              "corresponding --output-type is " << params.m_OutputTypes[outputIdx] <<
                                              ". This may cause unexpected problems or random failures.";
                    }
                    break;
                default:
                    break;
            }
        }
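        // Pre-allocate one result container per output per iteration, sized from
        // the model's reported output sizes and typed from the user-specified
        // output type.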
        for (unsigned int j = 0; j < params.m_Iterations; ++j)
        {
            std::vector<armnnUtils::TContainer> outputDataContainers;
            for (unsigned int i = 0; i < numOutputs; ++i)
            {
                if (params.m_OutputTypes[i].compare("float") == 0)
                {
                    outputDataContainers.push_back(std::vector<float>(model.GetOutputSize(i)));
                }
                else if (params.m_OutputTypes[i].compare("int") == 0)
                {
                    outputDataContainers.push_back(std::vector<int>(model.GetOutputSize(i)));
                }
                else if (params.m_OutputTypes[i].compare("qasymm8") == 0 ||
                         params.m_OutputTypes[i].compare("qasymmu8") == 0)
                {
                    outputDataContainers.push_back(std::vector<uint8_t>(model.GetOutputSize(i)));
                }
                else if (params.m_OutputTypes[i].compare("qasymms8") == 0)
                {
                    outputDataContainers.push_back(std::vector<int8_t>(model.GetOutputSize(i)));
                }
                else
                {
                    ARMNN_LOG(fatal) << "Unsupported tensor data type \"" << params.m_OutputTypes[i] << "\". ";
                    return EXIT_FAILURE;
                }
            }
            outputs.push_back(outputDataContainers);
        }

        if (params.m_Iterations > 1)
        {
            std::stringstream msg;
            msg << "Network will be executed " << params.m_Iterations;
            if (params.m_Concurrent)
            {
                msg << " times in an asynchronous manner. ";
            }
            else
            {
                msg << " times successively. ";
            }
            msg << "The input-tensor-data files will be reused cyclically if the user didn't provide enough to "
                   "cover each execution.";
            ARMNN_LOG(info) << msg.str();
        }

        // Synchronous execution
        if (!params.m_Concurrent)
        {
            for (size_t x = 0; x < params.m_Iterations; x++)
            {
                // model.Run returns the inference time elapsed in EnqueueWorkload (in milliseconds).
                auto inference_duration = model.Run(inputs[x], outputs[x]);

                if (params.m_GenerateTensorData)
                {
                    ARMNN_LOG(warning) << "The input data was generated, note that the output will not be useful";
                }
                if (params.m_DontPrintOutputs)
                {
                    ARMNN_LOG(info) << "Printing outputs to console is disabled.";
                }

                // Print output tensors
                const auto& infosOut = model.GetOutputBindingInfos();
                for (size_t i = 0; i < numOutputs; i++)
                {
                    const armnn::TensorInfo& infoOut = infosOut[i].second;

                    // We've made sure before that the number of output files either equals numOutputs, in which
                    // case we overwrite those files when processing the results of each iteration (only the result
                    // of the last iteration will be stored), or that there are enough output files for each output
                    // of each iteration.
                    size_t outputFileIndex = x * numOutputs + i;
                    if (!params.m_OutputTensorFiles.empty())
                    {
                        outputFileIndex = outputFileIndex % params.m_OutputTensorFiles.size();
                        ARMNN_LOG(info) << "Writing output " << i << " named: '"
                                        << inferenceModelParams.m_OutputBindings[i]
                                        << "' of iteration: " << x+1 << " to file: '"
                                        << params.m_OutputTensorFiles[outputFileIndex] << "'";
                    }
                    auto outputTensorFile = params.m_OutputTensorFiles.empty()
                                            ? ""
                                            : params.m_OutputTensorFiles[outputFileIndex];

                    TensorPrinter printer(inferenceModelParams.m_OutputBindings[i],
                                          infoOut,
                                          outputTensorFile,
                                          params.m_DequantizeOutput,
                                          !params.m_DontPrintOutputs);
                    mapbox::util::apply_visitor(printer, outputs[x][i]);
                }

                CheckInferenceTimeThreshold(inference_duration, params.m_ThresholdTime);
            }
        }
        // Asynchronous execution using the Arm NN thread pool
        else if (params.m_ThreadPoolSize >= 1)
        {
            try
            {
                ARMNN_LOG(info) << "Asynchronous execution with Arm NN thread pool... \n";
                armnn::AsyncCallbackManager callbackManager;
                std::unordered_map<armnn::InferenceId, std::vector<armnnUtils::TContainer>&> inferenceOutputMap;

                // Declare the latest and earliest inference times here to be used when calculating overall time.
                std::chrono::high_resolution_clock::time_point earliestStartTime;
                std::chrono::high_resolution_clock::time_point latestEndTime =
                    std::chrono::high_resolution_clock::now();

                // For the asynchronous execution, we are adding a pool of working memory handles (1 per thread) in the
                // LoadedNetwork with each scheduled inference having a specific priority.
                for (size_t i = 0; i < params.m_Iterations; ++i)
                {
                    std::shared_ptr<armnn::AsyncExecutionCallback> cb = callbackManager.GetNewCallback();
                    inferenceOutputMap.insert({cb->GetInferenceId(), outputs[i]});
                    model.RunAsync(inputs[i], outputs[i], cb);
                }

                // Check the results
                for (size_t iteration = 0; iteration < params.m_Iterations; ++iteration)
                {
                    auto cb = callbackManager.GetNotifiedCallback();

                    // Get the results
                    auto endTime = time_point_cast<std::chrono::milliseconds>(cb->GetEndTime());
                    auto startTime = time_point_cast<std::chrono::milliseconds>(cb->GetStartTime());
                    auto inferenceDuration = endTime - startTime;

                    if (latestEndTime < cb->GetEndTime())
                    {
                        latestEndTime = cb->GetEndTime();
                    }

                    if (earliestStartTime.time_since_epoch().count() == 0)
                    {
                        earliestStartTime = cb->GetStartTime();
                    }
                    else if (earliestStartTime > cb->GetStartTime())
                    {
                        earliestStartTime = cb->GetStartTime();
                    }

                    if (params.m_GenerateTensorData)
                    {
                        ARMNN_LOG(warning) << "The input data was generated, note that the output will not be useful";
                    }
                    if (params.m_DontPrintOutputs)
                    {
                        ARMNN_LOG(info) << "Printing outputs to console is disabled.";
                    }

                    // Print output tensors
                    const auto& infosOut = model.GetOutputBindingInfos();
                    for (size_t i = 0; i < numOutputs; i++)
                    {
                        // We've made sure before that the number of output files either equals numOutputs, in which
                        // case we overwrite those files when processing the results of each iteration (only the
                        // result of the last iteration will be stored), or that there are enough output files for
                        // each output of each iteration.
                        size_t outputFileIndex = iteration * numOutputs + i;
                        if (!params.m_OutputTensorFiles.empty())
                        {
                            outputFileIndex = outputFileIndex % params.m_OutputTensorFiles.size();
                            ARMNN_LOG(info) << "Writing output " << i << " named: '"
                                            << inferenceModelParams.m_OutputBindings[i]
                                            << "' of iteration: " << iteration+1 << " to file: '"
                                            << params.m_OutputTensorFiles[outputFileIndex] << "'";
                        }

                        const armnn::TensorInfo& infoOut = infosOut[i].second;
                        auto outputTensorFile = params.m_OutputTensorFiles.empty()
                                                ? ""
                                                : params.m_OutputTensorFiles[outputFileIndex];

                        TensorPrinter printer(inferenceModelParams.m_OutputBindings[i],
                                              infoOut,
                                              outputTensorFile,
                                              params.m_DequantizeOutput,
                                              !params.m_DontPrintOutputs);
                        mapbox::util::apply_visitor(printer, inferenceOutputMap.at(cb->GetInferenceId())[i]);
                    }

                    CheckInferenceTimeThreshold(inferenceDuration, params.m_ThresholdTime);
                }
                // Print the duration difference between overallStartTime and overallEndTime.
                auto overallEndTime = time_point_cast<std::chrono::milliseconds>(latestEndTime);
                auto overallStartTime = time_point_cast<std::chrono::milliseconds>(earliestStartTime);
                auto totalInferenceDuration = overallEndTime - overallStartTime;
                ARMNN_LOG(info) << "\nOverall Inference time: " << std::setprecision(2)
                                << std::fixed << totalInferenceDuration.count() << " ms\n";
            }
            catch (const armnn::Exception& e)
            {
                ARMNN_LOG(fatal) << "Armnn Error: " << e.what();
                return EXIT_FAILURE;
            }
        }
        // Asynchronous execution using std::launch::async
        else
        {
            try
            {
                ARMNN_LOG(info) << "Asynchronous Execution with std::launch::async... \n";
                std::vector<std::future<std::tuple<unsigned int,
                                                   std::chrono::duration<double, std::milli>>>> inferenceResults;
                inferenceResults.reserve(params.m_Iterations);

                // Create WorkingMemHandles for each inference
                std::vector<std::unique_ptr<armnn::experimental::IWorkingMemHandle>> workingMemHandles;
                workingMemHandles.reserve(params.m_Iterations);
                for (unsigned int i = 0; i < params.m_Iterations; ++i)
                {
                    workingMemHandles.push_back(model.CreateWorkingMemHandle());
                }

                // Run each inference in its own thread and start a timer.
                const auto start_time = armnn::GetTimeNow();
                for (unsigned int i = 0; i < params.m_Iterations; ++i)
                {
                    armnn::experimental::IWorkingMemHandle& workingMemHandleRef = *workingMemHandles[i].get();

                    inferenceResults.push_back(std::async(
                        std::launch::async, [&model, &workingMemHandleRef, &inputs, &outputs, i]() {
                            return model.RunAsync(workingMemHandleRef, inputs[i], outputs[i], i);
                        }
                    ));
                }

                // Check the results
                for (unsigned int j = 0; j < inferenceResults.size(); ++j)
                {
                    // Get the results
                    auto inferenceResult = inferenceResults[j].get();
                    auto inferenceDuration = std::get<1>(inferenceResult);
                    auto inferenceID = std::get<0>(inferenceResult);

                    if (params.m_GenerateTensorData)
                    {
                        ARMNN_LOG(warning) << "The input data was generated, note that the output will not be useful";
                    }
                    if (params.m_DontPrintOutputs)
                    {
                        ARMNN_LOG(info) << "Printing outputs to console is disabled.";
                    }

                    // Print output tensors
                    const auto& infosOut = model.GetOutputBindingInfos();
                    for (size_t i = 0; i < numOutputs; i++)
                    {
                        // We've made sure before that the number of output files either equals numOutputs, in which
                        // case we overwrite those files when processing the results of each iteration (only the
                        // result of the last iteration will be stored), or that there are enough output files for
                        // each output of each iteration.
                        size_t outputFileIndex = j * numOutputs + i;
                        if (!params.m_OutputTensorFiles.empty())
                        {
                            outputFileIndex = outputFileIndex % params.m_OutputTensorFiles.size();
                            ARMNN_LOG(info) << "Writing output " << i << " named: '"
                                            << inferenceModelParams.m_OutputBindings[i]
                                            << "' of iteration: " << j+1 << " to file: '"
                                            << params.m_OutputTensorFiles[outputFileIndex] << "'";
                        }
                        const armnn::TensorInfo& infoOut = infosOut[i].second;
                        auto outputTensorFile = params.m_OutputTensorFiles.empty()
                                                ? ""
                                                : params.m_OutputTensorFiles[outputFileIndex];

                        TensorPrinter printer(inferenceModelParams.m_OutputBindings[i],
                                              infoOut,
                                              outputTensorFile,
                                              params.m_DequantizeOutput,
                                              !params.m_DontPrintOutputs);
                        mapbox::util::apply_visitor(printer, outputs[j][i]);
                    }
                    CheckInferenceTimeThreshold(inferenceDuration, params.m_ThresholdTime);
                    ARMNN_LOG(info) << "Asynchronous Execution is finished for Inference ID: " << inferenceID << " \n";
                }
                // Stop the timer and report the overall duration.
                const auto duration = armnn::GetTimeDuration(start_time);
                ARMNN_LOG(info) << "\nOverall Inference time: " << std::setprecision(2)
                                << std::fixed << duration.count() << " ms\n";
            }
            catch (const armnn::Exception& e)
            {
                ARMNN_LOG(fatal) << "Armnn Error: " << e.what();
                return EXIT_FAILURE;
            }
        }
    }
    catch (const armnn::Exception& e)
    {
        ARMNN_LOG(fatal) << "Armnn Error: " << e.what();
        return EXIT_FAILURE;
    }

    return EXIT_SUCCESS;
}

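// Example invocation (illustrative only; the authoritative set of options is
// defined in ExecuteNetworkProgramOptions):
//   ExecuteNetwork -m model.tflite -f tflite-binary -c CpuAcc -i input -o output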
// MAIN
int main(int argc, const char* argv[])
{
    // Configures logging for both the ARMNN library and this test program.
    #ifdef NDEBUG
    armnn::LogSeverity level = armnn::LogSeverity::Info;
    #else
    armnn::LogSeverity level = armnn::LogSeverity::Debug;
    #endif
    armnn::ConfigureLogging(true, true, level);

    // Get ExecuteNetwork parameters and runtime options from the command line.
    // This might throw an InvalidArgumentException if the user provided invalid inputs.
    ProgramOptions ProgramOptions;
    try
    {
        ProgramOptions.ParseOptions(argc, argv);
    }
    catch (const std::exception& e)
    {
        ARMNN_LOG(fatal) << e.what();
        return EXIT_FAILURE;
    }

    if ((ProgramOptions.m_ExNetParams.m_OutputDetailsToStdOut ||
         ProgramOptions.m_ExNetParams.m_OutputDetailsOnlyToStdOut)
        && !ProgramOptions.m_ExNetParams.m_EnableProfiling)
    {
        ARMNN_LOG(fatal) << "You must enable profiling if you would like to output layer details";
        return EXIT_FAILURE;
    }

    // Create runtime
    std::shared_ptr<armnn::IRuntime> runtime(armnn::IRuntime::Create(ProgramOptions.m_RuntimeOptions));

    std::string modelFormat = ProgramOptions.m_ExNetParams.m_ModelFormat;

    // Forward to implementation based on the parser type
    if (modelFormat.find("armnn") != std::string::npos)
    {
    #if defined(ARMNN_SERIALIZER)
        return MainImpl<armnnDeserializer::IDeserializer, float>(ProgramOptions.m_ExNetParams, runtime);
    #else
        ARMNN_LOG(fatal) << "Not built with serialization support.";
        return EXIT_FAILURE;
    #endif
    }
    else if (modelFormat.find("onnx") != std::string::npos)
    {
    #if defined(ARMNN_ONNX_PARSER)
        return MainImpl<armnnOnnxParser::IOnnxParser, float>(ProgramOptions.m_ExNetParams, runtime);
    #else
        ARMNN_LOG(fatal) << "Not built with Onnx parser support.";
        return EXIT_FAILURE;
    #endif
    }
    else if (modelFormat.find("tflite") != std::string::npos)
    {
        if (ProgramOptions.m_ExNetParams.m_TfLiteExecutor == ExecuteNetworkParams::TfLiteExecutor::ArmNNTfLiteParser)
        {
        #if defined(ARMNN_TF_LITE_PARSER)
            return MainImpl<armnnTfLiteParser::ITfLiteParser, float>(ProgramOptions.m_ExNetParams, runtime);
        #else
            ARMNN_LOG(fatal) << "Not built with Tensorflow-Lite parser support.";
            return EXIT_FAILURE;
        #endif
        }
        else if (ProgramOptions.m_ExNetParams.m_TfLiteExecutor ==
                     ExecuteNetworkParams::TfLiteExecutor::ArmNNTfLiteDelegate ||
                 ProgramOptions.m_ExNetParams.m_TfLiteExecutor ==
                     ExecuteNetworkParams::TfLiteExecutor::TfliteInterpreter)
        {
        #if defined(ARMNN_TF_LITE_DELEGATE)
            return TfLiteDelegateMainImpl(ProgramOptions.m_ExNetParams, ProgramOptions.m_RuntimeOptions);
        #else
            ARMNN_LOG(fatal) << "Not built with Arm NN Tensorflow-Lite delegate support.";
            return EXIT_FAILURE;
        #endif
        }
    }
    else
    {
        ARMNN_LOG(fatal) << "Unknown model format: '" << modelFormat
                         << "'. Please include 'armnn', 'tflite' or 'onnx'";
        return EXIT_FAILURE;
    }
}