blob: cd760a8199c595fed9f899f06e72f54d9675d64d [file] [log] [blame]
Laurent Carlier749294b2020-06-01 09:03:17 +01001//
Sadik Armagana9c2ce12020-07-14 10:02:22 +01002// Copyright © 2017 Arm Ltd and Contributors. All rights reserved.
David Beckecb56cd2018-09-05 12:52:57 +01003// SPDX-License-Identifier: MIT
telsoa014fcda012018-03-09 14:13:49 +00004//
telsoa01c577f2c2018-08-31 09:22:23 +01005
Jan Eilers45274902020-10-15 18:34:43 +01006#include "NetworkExecutionUtils/NetworkExecutionUtils.hpp"
7#include "ExecuteNetworkProgramOptions.hpp"
Kevin Mayb4b3ac92021-05-21 16:42:21 +01008#include <armnn/IAsyncExecutionCallback.hpp>
9#include <AsyncExecutionCallback.hpp>
Jan Eilers45274902020-10-15 18:34:43 +010010
11#include <armnn/Logging.hpp>
12#include <Filesystem.hpp>
13#include <InferenceTest.hpp>
14
15#if defined(ARMNN_SERIALIZER)
16#include "armnnDeserializer/IDeserializer.hpp"
17#endif
Jan Eilers45274902020-10-15 18:34:43 +010018#if defined(ARMNN_TF_LITE_PARSER)
19#include "armnnTfLiteParser/ITfLiteParser.hpp"
20#endif
21#if defined(ARMNN_ONNX_PARSER)
22#include "armnnOnnxParser/IOnnxParser.hpp"
23#endif
Sadik Armagan5d03e312020-11-17 16:43:56 +000024#if defined(ARMNN_TFLITE_DELEGATE)
25#include <armnn_delegate.hpp>
26#include <DelegateOptions.hpp>
27
28#include <tensorflow/lite/builtin_ops.h>
29#include <tensorflow/lite/c/builtin_op_data.h>
30#include <tensorflow/lite/c/common.h>
31#include <tensorflow/lite/optional_debug_tools.h>
32#include <tensorflow/lite/kernels/builtin_op_kernels.h>
33#include <tensorflow/lite/interpreter.h>
34#include <tensorflow/lite/kernels/register.h>
35#endif
Jan Eilers45274902020-10-15 18:34:43 +010036
37#include <future>
Sadik Armagan5d03e312020-11-17 16:43:56 +000038#if defined(ARMNN_TFLITE_DELEGATE)
39int TfLiteDelegateMainImpl(const ExecuteNetworkParams& params,
40 const std::shared_ptr<armnn::IRuntime>& runtime = nullptr)
41{
42 using namespace tflite;
Jan Eilers45274902020-10-15 18:34:43 +010043
Sadik Armagan5d03e312020-11-17 16:43:56 +000044 std::unique_ptr<tflite::FlatBufferModel> model = tflite::FlatBufferModel::BuildFromFile(params.m_ModelPath.c_str());
45
46 auto tfLiteInterpreter = std::make_unique<Interpreter>();
47 tflite::ops::builtin::BuiltinOpResolver resolver;
48
49 tflite::InterpreterBuilder builder(*model, resolver);
50 builder(&tfLiteInterpreter);
51 tfLiteInterpreter->AllocateTensors();
52
Finn Williamsf806c4d2021-02-22 15:13:12 +000053 int status = 0;
54 if (params.m_TfLiteExecutor == ExecuteNetworkParams::TfLiteExecutor::ArmNNTfLiteDelegate)
Sadik Armagan19a1c032021-01-20 12:17:00 +000055 {
Finn Williamsf806c4d2021-02-22 15:13:12 +000056 // Create the Armnn Delegate
57 armnnDelegate::DelegateOptions delegateOptions(params.m_ComputeDevices);
58 std::unique_ptr<TfLiteDelegate, decltype(&armnnDelegate::TfLiteArmnnDelegateDelete)>
59 theArmnnDelegate(armnnDelegate::TfLiteArmnnDelegateCreate(delegateOptions),
60 armnnDelegate::TfLiteArmnnDelegateDelete);
61 // Register armnn_delegate to TfLiteInterpreter
62 status = tfLiteInterpreter->ModifyGraphWithDelegate(std::move(theArmnnDelegate));
63 if (status == kTfLiteError)
64 {
65 ARMNN_LOG(fatal) << "Could not register ArmNN TfLite Delegate to TfLiteInterpreter!";
66 return EXIT_FAILURE;
67 }
Sadik Armagan19a1c032021-01-20 12:17:00 +000068 }
Finn Williamsf806c4d2021-02-22 15:13:12 +000069 else
70 {
71 std::cout << "Running on TfLite without ArmNN delegate\n";
72 }
73
Sadik Armagan5d03e312020-11-17 16:43:56 +000074
75 std::vector<std::string> inputBindings;
76 for (const std::string& inputName: params.m_InputNames)
77 {
78 inputBindings.push_back(inputName);
79 }
80
81 armnn::Optional<std::string> dataFile = params.m_GenerateTensorData
82 ? armnn::EmptyOptional()
83 : armnn::MakeOptional<std::string>(params.m_InputTensorDataFilePaths[0]);
84
85 const size_t numInputs = inputBindings.size();
86
87 for(unsigned int inputIndex = 0; inputIndex < numInputs; ++inputIndex)
88 {
89 int input = tfLiteInterpreter->inputs()[inputIndex];
Sadik Armagan15f7fae2020-11-18 09:37:03 +000090 TfLiteIntArray* inputDims = tfLiteInterpreter->tensor(input)->dims;
91
92 long inputSize = 1;
93 for (unsigned int dim = 0; dim < static_cast<unsigned int>(inputDims->size); ++dim)
94 {
95 inputSize *= inputDims->data[dim];
96 }
97
Sadik Armagan5d03e312020-11-17 16:43:56 +000098 if (params.m_InputTypes[inputIndex].compare("float") == 0)
99 {
100 auto inputData = tfLiteInterpreter->typed_tensor<float>(input);
Finn Williamsbbbefec2020-11-25 14:32:42 +0000101
Matthew Sloyanf00f6c22020-12-07 13:33:24 +0000102 if(inputData == NULL)
Finn Williamsbbbefec2020-11-25 14:32:42 +0000103 {
104 ARMNN_LOG(fatal) << "Input tensor is null, input type: "
105 "\"" << params.m_InputTypes[inputIndex] << "\" may be incorrect.";
106 return EXIT_FAILURE;
107 }
108
Finn Williams56870182020-11-20 13:57:53 +0000109 std::vector<float> tensorData;
110 PopulateTensorWithDataGeneric<float>(tensorData,
111 params.m_InputTensorShapes[inputIndex]->GetNumElements(),
112 dataFile,
113 [](const std::string& s)
114 { return std::stof(s); });
Sadik Armagan15f7fae2020-11-18 09:37:03 +0000115
Finn Williams56870182020-11-20 13:57:53 +0000116 std::copy(tensorData.begin(), tensorData.end(), inputData);
117 }
Finn Williamsf806c4d2021-02-22 15:13:12 +0000118 else if (params.m_InputTypes[inputIndex].compare("qsymms8") == 0)
Finn Williams56870182020-11-20 13:57:53 +0000119 {
120 auto inputData = tfLiteInterpreter->typed_tensor<int8_t>(input);
Finn Williamsbbbefec2020-11-25 14:32:42 +0000121
Matthew Sloyanf00f6c22020-12-07 13:33:24 +0000122 if(inputData == NULL)
Finn Williamsbbbefec2020-11-25 14:32:42 +0000123 {
124 ARMNN_LOG(fatal) << "Input tensor is null, input type: "
125 "\"" << params.m_InputTypes[inputIndex] << "\" may be incorrect.";
126 return EXIT_FAILURE;
127 }
128
Finn Williams56870182020-11-20 13:57:53 +0000129 std::vector<int8_t> tensorData;
130 PopulateTensorWithDataGeneric<int8_t>(tensorData,
131 params.m_InputTensorShapes[inputIndex]->GetNumElements(),
132 dataFile,
133 [](const std::string& s)
134 { return armnn::numeric_cast<int8_t>(std::stoi(s)); });
135
136 std::copy(tensorData.begin(), tensorData.end(), inputData);
Sadik Armagan5d03e312020-11-17 16:43:56 +0000137 }
138 else if (params.m_InputTypes[inputIndex].compare("int") == 0)
139 {
140 auto inputData = tfLiteInterpreter->typed_tensor<int32_t>(input);
Finn Williamsbbbefec2020-11-25 14:32:42 +0000141
Matthew Sloyanf00f6c22020-12-07 13:33:24 +0000142 if(inputData == NULL)
Finn Williamsbbbefec2020-11-25 14:32:42 +0000143 {
144 ARMNN_LOG(fatal) << "Input tensor is null, input type: "
145 "\"" << params.m_InputTypes[inputIndex] << "\" may be incorrect.";
146 return EXIT_FAILURE;
147 }
148
Finn Williams56870182020-11-20 13:57:53 +0000149 std::vector<int32_t> tensorData;
150 PopulateTensorWithDataGeneric<int32_t>(tensorData,
151 params.m_InputTensorShapes[inputIndex]->GetNumElements(),
152 dataFile,
153 [](const std::string& s)
154 { return std::stoi(s); });
155
156 std::copy(tensorData.begin(), tensorData.end(), inputData);
Sadik Armagan5d03e312020-11-17 16:43:56 +0000157 }
158 else if (params.m_InputTypes[inputIndex].compare("qasymm8") == 0)
159 {
160 auto inputData = tfLiteInterpreter->typed_tensor<uint8_t>(input);
Finn Williamsbbbefec2020-11-25 14:32:42 +0000161
Matthew Sloyanf00f6c22020-12-07 13:33:24 +0000162 if(inputData == NULL)
Finn Williamsbbbefec2020-11-25 14:32:42 +0000163 {
164 ARMNN_LOG(fatal) << "Input tensor is null, input type: "
165 "\"" << params.m_InputTypes[inputIndex] << "\" may be incorrect.";
166 return EXIT_FAILURE;
167 }
168
Finn Williams56870182020-11-20 13:57:53 +0000169 std::vector<uint8_t> tensorData;
170 PopulateTensorWithDataGeneric<uint8_t>(tensorData,
171 params.m_InputTensorShapes[inputIndex]->GetNumElements(),
172 dataFile,
173 [](const std::string& s)
174 { return armnn::numeric_cast<uint8_t>(std::stoi(s)); });
175
176 std::copy(tensorData.begin(), tensorData.end(), inputData);
Sadik Armagan5d03e312020-11-17 16:43:56 +0000177 }
178 else
179 {
180 ARMNN_LOG(fatal) << "Unsupported input tensor data type \"" << params.m_InputTypes[inputIndex] << "\". ";
181 return EXIT_FAILURE;
182 }
183 }
184
185 for (size_t x = 0; x < params.m_Iterations; x++)
186 {
187 // Run the inference
Finn Williamsf806c4d2021-02-22 15:13:12 +0000188 status = tfLiteInterpreter->Invoke();
Sadik Armagan5d03e312020-11-17 16:43:56 +0000189
190 // Print out the output
191 for (unsigned int outputIndex = 0; outputIndex < params.m_OutputNames.size(); ++outputIndex)
192 {
Sadik Armagan5d03e312020-11-17 16:43:56 +0000193 auto tfLiteDelegateOutputId = tfLiteInterpreter->outputs()[outputIndex];
Sadik Armagan15f7fae2020-11-18 09:37:03 +0000194 TfLiteIntArray* outputDims = tfLiteInterpreter->tensor(tfLiteDelegateOutputId)->dims;
Sadik Armagan5d03e312020-11-17 16:43:56 +0000195
Sadik Armagan15f7fae2020-11-18 09:37:03 +0000196 long outputSize = 1;
Sadik Armagan5d03e312020-11-17 16:43:56 +0000197 for (unsigned int dim = 0; dim < static_cast<unsigned int>(outputDims->size); ++dim)
198 {
Sadik Armagan15f7fae2020-11-18 09:37:03 +0000199 outputSize *= outputDims->data[dim];
Sadik Armagan5d03e312020-11-17 16:43:56 +0000200 }
201
202 std::cout << params.m_OutputNames[outputIndex] << ": ";
203 if (params.m_OutputTypes[outputIndex].compare("float") == 0)
204 {
205 auto tfLiteDelageOutputData = tfLiteInterpreter->typed_tensor<float>(tfLiteDelegateOutputId);
Sadik Armagan5d03e312020-11-17 16:43:56 +0000206 if(tfLiteDelageOutputData == NULL)
207 {
208 ARMNN_LOG(fatal) << "Output tensor is null, output type: "
209 "\"" << params.m_OutputTypes[outputIndex] << "\" may be incorrect.";
210 return EXIT_FAILURE;
211 }
212
213 for (int i = 0; i < outputSize; ++i)
214 {
Finn Williamsf806c4d2021-02-22 15:13:12 +0000215 printf("%f ", tfLiteDelageOutputData[i]);
Sadik Armagan5d03e312020-11-17 16:43:56 +0000216 }
217 }
218 else if (params.m_OutputTypes[outputIndex].compare("int") == 0)
219 {
220 auto tfLiteDelageOutputData = tfLiteInterpreter->typed_tensor<int32_t>(tfLiteDelegateOutputId);
Sadik Armagan5d03e312020-11-17 16:43:56 +0000221 if(tfLiteDelageOutputData == NULL)
222 {
223 ARMNN_LOG(fatal) << "Output tensor is null, output type: "
224 "\"" << params.m_OutputTypes[outputIndex] << "\" may be incorrect.";
225 return EXIT_FAILURE;
226 }
227
228 for (int i = 0; i < outputSize; ++i)
229 {
Finn Williamsf806c4d2021-02-22 15:13:12 +0000230 printf("%d ", tfLiteDelageOutputData[i]);
Sadik Armagan5d03e312020-11-17 16:43:56 +0000231 }
232 }
Finn Williamsf806c4d2021-02-22 15:13:12 +0000233 else if (params.m_OutputTypes[outputIndex].compare("qsymms8") == 0)
Finn Williams56870182020-11-20 13:57:53 +0000234 {
235 auto tfLiteDelageOutputData = tfLiteInterpreter->typed_tensor<int8_t>(tfLiteDelegateOutputId);
236 if(tfLiteDelageOutputData == NULL)
237 {
238 ARMNN_LOG(fatal) << "Output tensor is null, output type: "
239 "\"" << params.m_OutputTypes[outputIndex] << "\" may be incorrect.";
240 return EXIT_FAILURE;
241 }
242
243 for (int i = 0; i < outputSize; ++i)
244 {
Finn Williamsf806c4d2021-02-22 15:13:12 +0000245 printf("%d ", tfLiteDelageOutputData[i]);
Finn Williams56870182020-11-20 13:57:53 +0000246 }
247 }
Sadik Armagan5d03e312020-11-17 16:43:56 +0000248 else if (params.m_OutputTypes[outputIndex].compare("qasymm8") == 0)
249 {
250 auto tfLiteDelageOutputData = tfLiteInterpreter->typed_tensor<uint8_t>(tfLiteDelegateOutputId);
Sadik Armagan5d03e312020-11-17 16:43:56 +0000251 if(tfLiteDelageOutputData == NULL)
252 {
253 ARMNN_LOG(fatal) << "Output tensor is null, output type: "
254 "\"" << params.m_OutputTypes[outputIndex] << "\" may be incorrect.";
255 return EXIT_FAILURE;
256 }
257
258 for (int i = 0; i < outputSize; ++i)
259 {
Finn Williamsf806c4d2021-02-22 15:13:12 +0000260 printf("%u ", tfLiteDelageOutputData[i]);
Sadik Armagan5d03e312020-11-17 16:43:56 +0000261 }
262 }
263 else
264 {
265 ARMNN_LOG(fatal) << "Output tensor is null, output type: "
266 "\"" << params.m_OutputTypes[outputIndex] <<
267 "\" may be incorrect. Output type can be specified with -z argument";
268 return EXIT_FAILURE;
269 }
270 std::cout << std::endl;
271 }
272 }
273
274 return status;
275}
276#endif
Jan Eilers45274902020-10-15 18:34:43 +0100277template<typename TParser, typename TDataType>
278int MainImpl(const ExecuteNetworkParams& params,
279 const std::shared_ptr<armnn::IRuntime>& runtime = nullptr)
280{
Kevin Mayb4b3ac92021-05-21 16:42:21 +0100281 using namespace std::chrono;
Jan Eilers45274902020-10-15 18:34:43 +0100282
Sadik Armagana04a9d72021-04-27 10:02:10 +0100283 std::vector<std::vector<TContainer>> inputs;
284 std::vector<std::vector<TContainer>> outputs;
Jan Eilers45274902020-10-15 18:34:43 +0100285
286 try
287 {
288 // Creates an InferenceModel, which will parse the model and load it into an IRuntime.
289 typename InferenceModel<TParser, TDataType>::Params inferenceModelParams;
290 inferenceModelParams.m_ModelPath = params.m_ModelPath;
291 inferenceModelParams.m_IsModelBinary = params.m_IsModelBinary;
292 inferenceModelParams.m_ComputeDevices = params.m_ComputeDevices;
293 inferenceModelParams.m_DynamicBackendsPath = params.m_DynamicBackendsPath;
294 inferenceModelParams.m_PrintIntermediateLayers = params.m_PrintIntermediate;
295 inferenceModelParams.m_VisualizePostOptimizationModel = params.m_EnableLayerDetails;
296 inferenceModelParams.m_ParseUnsupported = params.m_ParseUnsupported;
297 inferenceModelParams.m_InferOutputShape = params.m_InferOutputShape;
298 inferenceModelParams.m_EnableFastMath = params.m_EnableFastMath;
Matthew Sloyan42432112021-01-08 10:30:51 +0000299 inferenceModelParams.m_SaveCachedNetwork = params.m_SaveCachedNetwork;
300 inferenceModelParams.m_CachedNetworkFilePath = params.m_CachedNetworkFilePath;
Matthew Sloyan0a7dc6b2021-02-10 16:50:53 +0000301 inferenceModelParams.m_NumberOfThreads = params.m_NumberOfThreads;
Finn Williams40646322021-02-11 16:16:42 +0000302 inferenceModelParams.m_MLGOTuningFilePath = params.m_MLGOTuningFilePath;
Sadik Armagana04a9d72021-04-27 10:02:10 +0100303 inferenceModelParams.m_AsyncEnabled = params.m_Concurrent;
Kevin Mayb4b3ac92021-05-21 16:42:21 +0100304 inferenceModelParams.m_ThreadPoolSize = params.m_ThreadPoolSize;
Jan Eilers45274902020-10-15 18:34:43 +0100305
306 for(const std::string& inputName: params.m_InputNames)
307 {
308 inferenceModelParams.m_InputBindings.push_back(inputName);
309 }
310
311 for(unsigned int i = 0; i < params.m_InputTensorShapes.size(); ++i)
312 {
313 inferenceModelParams.m_InputShapes.push_back(*params.m_InputTensorShapes[i]);
314 }
315
316 for(const std::string& outputName: params.m_OutputNames)
317 {
318 inferenceModelParams.m_OutputBindings.push_back(outputName);
319 }
320
321 inferenceModelParams.m_SubgraphId = params.m_SubgraphId;
322 inferenceModelParams.m_EnableFp16TurboMode = params.m_EnableFp16TurboMode;
323 inferenceModelParams.m_EnableBf16TurboMode = params.m_EnableBf16TurboMode;
324
325 InferenceModel<TParser, TDataType> model(inferenceModelParams,
326 params.m_EnableProfiling,
327 params.m_DynamicBackendsPath,
328 runtime);
329
330 const size_t numInputs = inferenceModelParams.m_InputBindings.size();
Sadik Armagana04a9d72021-04-27 10:02:10 +0100331
332 armnn::Optional<QuantizationParams> qParams = params.m_QuantizeInput ?
333 armnn::MakeOptional<QuantizationParams>(
334 model.GetInputQuantizationParams()) :
335 armnn::EmptyOptional();
336
337 for(unsigned int j = 0; j < params.m_SimultaneousIterations ; ++j)
Jan Eilers45274902020-10-15 18:34:43 +0100338 {
Sadik Armagana04a9d72021-04-27 10:02:10 +0100339 std::vector<TContainer> inputDataContainers;
340 for(unsigned int i = 0; i < numInputs; ++i)
Jan Eilers45274902020-10-15 18:34:43 +0100341 {
Sadik Armagana04a9d72021-04-27 10:02:10 +0100342 armnn::Optional<std::string> dataFile = params.m_GenerateTensorData ?
343 armnn::EmptyOptional() :
344 armnn::MakeOptional<std::string>(
345 params.m_InputTensorDataFilePaths[(j * numInputs) + i]);
346
347 unsigned int numElements = model.GetInputSize(i);
348 if (params.m_InputTensorShapes.size() > i && params.m_InputTensorShapes[i])
349 {
350 // If the user has provided a tensor shape for the current input,
351 // override numElements
352 numElements = params.m_InputTensorShapes[i]->GetNumElements();
353 }
354
355 TContainer tensorData;
356 PopulateTensorWithData(tensorData,
357 numElements,
358 params.m_InputTypes[i],
359 qParams,
360 dataFile);
361
362 inputDataContainers.push_back(tensorData);
Jan Eilers45274902020-10-15 18:34:43 +0100363 }
Sadik Armagana04a9d72021-04-27 10:02:10 +0100364 inputs.push_back(inputDataContainers);
Jan Eilers45274902020-10-15 18:34:43 +0100365 }
366
367 const size_t numOutputs = inferenceModelParams.m_OutputBindings.size();
Jan Eilers45274902020-10-15 18:34:43 +0100368
Sadik Armagana04a9d72021-04-27 10:02:10 +0100369 for (unsigned int j = 0; j < params.m_SimultaneousIterations; ++j)
Jan Eilers45274902020-10-15 18:34:43 +0100370 {
Sadik Armagana04a9d72021-04-27 10:02:10 +0100371 std::vector <TContainer> outputDataContainers;
372 for (unsigned int i = 0; i < numOutputs; ++i)
Jan Eilers45274902020-10-15 18:34:43 +0100373 {
Sadik Armagana04a9d72021-04-27 10:02:10 +0100374 if (params.m_OutputTypes[i].compare("float") == 0)
Jan Eilers45274902020-10-15 18:34:43 +0100375 {
Sadik Armagana04a9d72021-04-27 10:02:10 +0100376 outputDataContainers.push_back(std::vector<float>(model.GetOutputSize(i)));
377 } else if (params.m_OutputTypes[i].compare("int") == 0)
378 {
379 outputDataContainers.push_back(std::vector<int>(model.GetOutputSize(i)));
380 } else if (params.m_OutputTypes[i].compare("qasymm8") == 0)
381 {
382 outputDataContainers.push_back(std::vector<uint8_t>(model.GetOutputSize(i)));
383 } else if (params.m_OutputTypes[i].compare("qsymms8") == 0)
384 {
385 outputDataContainers.push_back(std::vector<int8_t>(model.GetOutputSize(i)));
386 } else
387 {
388 ARMNN_LOG(fatal) << "Unsupported tensor data type \"" << params.m_OutputTypes[i] << "\". ";
389 return EXIT_FAILURE;
Jan Eilers45274902020-10-15 18:34:43 +0100390 }
391 }
Sadik Armagana04a9d72021-04-27 10:02:10 +0100392 outputs.push_back(outputDataContainers);
393 }
394
Kevin Mayb4b3ac92021-05-21 16:42:21 +0100395 // Synchronous execution
Sadik Armagana04a9d72021-04-27 10:02:10 +0100396 if (!params.m_Concurrent)
397 {
Sadik Armagana04a9d72021-04-27 10:02:10 +0100398 for (size_t x = 0; x < params.m_Iterations; x++)
399 {
400 // model.Run returns the inference time elapsed in EnqueueWorkload (in milliseconds)
401 auto inference_duration = model.Run(inputs[0], outputs[0]);
402
403 if (params.m_GenerateTensorData)
404 {
405 ARMNN_LOG(warning) << "The input data was generated, note that the output will not be useful";
406 }
407
408 // Print output tensors
409 const auto& infosOut = model.GetOutputBindingInfos();
410 for (size_t i = 0; i < numOutputs; i++)
411 {
412 const armnn::TensorInfo& infoOut = infosOut[i].second;
413 auto outputTensorFile = params.m_OutputTensorFiles.empty() ? "" : params.m_OutputTensorFiles[i];
414
415 TensorPrinter printer(inferenceModelParams.m_OutputBindings[i],
416 infoOut,
417 outputTensorFile,
418 params.m_DequantizeOutput);
419 mapbox::util::apply_visitor(printer, outputs[0][i]);
420 }
421
422 ARMNN_LOG(info) << "\nInference time: " << std::setprecision(2)
423 << std::fixed << inference_duration.count() << " ms\n";
424
425 // If thresholdTime == 0.0 (default), then it hasn't been supplied at command line
426 if (params.m_ThresholdTime != 0.0)
427 {
428 ARMNN_LOG(info) << "Threshold time: " << std::setprecision(2)
429 << std::fixed << params.m_ThresholdTime << " ms";
430 auto thresholdMinusInference = params.m_ThresholdTime - inference_duration.count();
431 ARMNN_LOG(info) << "Threshold time - Inference time: " << std::setprecision(2)
432 << std::fixed << thresholdMinusInference << " ms" << "\n";
433
434 if (thresholdMinusInference < 0)
435 {
436 std::string errorMessage = "Elapsed inference time is greater than provided threshold time.";
437 ARMNN_LOG(fatal) << errorMessage;
438 }
439 }
440 }
441 }
Kevin Mayb4b3ac92021-05-21 16:42:21 +0100442 // Asynchronous execution using the Arm NN thread pool
443 else if (params.m_ThreadPoolSize >= 2)
444 {
445 try
446 {
447 ARMNN_LOG(info) << "Asynchronous execution with Arm NN thread pool... \n";
448 std::vector<armnn::experimental::IAsyncExecutionCallbackPtr> callbacks;
449
450 // Create callbacks that will be checked post scheduling
451 for (size_t i = 0; i < params.m_SimultaneousIterations; ++i)
452 {
453 // Point to ArmNN example implementation of AsyncExecutionCallback
454 callbacks.emplace_back(std::make_shared<armnn::experimental::AsyncExecutionCallback>());
455 }
456
457 // Declare the latest and earliest inference times here to be used when calculating overall time
458 std::chrono::high_resolution_clock::time_point earliestStartTime;
459 std::chrono::high_resolution_clock::time_point latestEndTime =
460 std::chrono::high_resolution_clock::now();
461
462 // For the asynchronous execution, we are adding a pool of working memory handles (1 per thread) in the
463 // LoadedNetwork with each scheduled inference having a specific priority
464 for (size_t i = 0; i < callbacks.size(); ++i)
465 {
466 model.RunAsync(inputs[i], outputs[i], callbacks[i]);
467 }
468
469 // Check the results
470 unsigned int j = 0;
471 for (armnn::experimental::IAsyncExecutionCallbackPtr cb : callbacks)
472 {
473 // Get the results
474 auto endTime = time_point_cast<std::chrono::milliseconds>(cb->GetEndTime());
475 auto startTime = time_point_cast<std::chrono::milliseconds>(cb->GetStartTime());
476 auto inferenceDuration = endTime - startTime;
477
478 if (latestEndTime < cb->GetEndTime())
479 {
480 latestEndTime = cb->GetEndTime();
481 }
482
483 if (earliestStartTime.time_since_epoch().count() == 0)
484 {
485 earliestStartTime = cb->GetStartTime();
486 }
487 else if (earliestStartTime > cb->GetStartTime())
488 {
489 earliestStartTime = cb->GetStartTime();
490 }
491
492 if (params.m_GenerateTensorData)
493 {
494 ARMNN_LOG(warning) << "The input data was generated, note that the output will not be useful";
495 }
496
497 // Print output tensors
498 const auto& infosOut = model.GetOutputBindingInfos();
499 for (size_t i = 0; i < numOutputs; i++)
500 {
501 const armnn::TensorInfo& infoOut = infosOut[i].second;
502 auto outputTensorFile = params.m_OutputTensorFiles.empty()
503 ? ""
504 : params.m_OutputTensorFiles[(j * numOutputs) + i];
505
506 TensorPrinter printer(inferenceModelParams.m_OutputBindings[i],
507 infoOut,
508 outputTensorFile,
509 params.m_DequantizeOutput);
510 mapbox::util::apply_visitor(printer, outputs[j][i]);
511 }
512
513 ARMNN_LOG(info) << "\nInference time: " << std::setprecision(2)
514 << std::fixed << inferenceDuration.count() << " ms\n";
515
516 // If thresholdTime == 0.0 (default), then it hasn't been supplied at command line
517 if (params.m_ThresholdTime != 0.0)
518 {
519 ARMNN_LOG(info) << "Threshold time: " << std::setprecision(2)
520 << std::fixed << params.m_ThresholdTime << " ms";
521 auto thresholdMinusInference =
522 params.m_ThresholdTime - duration<double, std::milli>(inferenceDuration).count();
523 ARMNN_LOG(info) << "Threshold time - Inference time: " << std::setprecision(2)
524 << std::fixed << thresholdMinusInference << " ms" << "\n";
525
526 if (thresholdMinusInference < 0)
527 {
528 ARMNN_LOG(fatal) << "Elapsed inference time is greater than provided threshold time. \n";
529 }
530 }
531 ++j;
532 }
533 //print duration difference between overallStartTime and overallEndTime
534 auto overallEndTime = time_point_cast<std::chrono::milliseconds>(latestEndTime);
535 auto overallStartTime = time_point_cast<std::chrono::milliseconds>(earliestStartTime);
536 auto totalInferenceDuration = overallEndTime - overallStartTime;
537 ARMNN_LOG(info) << "\nOverall Inference time: " << std::setprecision(2)
538 << std::fixed << totalInferenceDuration.count() << " ms\n";
539 }
540 catch (const armnn::Exception& e)
541 {
542 ARMNN_LOG(fatal) << "Armnn Error: " << e.what();
543 return EXIT_FAILURE;
544 }
545 }
546 // Asynchronous execution using std::launch::async
Sadik Armagana04a9d72021-04-27 10:02:10 +0100547 else
548 {
549 try
550 {
Kevin Mayb4b3ac92021-05-21 16:42:21 +0100551 ARMNN_LOG(info) << "Asynchronous Execution with std::launch:async... \n";
Sadik Armagana04a9d72021-04-27 10:02:10 +0100552 std::vector<std::future<std::tuple<armnn::profiling::ProfilingGuid,
Kevin Mayb4b3ac92021-05-21 16:42:21 +0100553 std::chrono::duration<double, std::milli>>>> inferenceResults;
Sadik Armagana04a9d72021-04-27 10:02:10 +0100554 inferenceResults.reserve(params.m_SimultaneousIterations);
555
556 // Create WorkingMemHandles for each inference
557 std::vector<std::unique_ptr<armnn::experimental::IWorkingMemHandle>> workingMemHandles;
558 workingMemHandles.reserve(params.m_SimultaneousIterations);
559 for (unsigned int i = 0; i < params.m_SimultaneousIterations; ++i)
560 {
561 workingMemHandles.push_back(model.CreateWorkingMemHandle());
562 }
563
564 // Run each inference in its own thread
Kevin Mayb4b3ac92021-05-21 16:42:21 +0100565 // start a timer
566 const auto start_time = armnn::GetTimeNow();
Sadik Armagana04a9d72021-04-27 10:02:10 +0100567 for (unsigned int i = 0; i < params.m_SimultaneousIterations; ++i)
568 {
569 armnn::experimental::IWorkingMemHandle& workingMemHandleRef = *workingMemHandles[i].get();
570 inferenceResults.push_back(std::async(
571 std::launch::async, [&model, &workingMemHandleRef, &inputs, &outputs, i]() {
572 return model.RunAsync(workingMemHandleRef, inputs[i], outputs[i]);
573 }
574 ));
575 }
576
577 // Check the results
578 for (unsigned int j = 0; j < inferenceResults.size(); ++j)
579 {
580 // Get the results
581 auto inferenceResult = inferenceResults[j].get();
Kevin Mayb4b3ac92021-05-21 16:42:21 +0100582 auto inferenceDuration = std::get<1>(inferenceResult);
Sadik Armagana04a9d72021-04-27 10:02:10 +0100583 auto inferenceID = std::get<0>(inferenceResult);
584
585 if (params.m_GenerateTensorData)
586 {
587 ARMNN_LOG(warning) << "The input data was generated, note that the output will not be useful";
588 }
589
590 // Print output tensors
591 const auto& infosOut = model.GetOutputBindingInfos();
592 for (size_t i = 0; i < numOutputs; i++)
593 {
594 const armnn::TensorInfo& infoOut = infosOut[i].second;
595 auto outputTensorFile = params.m_OutputTensorFiles.empty()
596 ? ""
597 : params.m_OutputTensorFiles[(j * numOutputs) + i];
598
599 TensorPrinter printer(inferenceModelParams.m_OutputBindings[i],
600 infoOut,
601 outputTensorFile,
602 params.m_DequantizeOutput);
603 mapbox::util::apply_visitor(printer, outputs[j][i]);
604 }
605
606 ARMNN_LOG(info) << "\nInference time: " << std::setprecision(2)
Kevin Mayb4b3ac92021-05-21 16:42:21 +0100607 << std::fixed << inferenceDuration.count() << " ms\n";
Sadik Armagana04a9d72021-04-27 10:02:10 +0100608
609 // If thresholdTime == 0.0 (default), then it hasn't been supplied at command line
610 if (params.m_ThresholdTime != 0.0)
611 {
612 ARMNN_LOG(info) << "Threshold time: " << std::setprecision(2)
613 << std::fixed << params.m_ThresholdTime << " ms";
Kevin Mayb4b3ac92021-05-21 16:42:21 +0100614 auto thresholdMinusInference = params.m_ThresholdTime - inferenceDuration.count();
Sadik Armagana04a9d72021-04-27 10:02:10 +0100615 ARMNN_LOG(info) << "Threshold time - Inference time: " << std::setprecision(2)
616 << std::fixed << thresholdMinusInference << " ms" << "\n";
617
618 if (thresholdMinusInference < 0)
619 {
620 ARMNN_LOG(fatal) << "Elapsed inference time is greater than provided threshold time. \n";
621 }
622 }
623 ARMNN_LOG(info) << "Asynchronous Execution is finished for Inference ID: " << inferenceID << " \n";
624
625 }
Kevin Mayb4b3ac92021-05-21 16:42:21 +0100626 // finish timer
627 const auto duration = armnn::GetTimeDuration(start_time);
628 ARMNN_LOG(info) << "\nOverall Inference time: " << std::setprecision(2)
629 << std::fixed << duration.count() << " ms\n";
Sadik Armagana04a9d72021-04-27 10:02:10 +0100630 }
631 catch (const armnn::Exception& e)
632 {
633 ARMNN_LOG(fatal) << "Armnn Error: " << e.what();
634 return EXIT_FAILURE;
635 }
Jan Eilers45274902020-10-15 18:34:43 +0100636 }
637 }
638 catch (const armnn::Exception& e)
639 {
640 ARMNN_LOG(fatal) << "Armnn Error: " << e.what();
641 return EXIT_FAILURE;
642 }
643
644 return EXIT_SUCCESS;
645}
646
telsoa01c577f2c2018-08-31 09:22:23 +0100647
James Conroy7b4886f2019-04-11 10:23:58 +0100648// MAIN
telsoa01c577f2c2018-08-31 09:22:23 +0100649int main(int argc, const char* argv[])
650{
651 // Configures logging for both the ARMNN library and this test program.
Jan Eilers45274902020-10-15 18:34:43 +0100652 #ifdef NDEBUG
telsoa01c577f2c2018-08-31 09:22:23 +0100653 armnn::LogSeverity level = armnn::LogSeverity::Info;
Jan Eilers45274902020-10-15 18:34:43 +0100654 #else
telsoa01c577f2c2018-08-31 09:22:23 +0100655 armnn::LogSeverity level = armnn::LogSeverity::Debug;
Jan Eilers45274902020-10-15 18:34:43 +0100656 #endif
telsoa01c577f2c2018-08-31 09:22:23 +0100657 armnn::ConfigureLogging(true, true, level);
telsoa01c577f2c2018-08-31 09:22:23 +0100658
telsoa01c577f2c2018-08-31 09:22:23 +0100659
Jan Eilers45274902020-10-15 18:34:43 +0100660 // Get ExecuteNetwork parameters and runtime options from command line
661 ProgramOptions ProgramOptions(argc, argv);
Narumol Prangnawaratd8cc8112020-03-24 13:54:05 +0000662
Finn Williamsd7fcafa2020-04-23 17:55:18 +0100663 // Create runtime
Jan Eilers45274902020-10-15 18:34:43 +0100664 std::shared_ptr<armnn::IRuntime> runtime(armnn::IRuntime::Create(ProgramOptions.m_RuntimeOptions));
Finn Williamsd7fcafa2020-04-23 17:55:18 +0100665
Jan Eilers45274902020-10-15 18:34:43 +0100666 std::string modelFormat = ProgramOptions.m_ExNetParams.m_ModelFormat;
667
668 // Forward to implementation based on the parser type
669 if (modelFormat.find("armnn") != std::string::npos)
Finn Williamsd7fcafa2020-04-23 17:55:18 +0100670 {
Jan Eilers45274902020-10-15 18:34:43 +0100671 #if defined(ARMNN_SERIALIZER)
672 return MainImpl<armnnDeserializer::IDeserializer, float>(ProgramOptions.m_ExNetParams, runtime);
673 #else
674 ARMNN_LOG(fatal) << "Not built with serialization support.";
Finn Williamsd7fcafa2020-04-23 17:55:18 +0100675 return EXIT_FAILURE;
Jan Eilers45274902020-10-15 18:34:43 +0100676 #endif
Finn Williamsd7fcafa2020-04-23 17:55:18 +0100677 }
Jan Eilers45274902020-10-15 18:34:43 +0100678 else if (modelFormat.find("onnx") != std::string::npos)
telsoa01c577f2c2018-08-31 09:22:23 +0100679 {
Jan Eilers45274902020-10-15 18:34:43 +0100680 #if defined(ARMNN_ONNX_PARSER)
681 return MainImpl<armnnOnnxParser::IOnnxParser, float>(ProgramOptions.m_ExNetParams, runtime);
682 #else
683 ARMNN_LOG(fatal) << "Not built with Onnx parser support.";
684 return EXIT_FAILURE;
685 #endif
686 }
Jan Eilers45274902020-10-15 18:34:43 +0100687 else if(modelFormat.find("tflite") != std::string::npos)
688 {
Finn Williamsf806c4d2021-02-22 15:13:12 +0000689 if (ProgramOptions.m_ExNetParams.m_TfLiteExecutor == ExecuteNetworkParams::TfLiteExecutor::ArmNNTfLiteParser)
690 {
691 #if defined(ARMNN_TF_LITE_PARSER)
692 return MainImpl<armnnTfLiteParser::ITfLiteParser, float>(ProgramOptions.m_ExNetParams, runtime);
693 #else
694 ARMNN_LOG(fatal) << "Not built with Tensorflow-Lite parser support.";
695 return EXIT_FAILURE;
696 #endif
697 }
698 else if (ProgramOptions.m_ExNetParams.m_TfLiteExecutor ==
699 ExecuteNetworkParams::TfLiteExecutor::ArmNNTfLiteDelegate ||
700 ProgramOptions.m_ExNetParams.m_TfLiteExecutor ==
701 ExecuteNetworkParams::TfLiteExecutor::TfliteInterpreter)
Sadik Armagan5d03e312020-11-17 16:43:56 +0000702 {
703 #if defined(ARMNN_TF_LITE_DELEGATE)
704 return TfLiteDelegateMainImpl(ProgramOptions.m_ExNetParams, runtime);
705 #else
Finn Williamsbbbefec2020-11-25 14:32:42 +0000706 ARMNN_LOG(fatal) << "Not built with Arm NN Tensorflow-Lite delegate support.";
Sadik Armagan5d03e312020-11-17 16:43:56 +0000707 return EXIT_FAILURE;
708 #endif
709 }
Jan Eilers45274902020-10-15 18:34:43 +0100710 }
711 else
712 {
713 ARMNN_LOG(fatal) << "Unknown model format: '" << modelFormat
Nikhil Raj5d955cf2021-04-19 16:59:48 +0100714 << "'. Please include 'tflite' or 'onnx'";
Jan Eilers45274902020-10-15 18:34:43 +0100715 return EXIT_FAILURE;
telsoa014fcda012018-03-09 14:13:49 +0000716 }
717}