Blame - source/use_case/ad/src/UseCaseHandler.cc - ml/ethos-u/ml-embedded-evaluation-kit

2021-03-26 21:42:19 +0000

[diff] [blame]

1

/*

2

3

* SPDX-License-Identifier: Apache-2.0

4

*

5

* Licensed under the Apache License, Version 2.0 (the "License");

6

* you may not use this file except in compliance with the License.

7

* You may obtain a copy of the License at

8

*

9

* http://www.apache.org/licenses/LICENSE-2.0

10

*

11

* Unless required by applicable law or agreed to in writing, software

12

* distributed under the License is distributed on an "AS IS" BASIS,

13

* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

14

* See the License for the specific language governing permissions and

15

* limitations under the License.

16

*/

17

#include "UseCaseHandler.hpp"

18

19

#include "AdModel.hpp"

20

#include "InputFiles.hpp"

21

#include "Classifier.hpp"

22

#include "hal.h"

23

#include "AdMelSpectrogram.hpp"

24

#include "AudioUtils.hpp"

25

#include "UseCaseCommonUtils.hpp"

26

#include "AdPostProcessing.hpp"

namespace arm {

namespace app {

/**

* @brief Helper function to increment current audio clip index

Isabella Gottardi

2021-05-12 08:27:15 +0100

[diff] [blame^]

33

* @param[in,out] ctx reference to the application context object

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

34

**/

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

35

static void IncrementAppCtxClipIdx(ApplicationContext& ctx);

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

36

37

/**

38

* @brief Helper function to set the audio clip index

Isabella Gottardi

2021-05-12 08:27:15 +0100

[diff] [blame^]

39

* @param[in,out] ctx reference to the application context object

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

40

* @param[in] idx value to be set

41

* @return true if index is set, false otherwise

42

**/

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

43

static bool SetAppCtxClipIdx(ApplicationContext& ctx, uint32_t idx);

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

44

45

/**

46

* @brief Presents inference results using the data presentation

47

* object.

48

* @param[in] platform reference to the hal platform object

49

* @param[in] result average sum of classification results

Isabella Gottardi

2021-05-12 08:27:15 +0100

[diff] [blame^]

50

* @param[in] threshold if larger than this value we have an anomaly

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

51

* @return true if successful, false otherwise

52

**/

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

53

static bool PresentInferenceResult(hal_platform& platform, float result, float threshold);

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

54

55

/**

56

* @brief Returns a function to perform feature calculation and populates input tensor data with

57

* Mel spectrogram data.

58

*

59

* Input tensor data type check is performed to choose correct Mel spectrogram feature data type.

60

* If tensor has an integer data type then original features are quantised.

61

*

62

* Warning: the Mel spectrogram calculator provided as input is captured by reference and must outlive the returned function.

63

*

Isabella Gottardi

2021-05-12 08:27:15 +0100

[diff] [blame^]

64

* @param[in] melSpec Mel spectrogram feature calculator.

65

* @param[in,out] inputTensor Input tensor pointer to store calculated features.

66

* @param[in] cacheSize Size of the feature vectors cache (number of feature vectors).

67

* @param[in] trainingMean Training mean.

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

68

* @return function to be called providing audio sample and sliding window index.

69

*/

70

static std::function<void (std::vector<int16_t>&, int, bool, size_t, size_t)>

71

GetFeatureCalculator(audio::AdMelSpectrogram& melSpec,

72

TfLiteTensor* inputTensor,

size_t cacheSize,

float trainingMean);

/* Vibration classification handler */

77

bool ClassifyVibrationHandler(ApplicationContext& ctx, uint32_t clipIndex, bool runAll)

78

{

79

auto& platform = ctx.Get<hal_platform&>("platform");

Isabella Gottardi

8df12f3

2021-04-07 17:15:31 +0100

[diff] [blame]

80

auto& profiler = ctx.Get<Profiler&>("profiler");

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

81

82

constexpr uint32_t dataPsnTxtInfStartX = 20;

83

constexpr uint32_t dataPsnTxtInfStartY = 40;

84

85

platform.data_psn->clear(COLOR_BLACK);

86

87

auto& model = ctx.Get<Model&>("model");

88

89

/* If the request has a valid size, set the audio index */

90

if (clipIndex < NUMBER_OF_FILES) {

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

91

if (!SetAppCtxClipIdx(ctx, clipIndex)) {

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

return false;

}

}

if (!model.IsInited()) {

96

printf_err("Model is not initialised! Terminating processing.\n");

return false;

}

const auto frameLength = ctx.Get<int>("frameLength");

101

const auto frameStride = ctx.Get<int>("frameStride");

102

const auto scoreThreshold = ctx.Get<float>("scoreThreshold");

Isabella Gottardi

8df12f3

2021-04-07 17:15:31 +0100

[diff] [blame]

103

const auto trainingMean = ctx.Get<float>("trainingMean");

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

104

auto startClipIdx = ctx.Get<uint32_t>("clipIndex");

105

106

TfLiteTensor* outputTensor = model.GetOutputTensor(0);

107

TfLiteTensor* inputTensor = model.GetInputTensor(0);

108

109

if (!inputTensor->dims) {

110

printf_err("Invalid input tensor dims\n");

return false;

}

TfLiteIntArray* inputShape = model.GetInputShape(0);

115

const uint32_t kNumRows = inputShape->data[1];

116

const uint32_t kNumCols = inputShape->data[2];

117

118

audio::AdMelSpectrogram melSpec = audio::AdMelSpectrogram(frameLength);

119

melSpec.Init();

120

121

/* Deduce the data length required for 1 inference from the network parameters. */

122

const uint8_t inputResizeScale = 2;

123

const uint32_t audioDataWindowSize = (((inputResizeScale * kNumCols) - 1) * frameStride) + frameLength;

124

125

/* We are choosing to move by 20 frames across the audio for each inference. */

126

const uint8_t nMelSpecVectorsInAudioStride = 20;

127

128

auto audioDataStride = nMelSpecVectorsInAudioStride * frameStride;

129

130

do {

131

auto currentIndex = ctx.Get<uint32_t>("clipIndex");

132

133

/* Get the output index to look at based on id in the filename. */

134

int8_t machineOutputIndex = OutputIndexFromFileName(get_filename(currentIndex));

135

if (machineOutputIndex == -1) {

return false;

}

/* Creating a Mel Spectrogram sliding window for the data required for 1 inference.

140

* "resizing" done here by multiplying stride by resize scale. */

141

auto audioMelSpecWindowSlider = audio::SlidingWindow<const int16_t>(

142

get_audio_array(currentIndex),

143

audioDataWindowSize, frameLength,

144

frameStride * inputResizeScale);

145

146

/* Creating a sliding window through the whole audio clip. */

147

auto audioDataSlider = audio::SlidingWindow<const int16_t>(

148

get_audio_array(currentIndex),

149

get_audio_array_size(currentIndex),

150

audioDataWindowSize, audioDataStride);

151

152

/* Calculate number of the feature vectors in the window overlap region taking into account resizing.

153

* These feature vectors will be reused.*/

154

auto numberOfReusedFeatureVectors = kNumRows - (nMelSpecVectorsInAudioStride / inputResizeScale);

155

156

/* Construct feature calculation function. */

157

auto melSpecFeatureCalc = GetFeatureCalculator(melSpec, inputTensor,

158

numberOfReusedFeatureVectors, trainingMean);

159

if (!melSpecFeatureCalc){

return false;

}

/* Result is an averaged sum over inferences. */

164

float result = 0;

165

166

/* Display message on the LCD - inference running. */

167

std::string str_inf{"Running inference... "};

168

platform.data_psn->present_data_text(

169

str_inf.c_str(), str_inf.size(),

170

dataPsnTxtInfStartX, dataPsnTxtInfStartY, 0);

Kshitij Sisodia

f9c19ea

2021-05-07 16:08:14 +0100

[diff] [blame]

171

info("Running inference on audio clip %" PRIu32 " => %s\n", currentIndex, get_filename(currentIndex));

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

172

173

/* Start sliding through audio clip. */

174

while (audioDataSlider.HasNext()) {

175

const int16_t *inferenceWindow = audioDataSlider.Next();

176

177

/* We moved to the next window - set the features sliding to the new address. */

178

audioMelSpecWindowSlider.Reset(inferenceWindow);

179

180

/* The first window does not have cache ready. */

181

bool useCache = audioDataSlider.Index() > 0 && numberOfReusedFeatureVectors > 0;

182

183

/* Start calculating features inside one audio sliding window. */

184

while (audioMelSpecWindowSlider.HasNext()) {

185

const int16_t *melSpecWindow = audioMelSpecWindowSlider.Next();

186

std::vector<int16_t> melSpecAudioData = std::vector<int16_t>(melSpecWindow,

187

melSpecWindow + frameLength);

188

189

/* Compute features for this window and write them to input tensor. */

190

melSpecFeatureCalc(melSpecAudioData, audioMelSpecWindowSlider.Index(),

191

useCache, nMelSpecVectorsInAudioStride, inputResizeScale);

192

}

193

194

info("Inference %zu/%zu\n", audioDataSlider.Index() + 1,

195

audioDataSlider.TotalStrides() + 1);

196

197

/* Run inference over this audio clip sliding window */

alexander

27b62d9

2021-05-04 20:46:08 +0100

[diff] [blame]

198

if (!RunInference(model, profiler)) {

199

return false;

200

}

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

201

202

/* Use the negative softmax score of the corresponding index as the outlier score */

203

std::vector<float> dequantOutput = Dequantize<int8_t>(outputTensor);

204

Softmax(dequantOutput);

205

result += -dequantOutput[machineOutputIndex];

206

207

#if VERIFY_TEST_OUTPUT

208

arm::app::DumpTensor(outputTensor);

209

#endif /* VERIFY_TEST_OUTPUT */

210

} /* while (audioDataSlider.HasNext()) */

211

212

/* Use average over whole clip as final score. */

213

result /= (audioDataSlider.TotalStrides() + 1);

214

215

/* Erase. */

216

str_inf = std::string(str_inf.size(), ' ');

217

platform.data_psn->present_data_text(

218

str_inf.c_str(), str_inf.size(),

219

dataPsnTxtInfStartX, dataPsnTxtInfStartY, 0);

220

221

ctx.Set<float>("result", result);

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

222

if (!PresentInferenceResult(platform, result, scoreThreshold)) {

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

return false;

}

Isabella Gottardi

2021-04-07 17:15:31 +0100

[diff] [blame]

226

profiler.PrintProfilingResult();

227

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

228

IncrementAppCtxClipIdx(ctx);

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

229

230

} while (runAll && ctx.Get<uint32_t>("clipIndex") != startClipIdx);

return true;

}

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

235

/* Advances the "clipIndex" stored in the context by one, wrapping back to
 * zero once the next index would reach NUMBER_OF_FILES. */
static void IncrementAppCtxClipIdx(ApplicationContext& ctx)
{
    const auto currentIdx = ctx.Get<uint32_t>("clipIndex");
    const bool wrapsAround = (currentIdx + 1 >= NUMBER_OF_FILES);

    ctx.Set<uint32_t>("clipIndex", wrapsAround ? 0 : currentIdx + 1);
}

246

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

247

/* Stores idx as the "clipIndex" in the context when it is below
 * NUMBER_OF_FILES; otherwise reports the error and leaves the context as is.
 * Returns whether the index was stored. */
static bool SetAppCtxClipIdx(ApplicationContext& ctx, uint32_t idx)
{
    const bool idxInRange = (idx < NUMBER_OF_FILES);

    if (idxInRange) {
        ctx.Set<uint32_t>("clipIndex", idx);
    } else {
        printf_err("Invalid idx %" PRIu32 " (expected less than %u)\n",
                   idx, NUMBER_OF_FILES);
    }

    return idxInRange;
}

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

258

/* Builds a three line report (average score, threshold, verdict), shows it
 * through the platform's data presentation object in green text and echoes it
 * to the log. A score strictly above the threshold is reported as an anomaly.
 * Always returns true. */
static bool PresentInferenceResult(hal_platform& platform, float result, float threshold)
{
    constexpr uint32_t textStartX = 20;
    constexpr uint32_t textStartY = 30;
    constexpr uint32_t rowIncrement = 16; /* Row index increment */

    /* The report is placed two rows below the starting row. */
    constexpr uint32_t reportRow = textStartY + 2 * rowIncrement;

    platform.data_psn->set_text_color(COLOR_GREEN);

    /* Assemble the report piece by piece. */
    std::string report{"Average anomaly score is: "};
    report += std::to_string(result);
    report += "\n";
    report += "Anomaly threshold is: ";
    report += std::to_string(threshold);
    report += "\n";
    report += (result > threshold) ? "Anomaly detected!"
                                   : "Everything fine, no anomaly detected!";

    platform.data_psn->present_data_text(
            report.c_str(), report.size(),
            textStartX, reportRow, false);

    info("%s\n", report.c_str());

    return true;
}

/**

* @brief Generic feature calculator factory.

290

*

291

* Returns lambda function to compute features using features cache.

292

* Real features math is done by a lambda function provided as a parameter.

293

* Features are written to input tensor memory.

294

*

295

* @tparam T feature vector type.

296

* @param inputTensor model input tensor pointer.

297

* @param cacheSize number of feature vectors to cache. Defined by the sliding window overlap.

298

* @param compute features calculator function.

299

* @return lambda function to compute features.

300

*/

301

template<class T>

302

std::function<void (std::vector<int16_t>&, size_t, bool, size_t, size_t)>

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

303

FeatureCalc(TfLiteTensor* inputTensor, size_t cacheSize,

304

std::function<std::vector<T> (std::vector<int16_t>& )> compute)

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

305

{

306

/* Feature cache to be captured by lambda function*/

307

static std::vector<std::vector<T>> featureCache = std::vector<std::vector<T>>(cacheSize);

308

309

return [=](std::vector<int16_t>& audioDataWindow,

310

size_t index,

311

bool useCache,

312

size_t featuresOverlapIndex,

313

size_t resizeScale)

314

{

315

T *tensorData = tflite::GetTensorData<T>(inputTensor);

316

std::vector<T> features;

317

318

/* Reuse features from cache if cache is ready and sliding windows overlap.

319

* Overlap is in the beginning of sliding window with a size of a feature cache. */

320

if (useCache && index < featureCache.size()) {

321

features = std::move(featureCache[index]);

322

} else {

323

features = std::move(compute(audioDataWindow));

324

}

325

auto size = features.size() / resizeScale;

326

auto sizeBytes = sizeof(T);

327

328

/* Input should be transposed and "resized" by skipping elements. */

329

for (size_t outIndex = 0; outIndex < size; outIndex++) {

330

std::memcpy(tensorData + (outIndex*size) + index, &features[outIndex*resizeScale], sizeBytes);

331

}

332

333

/* Start renewing cache as soon iteration goes out of the windows overlap. */

334

if (index >= featuresOverlapIndex / resizeScale) {

335

featureCache[index - featuresOverlapIndex / resizeScale] = std::move(features);

}

};

}

template std::function<void (std::vector<int16_t>&, size_t , bool, size_t, size_t)>

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

341

FeatureCalc<int8_t>(TfLiteTensor* inputTensor,

342

size_t cacheSize,

343

std::function<std::vector<int8_t> (std::vector<int16_t>&)> compute);

344

345

template std::function<void (std::vector<int16_t>&, size_t , bool, size_t, size_t)>

346

FeatureCalc<uint8_t>(TfLiteTensor* inputTensor,

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

347

size_t cacheSize,

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

348

std::function<std::vector<uint8_t> (std::vector<int16_t>&)> compute);

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

349

350

template std::function<void (std::vector<int16_t>&, size_t , bool, size_t, size_t)>

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

351

FeatureCalc<int16_t>(TfLiteTensor* inputTensor,

352

size_t cacheSize,

353

std::function<std::vector<int16_t> (std::vector<int16_t>&)> compute);

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

354

355

template std::function<void(std::vector<int16_t>&, size_t, bool, size_t, size_t)>

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

356

FeatureCalc<float>(TfLiteTensor *inputTensor,

357

size_t cacheSize,

358

std::function<std::vector<float>(std::vector<int16_t>&)> compute);

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

359

360

361

static std::function<void (std::vector<int16_t>&, int, bool, size_t, size_t)>

362

GetFeatureCalculator(audio::AdMelSpectrogram& melSpec, TfLiteTensor* inputTensor, size_t cacheSize, float trainingMean)

363

{

364

std::function<void (std::vector<int16_t>&, size_t, bool, size_t, size_t)> melSpecFeatureCalc;

365

366

TfLiteQuantization quant = inputTensor->quantization;

367

368

if (kTfLiteAffineQuantization == quant.type) {

369

370

auto *quantParams = (TfLiteAffineQuantization *) quant.params;

371

const float quantScale = quantParams->scale->data[0];

372

const int quantOffset = quantParams->zero_point->data[0];

373

374

switch (inputTensor->type) {

375

case kTfLiteInt8: {

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

376

melSpecFeatureCalc = FeatureCalc<int8_t>(inputTensor,

377

cacheSize,

378

[=, &melSpec](std::vector<int16_t>& audioDataWindow) {

379

return melSpec.MelSpecComputeQuant<int8_t>(

audioDataWindow,

quantScale,

quantOffset,

trainingMean);

}

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

);

break;

}

case kTfLiteUInt8: {

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

389

melSpecFeatureCalc = FeatureCalc<uint8_t>(inputTensor,

390

cacheSize,

391

[=, &melSpec](std::vector<int16_t>& audioDataWindow) {

392

return melSpec.MelSpecComputeQuant<uint8_t>(

audioDataWindow,

quantScale,

quantOffset,

trainingMean);

}

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

);

break;

}

case kTfLiteInt16: {

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

402

melSpecFeatureCalc = FeatureCalc<int16_t>(inputTensor,

403

cacheSize,

404

[=, &melSpec](std::vector<int16_t>& audioDataWindow) {

405

return melSpec.MelSpecComputeQuant<int16_t>(

audioDataWindow,

quantScale,

quantOffset,

trainingMean);

}

alexander

2021-03-26 21:42:19 +0000

[diff] [blame]

);

break;

}

default:

printf_err("Tensor type %s not supported\n", TfLiteTypeGetName(inputTensor->type));

}

} else {

alexander

2021-04-29 20:36:09 +0100

[diff] [blame]

420

melSpecFeatureCalc = melSpecFeatureCalc = FeatureCalc<float>(inputTensor,

421

cacheSize,

422

[=, &melSpec](

423

std::vector<int16_t>& audioDataWindow) {

424

return melSpec.ComputeMelSpec(

425

audioDataWindow,

426

trainingMean);

427

});

alexander