blob: 9fb87fd3c97b90b70ba27b4f9463526536eca445 [file] [log] [blame]
//
// Copyright © 2021 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//
#include <catch.hpp>
#include <map>
#include <cinttypes>
#include "KeywordSpottingPipeline.hpp"
#include "DsCNNPreprocessor.hpp"
static std::string GetResourceFilePath(const std::string& filename)
{
std::string testResources = TEST_RESOURCE_DIR;
if (testResources.empty())
{
throw std::invalid_argument("Invalid test resources directory provided");
}
else
{
if(testResources.back() != '/')
{
return testResources + "/" + filename;
}
else
{
return testResources + filename;
}
}
}
TEST_CASE("Test Keyword spotting pipeline")
{
const int8_t ifm0_kws [] =
{
-0x1b, 0x4f, 0x7a, -0x55, 0x6, -0x11, 0x6e, -0x6, 0x67, -0x7e, -0xd, 0x6, 0x49, 0x79, -0x1e, 0xe,
0x1d, 0x6e, 0x6f, 0x6f, -0x2e, -0x4b, 0x2, -0x3e, 0x40, -0x4b, -0x7, 0x31, -0x38, -0x64, -0x28,
0xc, -0x1d, 0xf, 0x1c, 0x5a, -0x4b, 0x56, 0x7e, 0x9, -0x29, 0x13, -0x65, -0xa, 0x34, -0x59, 0x41,
-0x6f, 0x75, 0x67, -0x5f, 0x17, 0x4a, -0x76, -0x7a, 0x49, -0x19, -0x41, 0x78, 0x40, 0x44, 0xe,
-0x51, -0x5c, 0x3d, 0x24, 0x76, -0x66, -0x11, 0x5e, 0x7b, -0x4, 0x7a, 0x9, 0x13, 0x8, -0x21, -0x11,
0x13, 0x7a, 0x25, 0x6, -0x68, 0x6a, -0x30, -0x16, -0x43, -0x27, 0x4c, 0x6b, -0x14, -0x12, -0x5f,
0x49, -0x2a, 0x44, 0x57, -0x78, -0x72, 0x62, -0x8, -0x38, -0x73, -0x2, -0x80, 0x79, -0x3f, 0x57,
0x9, -0x7e, -0x34, -0x59, 0x19, -0x66, 0x58, -0x3b, -0x69, -0x1a, 0x13, -0x2f, -0x2f, 0x13, 0x35,
-0x30, 0x1e, 0x3b, -0x71, 0x67, 0x7d, -0x5d, 0x1a, 0x69, -0x53, -0x38, -0xf, 0x76, 0x2, 0x7e, 0x45,
-0xa, 0x59, -0x6b, -0x28, -0x5d, -0x63, -0x7d, -0x3, 0x48, 0x74, -0x75, -0x7a, 0x1f, -0x53, 0x5b,
0x4d, -0x18, -0x4a, 0x39, -0x52, 0x5a, -0x6b, -0x41, -0x3e, -0x61, -0x80, -0x52, 0x67, 0x71, -0x47,
0x79, -0x41, 0x3a, -0x8, -0x1f, 0x4d, -0x7, 0x5b, 0x6b, -0x1b, -0x8, -0x20, -0x21, 0x7c, -0x74,
0x25, -0x68, -0xe, -0x7e, -0x45, -0x28, 0x45, -0x1a, -0x39, 0x78, 0x11, 0x48, -0x6b, -0x7b, -0x43,
-0x21, 0x38, 0x46, 0x7c, -0x5d, 0x59, 0x53, -0x3f, -0x15, 0x59, -0x17, 0x75, 0x2f, 0x7c, 0x68, 0x6a,
0x0, -0x10, 0x5b, 0x61, 0x36, -0x41, 0x33, 0x23, -0x80, -0x1d, -0xb, -0x56, 0x2d, 0x68, -0x68,
0x2f, 0x48, -0x5d, -0x44, 0x64, -0x27, 0x68, -0x13, 0x39, -0x3f, 0x18, 0x31, 0x15, -0x78, -0x2,
0x72, 0x60, 0x59, -0x30, -0x22, 0x73, 0x61, 0x76, -0x4, -0x62, -0x64, -0x80, -0x32, -0x16, 0x51,
-0x2, -0x70, 0x71, 0x3f, -0x5f, -0x35, -0x3c, 0x79, 0x48, 0x61, 0x5b, -0x20, -0x1e, -0x68, -0x1c,
0x6c, 0x3a, 0x28, -0x36, -0x3e, 0x5f, -0x75, -0x73, 0x1e, 0x75, -0x66, -0x22, 0x20, -0x64, 0x67,
0x36, 0x14, 0x37, -0xa, -0xe, 0x8, -0x37, -0x43, 0x21, -0x8, 0x54, 0x1, 0x34, -0x2c, -0x73, -0x11,
-0x48, -0x1c, -0x40, 0x14, 0x4e, -0x53, 0x25, 0x5e, 0x14, 0x4f, 0x7c, 0x6d, -0x61, -0x38, 0x35,
-0x5a, -0x44, 0x12, 0x52, -0x60, 0x22, -0x1c, -0x8, -0x4, -0x6b, -0x71, 0x43, 0xb, 0x7b, -0x7,
-0x3c, -0x3b, -0x40, -0xd, 0x44, 0x6, 0x30, 0x38, 0x57, 0x1f, -0x7, 0x2, 0x4f, 0x64, 0x7c, -0x3,
-0x13, -0x71, -0x45, -0x53, -0x52, 0x2b, -0x11, -0x1d, -0x2, -0x29, -0x37, 0x3d, 0x19, 0x76, 0x18,
0x1d, 0x12, -0x29, -0x5e, -0x54, -0x48, 0x5d, -0x41, -0x3f, 0x7e, -0x2a, 0x41, 0x57, -0x65, -0x15,
0x12, 0x1f, -0x57, 0x79, -0x64, 0x3a, -0x2f, 0x7f, -0x6c, 0xa, 0x52, -0x1f, -0x41, 0x6e, -0x4b,
0x3d, -0x1b, -0x42, 0x22, -0x3c, -0x35, -0xf, 0xc, 0x32, -0x15, -0x68, -0x21, 0x0, -0x16, 0x14,
-0x10, -0x5b, 0x2f, 0x21, 0x41, -0x8, -0x12, -0xa, 0x10, 0xf, 0x7e, -0x76, -0x1d, 0x2b, -0x49,
0x42, -0x25, -0x78, -0x69, -0x2c, 0x3f, 0xc, 0x52, 0x6d, 0x2e, -0x13, 0x76, 0x37, -0x36, -0x51,
-0x5, -0x63, -0x4f, 0x1c, 0x6b, -0x4b, 0x71, -0x12, 0x72, -0x3f,-0x4a, 0xf, 0x3a, -0xd, 0x38, 0x3b,
-0x5d, 0x75, -0x43, -0x10, -0xa, -0x7a, 0x1a, -0x44, 0x1c, 0x6a, 0x43, -0x1b, -0x35, 0x7d, -0x2c,
-0x10, 0x5b, -0x42, -0x4f, 0x69, 0x1f, 0x1b, -0x64, -0x21, 0x19, -0x5d, 0x2e, -0x2a, -0x65, -0x13,
-0x70, -0x6e
};
const int8_t ofm0_kws [] =
{
-0x80, 0x7f, -0x80, -0x80, -0x80, -0x80, -0x80, -0x80, -0x80, -0x80, -0x80, -0x80
};
// First 640 samples from yes.wav.
std::vector<int16_t> testWav = std::vector<int16_t>
{
139, 143, 164, 163, 157, 156, 151, 148, 172, 171,
165, 169, 149, 142, 145, 147, 166, 146, 112, 132,
132, 136, 165, 176, 176, 152, 138, 158, 179, 185,
183, 148, 121, 130, 167, 204, 163, 132, 165, 184,
193, 205, 210, 204, 195, 178, 168, 197, 207, 201,
197, 177, 185, 196, 191, 198, 196, 183, 193, 181,
157, 170, 167, 159, 164, 152, 146, 167, 180, 171,
194, 232, 204, 173, 171, 172, 184, 169, 175, 199,
200, 195, 185, 214, 214, 193, 196, 191, 204, 191,
172, 187, 183, 192, 203, 172, 182, 228, 232, 205,
177, 174, 191, 210, 210, 211, 197, 177, 198, 217,
233, 236, 203, 191, 169, 145, 149, 161, 198, 206,
176, 137, 142, 181, 200, 215, 201, 188, 166, 162,
184, 155, 135, 132, 126, 142, 169, 184, 172, 156,
132, 119, 150, 147, 154, 160, 125, 130, 137, 154,
161, 168, 195, 182, 160, 134, 138, 146, 130, 120,
101, 122, 137, 118, 117, 131, 145, 140, 146, 148,
148, 168, 159, 134, 114, 114, 130, 147, 147, 134,
125, 98, 107, 127, 99, 79, 84, 107, 117, 114,
93, 92, 127, 112, 109, 110, 96, 118, 97, 87,
110, 95, 128, 153, 147, 165, 146, 106, 101, 137,
139, 96, 73, 90, 91, 51, 69, 102, 100, 103,
96, 101, 123, 107, 82, 89, 118, 127, 99, 100,
111, 97, 111, 123, 106, 121, 133, 103, 100, 88,
85, 111, 114, 125, 102, 91, 97, 84, 139, 157,
109, 66, 72, 129, 111, 90, 127, 126, 101, 109,
142, 138, 129, 159, 140, 80, 74, 78, 76, 98,
68, 42, 106, 143, 112, 102, 115, 114, 82, 75,
92, 80, 110, 114, 66, 86, 119, 101, 101, 103,
118, 145, 85, 40, 62, 88, 95, 87, 73, 64,
86, 71, 71, 105, 80, 73, 96, 92, 85, 90,
81, 86, 105, 100, 89, 78, 102, 114, 95, 98,
69, 70, 108, 112, 111, 90, 104, 137, 143, 160,
145, 121, 98, 86, 91, 87, 115, 123, 109, 99,
85, 120, 131, 116, 125, 144, 153, 111, 98, 110,
93, 89, 101, 137, 155, 142, 108, 94, 136, 145,
129, 129, 122, 109, 90, 76, 81, 110, 119, 96,
95, 102, 105, 111, 90, 89, 111, 115, 86, 51,
107, 140, 105, 105, 110, 142, 125, 76, 75, 69,
65, 52, 61, 69, 55, 42, 47, 58, 37, 35,
24, 20, 44, 22, 16, 26, 6, 3, 4, 23,
60, 51, 30, 12, 24, 31, -9, -16, -13, 13,
19, 9, 37, 55, 70, 36, 23, 57, 45, 33,
50, 59, 18, 11, 62, 74, 52, 8, -3, 26,
51, 48, -5, -9, 12, -7, -12, -5, 28, 41,
-2, -30, -13, 31, 33, -12, -22, -8, -15, -17,
2, -6, -25, -27, -24, -8, 4, -9, -52, -47,
-9, -32, -45, -5, 41, 15, -32, -14, 2, -1,
-10, -30, -32, -25, -21, -17, -14, 8, -4, -13,
34, 18, -36, -38, -18, -19, -28, -17, -14, -16,
-2, -20, -27, 12, 11, -17, -33, -12, -22, -64,
-42, -26, -23, -22, -37, -51, -53, -30, -18, -48,
-69, -38, -54, -96, -72, -49, -50, -57, -41, -22,
-43, -64, -54, -23, -49, -69, -41, -44, -42, -49,
-40, -26, -54, -50, -38, -49, -70, -94, -89, -69,
-56, -65, -71, -47, -39, -49, -79, -91, -56, -46,
-62, -86, -64, -32, -47, -50, -71, -77, -65, -68,
-52, -51, -61, -67, -61, -81, -93, -52, -59, -62,
-51, -75, -76, -50, -32, -54, -68, -70, -43, 1,
-42, -92, -80, -41, -38, -79, -69, -49, -82, -122,
-93, -21, -24, -61, -70, -73, -62, -74, -69, -43,
-25, -15, -43, -23, -26, -69, -44, -12, 1, -51,
-78, -13, 3, -53, -105, -72, -24, -62, -66, -31,
-40, -65, -86, -64, -44, -55, -63, -61, -37, -41,
};
// Golden audio ops mfcc output for the above wav.
const std::vector<float> testWavMfcc
{
-22.67135, -0.61615, 2.07233, 0.58137, 1.01655, 0.85816, 0.46039, 0.03393, 1.16511, 0.0072,
};
std::vector<float> testWavFloat(640);
constexpr float normaliser = 1.0/(1u<<15u);
std::transform(testWav.begin(), testWav.end(), testWavFloat.begin(),
std::bind1st(std::multiplies<float>(), normaliser));
const float DsCNNInputQuantizationScale = 1.107164;
const int DsCNNInputQuantizationOffset = 95;
std::map<int,std::string> labels =
{
{0,"silence"},
{1, "unknown"},
{ 2, "yes"},
{ 3,"no"},
{ 4, "up"},
{ 5, "down"},
{ 6, "left"},
{ 7, "right"},
{ 8, "on"},
{ 9, "off"},
{ 10, "stop"},
{11, "go"}
};
common::PipelineOptions options;
options.m_ModelFilePath = GetResourceFilePath("ds_cnn_clustered_int8.tflite");
options.m_ModelName = "DS_CNN_CLUSTERED_INT8";
options.m_backends = {"CpuAcc", "CpuRef"};
kws::IPipelinePtr kwsPipeline = kws::CreatePipeline(options);
CHECK(kwsPipeline->getInputSamplesSize() == 16000);
std::vector<int8_t> expectedWavMfcc;
for(auto& i : testWavMfcc)
{
expectedWavMfcc.push_back(
(i + DsCNNInputQuantizationScale * DsCNNInputQuantizationOffset) / DsCNNInputQuantizationScale);
}
SECTION("Pre-processing")
{
testWavFloat.resize(16000);
expectedWavMfcc.resize(49 * 10);
std::vector<int8_t> preprocessedData = kwsPipeline->PreProcessing(testWavFloat);
CHECK(preprocessedData.size() == expectedWavMfcc.size());
for(int i = 0; i < 10; ++i)
{
CHECK(expectedWavMfcc[i] == Approx(preprocessedData[i]).margin(1));
}
}
SECTION("Execute inference")
{
common::InferenceResults<int8_t> result;
std::vector<int8_t> IFM(std::begin(ifm0_kws), std::end(ifm0_kws));
kwsPipeline->Inference(IFM, result);
std::vector<int8_t> OFM(std::begin(ofm0_kws), std::end(ofm0_kws));
CHECK(1 == result.size());
CHECK(OFM.size() == result[0].size());
int count = 0;
for (auto& i : result)
{
for (signed char& j : i)
{
CHECK(j == OFM[count++]);
}
}
}
SECTION("Convert inference result to keyword")
{
std::vector< std::vector< int8_t >> modelOutput = {{1, 4, 2, 3, 1, 1, 3, 1, 43, 1, 6, 1}};
kwsPipeline->PostProcessing(modelOutput, labels,
[](int index, std::string& label, float prob) -> void {
CHECK(index == 8);
CHECK(label == "on");
});
}
}