blob: c1c5f635b6dd28c15f9b064cf686fc297db0a7f2 [file] [log] [blame]
telsoa014fcda012018-03-09 14:13:49 +00001//
2// Copyright © 2017 Arm Ltd. All rights reserved.
David Beckecb56cd2018-09-05 12:52:57 +01003// SPDX-License-Identifier: MIT
telsoa014fcda012018-03-09 14:13:49 +00004//
5#include "MnistDatabase.hpp"
6
Derek Lamberti08446972019-11-26 16:38:31 +00007#include <armnn/Logging.hpp>
8
telsoa014fcda012018-03-09 14:13:49 +00009#include <boost/numeric/conversion/cast.hpp>
Narumol Prangnawaratac2770a2020-04-01 16:51:23 +010010
telsoa014fcda012018-03-09 14:13:49 +000011#include <fstream>
12#include <vector>
13
14constexpr int g_kMnistImageByteSize = 28 * 28;
15
16void EndianSwap(unsigned int &x)
17{
18 x = (x >> 24) | ((x << 8) & 0x00FF0000) | ((x >> 8) & 0x0000FF00) | (x << 24);
19}
20
21MnistDatabase::MnistDatabase(const std::string& binaryFileDirectory, bool scaleValues)
22 : m_BinaryDirectory(binaryFileDirectory)
23 , m_ScaleValues(scaleValues)
24{
25}
26
27std::unique_ptr<MnistDatabase::TTestCaseData> MnistDatabase::GetTestCaseData(unsigned int testCaseId)
28{
29 std::vector<unsigned char> I(g_kMnistImageByteSize);
30 unsigned int label = 0;
31
32 std::string imagePath = m_BinaryDirectory + std::string("t10k-images.idx3-ubyte");
33 std::string labelPath = m_BinaryDirectory + std::string("t10k-labels.idx1-ubyte");
34
35 std::ifstream imageStream(imagePath, std::ios::binary);
36 std::ifstream labelStream(labelPath, std::ios::binary);
37
38 if (!imageStream.is_open())
39 {
Derek Lamberti08446972019-11-26 16:38:31 +000040 ARMNN_LOG(fatal) << "Failed to load " << imagePath;
telsoa014fcda012018-03-09 14:13:49 +000041 return nullptr;
42 }
43 if (!labelStream.is_open())
44 {
Derek Lamberti08446972019-11-26 16:38:31 +000045 ARMNN_LOG(fatal) << "Failed to load " << imagePath;
telsoa014fcda012018-03-09 14:13:49 +000046 return nullptr;
47 }
48
49 unsigned int magic, num, row, col;
50
telsoa01c577f2c2018-08-31 09:22:23 +010051 // Checks the files have the correct header.
telsoa014fcda012018-03-09 14:13:49 +000052 imageStream.read(reinterpret_cast<char*>(&magic), sizeof(magic));
53 if (magic != 0x03080000)
54 {
Derek Lamberti08446972019-11-26 16:38:31 +000055 ARMNN_LOG(fatal) << "Failed to read " << imagePath;
telsoa014fcda012018-03-09 14:13:49 +000056 return nullptr;
57 }
58 labelStream.read(reinterpret_cast<char*>(&magic), sizeof(magic));
59 if (magic != 0x01080000)
60 {
Derek Lamberti08446972019-11-26 16:38:31 +000061 ARMNN_LOG(fatal) << "Failed to read " << labelPath;
telsoa014fcda012018-03-09 14:13:49 +000062 return nullptr;
63 }
64
telsoa01c577f2c2018-08-31 09:22:23 +010065 // Endian swaps the image and label file - all the integers in the files are stored in MSB first(high endian)
66 // format, hence it needs to flip the bytes of the header if using it on Intel processors or low-endian machines
telsoa014fcda012018-03-09 14:13:49 +000067 labelStream.read(reinterpret_cast<char*>(&num), sizeof(num));
68 imageStream.read(reinterpret_cast<char*>(&num), sizeof(num));
69 EndianSwap(num);
70 imageStream.read(reinterpret_cast<char*>(&row), sizeof(row));
71 EndianSwap(row);
72 imageStream.read(reinterpret_cast<char*>(&col), sizeof(col));
73 EndianSwap(col);
74
telsoa01c577f2c2018-08-31 09:22:23 +010075 // Reads image and label into memory.
telsoa014fcda012018-03-09 14:13:49 +000076 imageStream.seekg(testCaseId * g_kMnistImageByteSize, std::ios_base::cur);
77 imageStream.read(reinterpret_cast<char*>(&I[0]), g_kMnistImageByteSize);
78 labelStream.seekg(testCaseId, std::ios_base::cur);
79 labelStream.read(reinterpret_cast<char*>(&label), 1);
80
81 if (!imageStream.good())
82 {
Derek Lamberti08446972019-11-26 16:38:31 +000083 ARMNN_LOG(fatal) << "Failed to read " << imagePath;
telsoa014fcda012018-03-09 14:13:49 +000084 return nullptr;
85 }
86 if (!labelStream.good())
87 {
Derek Lamberti08446972019-11-26 16:38:31 +000088 ARMNN_LOG(fatal) << "Failed to read " << labelPath;
telsoa014fcda012018-03-09 14:13:49 +000089 return nullptr;
90 }
91
92 std::vector<float> inputImageData;
93 inputImageData.resize(g_kMnistImageByteSize);
94
95 for (unsigned int i = 0; i < col * row; ++i)
96 {
97 inputImageData[i] = boost::numeric_cast<float>(I[i]);
98
99 if(m_ScaleValues)
100 {
101 inputImageData[i] /= 255.0f;
102 }
103 }
104
105 return std::make_unique<TTestCaseData>(label, std::move(inputImageData));
106}