blob: edc89286a21ea0ba87c3af247f4e89b69596dc63 [file] [log] [blame]
Georgios Pinitas7c3b9242018-06-21 19:01:25 +01001/*
2 * Copyright (c) 2018 ARM Limited.
3 *
4 * SPDX-License-Identifier: MIT
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to
8 * deal in the Software without restriction, including without limitation the
9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10 * sell copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 */
24#ifndef __UTILS_IMAGE_LOADER_H__
25#define __UTILS_IMAGE_LOADER_H__
26
27#include "arm_compute/core/Error.h"
28#include "arm_compute/core/ITensor.h"
29#include "arm_compute/core/TensorInfo.h"
30#include "arm_compute/core/Types.h"
31
32#include "utils/Utils.h"
33
34#pragma GCC diagnostic push
35#pragma GCC diagnostic ignored "-Wswitch-default"
36#define STB_IMAGE_IMPLEMENTATION
37#include "stb/stb_image.h"
38#pragma GCC diagnostic pop
39
40#include <cstdlib>
41#include <memory>
42#include <string>
43
44namespace arm_compute
45{
46namespace utils
47{
48/** Image feeder interface */
49class IImageDataFeeder
50{
51public:
52 /** Virtual base destructor */
53 virtual ~IImageDataFeeder() = default;
54 /** Gets a character from an image feed */
55 virtual uint8_t get() = 0;
56 /** Feed a whole row to a destination pointer
57 *
58 * @param[out] dst Destination pointer
59 * @param[in] row_size Row size in terms of bytes
60 */
61 virtual void get_row(uint8_t *dst, size_t row_size) = 0;
62};
63/** File Image feeder concrete implementation */
64class FileImageFeeder : public IImageDataFeeder
65{
66public:
67 /** Default constructor
68 *
69 * @param[in] fs Image file stream
70 */
71 FileImageFeeder(std::ifstream &fs)
72 : _fs(fs)
73 {
74 }
75 // Inherited overridden methods
76 uint8_t get() override
77 {
78 return _fs.get();
79 }
80 void get_row(uint8_t *dst, size_t row_size) override
81 {
82 ARM_COMPUTE_ERROR_ON(dst == nullptr);
83 _fs.read(reinterpret_cast<std::fstream::char_type *>(dst), row_size);
84 }
85
86private:
87 std::ifstream &_fs;
88};
89/** Memory Image feeder concrete implementation */
90class MemoryImageFeeder : public IImageDataFeeder
91{
92public:
93 /** Default constructor
94 *
95 * @param[in] data Pointer to data
96 */
97 MemoryImageFeeder(const uint8_t *data)
98 : _data(data)
99 {
100 }
101 /** Prevent instances of this class from being copied (As this class contains pointers) */
102 MemoryImageFeeder(const MemoryImageFeeder &) = delete;
103 /** Default move constructor */
104 MemoryImageFeeder(MemoryImageFeeder &&) = default;
105 /** Prevent instances of this class from being copied (As this class contains pointers) */
106 MemoryImageFeeder &operator=(const MemoryImageFeeder &) = delete;
107 /** Default move assignment operator */
108 MemoryImageFeeder &operator=(MemoryImageFeeder &&) = default;
109 // Inherited overridden methods
110 uint8_t get() override
111 {
112 return *_data++;
113 }
114 void get_row(uint8_t *dst, size_t row_size) override
115 {
116 ARM_COMPUTE_ERROR_ON(dst == nullptr);
117 memcpy(dst, _data, row_size);
118 _data += row_size;
119 }
120
121private:
122 const uint8_t *_data;
123};
124
125/** Image loader interface */
126class IImageLoader
127{
128public:
129 /** Default Constructor */
130 IImageLoader()
131 : _feeder(nullptr), _width(0), _height(0)
132 {
133 }
134 /** Virtual base destructor */
135 virtual ~IImageLoader() = default;
136 /** Return the width of the currently open image file. */
137 unsigned int width() const
138 {
139 return _width;
140 }
141 /** Return the height of the currently open image file. */
142 unsigned int height() const
143 {
144 return _height;
145 }
146 /** Return true if the image file is currently open */
147 virtual bool is_open() = 0;
148 /** Open an image file and reads its metadata (Width, height)
149 *
150 * @param[in] filename File to open
151 */
152 virtual void open(const std::string &filename) = 0;
153 /** Closes an image file */
154 virtual void close() = 0;
155 /** Initialise an image's metadata with the dimensions of the image file currently open
156 *
157 * @param[out] image Image to initialise
158 * @param[in] format Format to use for the image (Must be RGB888 or U8)
159 */
160 template <typename T>
161 void init_image(T &image, Format format)
162 {
163 ARM_COMPUTE_ERROR_ON(!is_open());
164 ARM_COMPUTE_ERROR_ON(format != Format::RGB888 && format != Format::U8);
165
166 // Use the size of the input image
167 TensorInfo image_info(_width, _height, format);
168 image.allocator()->init(image_info);
169 }
170 /** Fill an image with the content of the currently open image file.
171 *
172 * @note If the image is a CLImage, the function maps and unmaps the image
173 *
174 * @param[in,out] image Image to fill (Must be allocated, and of matching dimensions with the opened image file).
175 */
176 template <typename T>
177 void fill_image(T &image)
178 {
179 ARM_COMPUTE_ERROR_ON(!is_open());
180 ARM_COMPUTE_ERROR_ON(image.info()->dimension(0) != _width || image.info()->dimension(1) != _height);
181 ARM_COMPUTE_ERROR_ON_FORMAT_NOT_IN(&image, Format::U8, Format::RGB888);
182 ARM_COMPUTE_ERROR_ON(_feeder.get() == nullptr);
183 try
184 {
185 // Map buffer if creating a CLTensor/GCTensor
186 map(image, true);
187
188 // Validate feeding data
189 validate_info(image.info());
190
191 switch(image.info()->format())
192 {
193 case Format::U8:
194 {
195 // We need to convert the data from RGB to grayscale:
196 // Iterate through every pixel of the image
197 Window window;
198 window.set(Window::DimX, Window::Dimension(0, _width, 1));
199 window.set(Window::DimY, Window::Dimension(0, _height, 1));
200
201 Iterator out(&image, window);
202
203 unsigned char red = 0;
204 unsigned char green = 0;
205 unsigned char blue = 0;
206
207 execute_window_loop(window, [&](const Coordinates & id)
208 {
209 red = _feeder->get();
210 green = _feeder->get();
211 blue = _feeder->get();
212
213 *out.ptr() = 0.2126f * red + 0.7152f * green + 0.0722f * blue;
214 },
215 out);
216
217 break;
218 }
219 case Format::RGB888:
220 {
221 // There is no format conversion needed: we can simply copy the content of the input file to the image one row at the time.
222 // Create a vertical window to iterate through the image's rows:
223 Window window;
224 window.set(Window::DimY, Window::Dimension(0, _height, 1));
225
226 Iterator out(&image, window);
227 size_t row_size = _width * image.info()->element_size();
228
229 execute_window_loop(window, [&](const Coordinates & id)
230 {
231 _feeder->get_row(out.ptr(), row_size);
232 },
233 out);
234
235 break;
236 }
237 default:
238 ARM_COMPUTE_ERROR("Unsupported format");
239 }
240
241 // Unmap buffer if creating a CLTensor/GCTensor
242 unmap(image);
243 }
244 catch(const std::ifstream::failure &e)
245 {
246 ARM_COMPUTE_ERROR("Loading image file: %s", e.what());
247 }
248 }
249 /** Fill a tensor with 3 planes (one for each channel) with the content of the currently open image file.
250 *
251 * @note If the image is a CLImage, the function maps and unmaps the image
252 *
253 * @param[in,out] tensor Tensor with 3 planes to fill (Must be allocated, and of matching dimensions with the opened image). Data types supported: U8/F32
254 * @param[in] bgr (Optional) Fill the first plane with blue channel (default = false)
255 */
256 template <typename T>
257 void fill_planar_tensor(T &tensor, bool bgr = false)
258 {
259 ARM_COMPUTE_ERROR_ON(!is_open());
260 ARM_COMPUTE_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(&tensor, 1, DataType::U8, DataType::F32);
261
262 const DataLayout data_layout = tensor.info()->data_layout();
263 const TensorShape tensor_shape = tensor.info()->tensor_shape();
264
265 ARM_COMPUTE_UNUSED(tensor_shape);
266 ARM_COMPUTE_ERROR_ON(tensor_shape[get_data_layout_dimension_index(data_layout, DataLayoutDimension::WIDTH)] != _width);
267 ARM_COMPUTE_ERROR_ON(tensor_shape[get_data_layout_dimension_index(data_layout, DataLayoutDimension::HEIGHT)] != _height);
268 ARM_COMPUTE_ERROR_ON(tensor_shape[get_data_layout_dimension_index(data_layout, DataLayoutDimension::CHANNEL)] != 3);
269
270 ARM_COMPUTE_ERROR_ON(_feeder.get() == nullptr);
271
272 try
273 {
274 // Map buffer if creating a CLTensor
275 map(tensor, true);
276
277 // Validate feeding data
278 validate_info(tensor.info());
279
280 // Stride across channels
281 size_t stride_z = 0;
282
283 // Iterate through every pixel of the image
284 Window window;
285 if(data_layout == DataLayout::NCHW)
286 {
287 window.set(Window::DimX, Window::Dimension(0, _width, 1));
288 window.set(Window::DimY, Window::Dimension(0, _height, 1));
289 window.set(Window::DimZ, Window::Dimension(0, 1, 1));
290 stride_z = tensor.info()->strides_in_bytes()[2];
291 }
292 else
293 {
294 window.set(Window::DimX, Window::Dimension(0, 1, 1));
295 window.set(Window::DimY, Window::Dimension(0, _width, 1));
296 window.set(Window::DimZ, Window::Dimension(0, _height, 1));
297 stride_z = tensor.info()->strides_in_bytes()[0];
298 }
299
300 Iterator out(&tensor, window);
301
302 unsigned char red = 0;
303 unsigned char green = 0;
304 unsigned char blue = 0;
305
306 execute_window_loop(window, [&](const Coordinates & id)
307 {
308 red = _feeder->get();
309 green = _feeder->get();
310 blue = _feeder->get();
311
312 switch(tensor.info()->data_type())
313 {
314 case DataType::U8:
315 {
316 *(out.ptr() + 0 * stride_z) = bgr ? blue : red;
317 *(out.ptr() + 1 * stride_z) = green;
318 *(out.ptr() + 2 * stride_z) = bgr ? red : blue;
319 break;
320 }
321 case DataType::F32:
322 {
323 *reinterpret_cast<float *>(out.ptr() + 0 * stride_z) = static_cast<float>(bgr ? blue : red);
324 *reinterpret_cast<float *>(out.ptr() + 1 * stride_z) = static_cast<float>(green);
325 *reinterpret_cast<float *>(out.ptr() + 2 * stride_z) = static_cast<float>(bgr ? red : blue);
326 break;
327 }
328 default:
329 {
330 ARM_COMPUTE_ERROR("Unsupported data type");
331 }
332 }
333 },
334 out);
335
336 // Unmap buffer if creating a CLTensor
337 unmap(tensor);
338 }
339 catch(const std::ifstream::failure &e)
340 {
341 ARM_COMPUTE_ERROR("Loading image file: %s", e.what());
342 }
343 }
344
345protected:
346 /** Validate metadata */
347 virtual void validate_info(const ITensorInfo *tensor_info)
348 {
349 }
350
351protected:
352 std::unique_ptr<IImageDataFeeder> _feeder;
353 unsigned int _width;
354 unsigned int _height;
355};
356
357/** PPM Image loader concrete implementation */
358class PPMLoader : public IImageLoader
359{
360public:
361 /** Default Constructor */
362 PPMLoader()
363 : IImageLoader(), _fs()
364 {
365 }
366
367 // Inherited methods overridden:
368 bool is_open() override
369 {
370 return _fs.is_open();
371 }
372 void open(const std::string &filename) override
373 {
374 ARM_COMPUTE_ERROR_ON(is_open());
375 try
376 {
377 _fs.exceptions(std::ifstream::failbit | std::ifstream::badbit);
378 _fs.open(filename, std::ios::in | std::ios::binary);
379
380 unsigned int max_val = 0;
381 std::tie(_width, _height, max_val) = parse_ppm_header(_fs);
382
383 ARM_COMPUTE_ERROR_ON_MSG(max_val >= 256, "2 bytes per colour channel not supported in file %s",
384 filename.c_str());
385
386 _feeder = support::cpp14::make_unique<FileImageFeeder>(_fs);
387 }
388 catch(std::runtime_error &e)
389 {
390 ARM_COMPUTE_ERROR("Accessing %s: %s", filename.c_str(), e.what());
391 }
392 }
393 void close() override
394 {
395 if(is_open())
396 {
397 _fs.close();
398 _feeder = nullptr;
399 }
400 ARM_COMPUTE_ERROR_ON(is_open());
401 }
402
403protected:
404 // Inherited methods overridden:
405 void validate_info(const ITensorInfo *tensor_info) override
406 {
407 // Check if the file is large enough to fill the image
408 const size_t current_position = _fs.tellg();
409 _fs.seekg(0, std::ios_base::end);
410 const size_t end_position = _fs.tellg();
411 _fs.seekg(current_position, std::ios_base::beg);
412
413 ARM_COMPUTE_ERROR_ON_MSG((end_position - current_position) < tensor_info->tensor_shape().total_size(),
414 "Not enough data in file");
415 ARM_COMPUTE_UNUSED(end_position);
416 }
417
418private:
419 std::ifstream _fs;
420};
421
422/** Class to load the content of a JPEG file into an Image */
423class JPEGLoader : public IImageLoader
424{
425private:
426 /** Custom malloc deleter struct */
427 struct malloc_deleter
428 {
429 void operator()(uint8_t *p) const
430 {
431 free(p);
432 }
433 };
434
435public:
436 /** Default Constructor */
437 JPEGLoader()
438 : IImageLoader(), _is_loaded(false), _data(nullptr)
439 {
440 }
441
442 // Inherited methods overridden:
443 bool is_open() override
444 {
445 return _is_loaded;
446 }
447 void open(const std::string &filename) override
448 {
449 int bpp, width, height;
450 uint8_t *rgb_image = stbi_load(filename.c_str(), &width, &height, &bpp, 3);
451 if(rgb_image == NULL)
452 {
453 ARM_COMPUTE_ERROR("Accessing %s failed", filename.c_str());
454 }
455 else
456 {
457 _width = width;
458 _height = height;
459 _data = std::unique_ptr<uint8_t, malloc_deleter>(rgb_image);
460 _is_loaded = true;
461 _feeder = support::cpp14::make_unique<MemoryImageFeeder>(_data.get());
462 }
463 }
464 void close() override
465 {
466 if(is_open())
467 {
468 _width = 0;
469 _height = 0;
470 release();
471 }
472 ARM_COMPUTE_ERROR_ON(is_open());
473 }
474 /** Explicitly Releases the memory of the loaded data */
475 void release()
476 {
477 if(_is_loaded)
478 {
479 _data.reset();
480 _is_loaded = false;
481 _feeder = nullptr;
482 }
483 }
484
485private:
486 bool _is_loaded;
487 std::unique_ptr<uint8_t, malloc_deleter> _data;
488};
489} // namespace utils
490} // namespace arm_compute
491#endif /* __UTILS_IMAGE_LOADER_H__*/