blob: 4c84c674fc8faf27dc5b3c556fe350b85dff1671 [file] [log] [blame]
Anthony Barbier7068f992017-10-26 15:23:08 +01001/*
Joel Liangabd03cf2018-01-08 15:20:48 +08002 * Copyright (c) 2017, 2018 ARM Limited.
Anthony Barbier7068f992017-10-26 15:23:08 +01003 *
4 * SPDX-License-Identifier: MIT
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to
8 * deal in the Software without restriction, including without limitation the
9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10 * sell copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 */
24#include "arm_compute/core/GLES_COMPUTE/GCKernelLibrary.h"
25
26#include "arm_compute/core/Error.h"
27#include "arm_compute/core/Utils.h"
28
29#include <fstream>
30#include <iomanip>
31#include <iostream>
32#include <regex>
33#include <utility>
34#include <vector>
35
36using namespace arm_compute;
37
38GCProgram::GCProgram()
39 : _name(), _source()
40{
41}
42
43GCProgram::GCProgram(std::string name, std::string source)
44 : _name(std::move(name)), _source(std::move(source))
45{
46}
47
48GLuint GCProgram::link_program(GLuint shader)
49{
50 GLuint program = ARM_COMPUTE_GL_CHECK(glCreateProgram());
51
52 GLint rvalue;
53 GLsizei length;
54
55 ARM_COMPUTE_GL_CHECK(glAttachShader(program, shader));
56 ARM_COMPUTE_GL_CHECK(glLinkProgram(program));
57 ARM_COMPUTE_GL_CHECK(glDetachShader(program, shader));
58 ARM_COMPUTE_GL_CHECK(glDeleteShader(shader));
59
60 // Check if there were some issues when linking the shader.
61 ARM_COMPUTE_GL_CHECK(glGetProgramiv(program, GL_LINK_STATUS, &rvalue));
62
63 if(rvalue == 0)
64 {
65 ARM_COMPUTE_GL_CHECK(glGetProgramiv(program, GL_INFO_LOG_LENGTH, &length));
66
67 std::vector<GLchar> log(length);
68 ARM_COMPUTE_GL_CHECK(glGetProgramInfoLog(program, length, nullptr, log.data()));
69 ARM_COMPUTE_ERROR("Error: Linker log:\n%s\n", log.data());
70
71 return 0;
72 }
73
74 ARM_COMPUTE_GL_CHECK(glUseProgram(program));
75
76 return program;
77}
78
79GLuint GCProgram::compile_shader(const std::string &build_options)
80{
81 GLuint shader = ARM_COMPUTE_GL_CHECK(glCreateShader(GL_COMPUTE_SHADER));
82
83 const char *src[]
84 {
85 "#version 310 es\n",
86 build_options.c_str(),
87 _source.c_str()
88 };
89
90 ARM_COMPUTE_GL_CHECK(glShaderSource(shader, sizeof(src) / sizeof(src[0]), src, nullptr));
91
92 ARM_COMPUTE_GL_CHECK(glCompileShader(shader));
93
94 // Check if there were any issues when compiling the shader
95 GLint rvalue;
96 GLsizei length;
97
98 ARM_COMPUTE_GL_CHECK(glGetShaderiv(shader, GL_COMPILE_STATUS, &rvalue));
99
100 if(rvalue == 0)
101 {
102 ARM_COMPUTE_GL_CHECK(glGetShaderiv(shader, GL_INFO_LOG_LENGTH, &length));
103
104 std::vector<GLchar> log(length);
105 ARM_COMPUTE_GL_CHECK(glGetShaderInfoLog(shader, length, nullptr, log.data()));
106
107#ifdef ARM_COMPUTE_DEBUG_ENABLED
108 std::istringstream ss(_source);
109 std::stringstream output_stream;
110 std::string line;
111 size_t line_num = 1;
112
113 ARM_COMPUTE_LOG_INFO_MSG_WITH_FORMAT_CORE("GLES Shader build options:\n%s\n", build_options.c_str());
114 while(std::getline(ss, line, '\n'))
115 {
116 output_stream << std::setw(6) << line_num << ": " << line << std::endl;
117 line_num++;
118 }
Joel Liangf1f3ebd2017-11-10 09:59:19 +0800119 ARM_COMPUTE_LOG_INFO_STREAM_CORE("GLES Shader source code:\n"
120 << output_stream.rdbuf());
Anthony Barbier7068f992017-10-26 15:23:08 +0100121#endif /* ARM_COMPUTE_DEBUG_ENABLED */
122
123 ARM_COMPUTE_ERROR("Error: Compiler log:\n%s\n", log.data());
124
125 return 0;
126 }
127
128 return shader;
129}
130
131GCKernel::GCKernel()
Joel Liangf1f3ebd2017-11-10 09:59:19 +0800132 : _name(), _program(), _shader_arguments(), _shader_params_ubo_name(), _shader_params_binding_point(), _shader_params_index(), _shader_params_size()
Anthony Barbier7068f992017-10-26 15:23:08 +0100133{
134}
135
Joel Liang5542ba82017-12-01 15:33:41 +0800136// Add a default destructor in cpp file to workaround the free unallocated value issue on Android
137GCKernel::~GCKernel() // NOLINT
138{
139}
140
Anthony Barbier7068f992017-10-26 15:23:08 +0100141GCKernel::GCKernel(std::string name, GLuint program)
142 : _name(std::move(name)),
143 _program(program),
Joel Liangf1f3ebd2017-11-10 09:59:19 +0800144 _shader_arguments(),
145 _shader_params_ubo_name(0),
Anthony Barbier7068f992017-10-26 15:23:08 +0100146 _shader_params_binding_point(0),
147 _shader_params_index(0),
148 _shader_params_size(0)
149{
Joel Liangf1f3ebd2017-11-10 09:59:19 +0800150 _shader_arguments.clear();
Anthony Barbier7068f992017-10-26 15:23:08 +0100151
Joel Liangf1f3ebd2017-11-10 09:59:19 +0800152 ARM_COMPUTE_GL_CHECK(glGenBuffers(1, &_shader_params_ubo_name));
Anthony Barbier7068f992017-10-26 15:23:08 +0100153
154 _shader_params_index = ARM_COMPUTE_GL_CHECK(glGetUniformBlockIndex(_program, _shader_params_name));
155 ARM_COMPUTE_ERROR_ON_MSG((_shader_params_index == GL_INVALID_INDEX), "Failed to get index of %s", _shader_params_name);
156 ARM_COMPUTE_GL_CHECK(glGetActiveUniformBlockiv(_program, _shader_params_index, GL_UNIFORM_BLOCK_DATA_SIZE, &_shader_params_size));
157 ARM_COMPUTE_ERROR_ON_MSG((_shader_params_size == 0), "Failed to get size of %s", _shader_params_name);
158}
159
160void GCKernel::cleanup()
161{
Joel Liangf1f3ebd2017-11-10 09:59:19 +0800162 ARM_COMPUTE_GL_CHECK(glDeleteBuffers(1, &_shader_params_ubo_name));
Anthony Barbier7068f992017-10-26 15:23:08 +0100163 ARM_COMPUTE_GL_CHECK(glBindBuffer(GL_UNIFORM_BUFFER, 0));
164 ARM_COMPUTE_GL_CHECK(glDeleteProgram(_program));
165 ARM_COMPUTE_GL_CHECK(glUseProgram(0));
166}
167
168void GCKernel::use()
169{
170 ARM_COMPUTE_GL_CHECK(glUseProgram(_program));
171}
172
173void GCKernel::unuse()
174{
175 ARM_COMPUTE_GL_CHECK(glUseProgram(0));
176}
177
178void GCKernel::update_shader_params()
179{
Joel Liangf1f3ebd2017-11-10 09:59:19 +0800180 ARM_COMPUTE_ERROR_ON_MSG((_shader_params_size != (int)(_shader_arguments.size() * sizeof(_shader_arguments[0]))), "Arguments size (%d) is not equal to shader params block size (%d)",
181 _shader_arguments.size() * sizeof(_shader_arguments[0]), _shader_params_size);
Anthony Barbier7068f992017-10-26 15:23:08 +0100182
183 ARM_COMPUTE_GL_CHECK(glUniformBlockBinding(_program, _shader_params_index, _shader_params_binding_point));
Joel Liangf1f3ebd2017-11-10 09:59:19 +0800184 ARM_COMPUTE_GL_CHECK(glBindBufferBase(GL_UNIFORM_BUFFER, _shader_params_binding_point, _shader_params_ubo_name));
185 ARM_COMPUTE_GL_CHECK(glBindBuffer(GL_UNIFORM_BUFFER, _shader_params_ubo_name));
186 ARM_COMPUTE_GL_CHECK(glBufferData(GL_UNIFORM_BUFFER, _shader_params_size, _shader_arguments.data(), GL_DYNAMIC_DRAW));
Anthony Barbier7068f992017-10-26 15:23:08 +0100187 ARM_COMPUTE_GL_CHECK(glBindBuffer(GL_UNIFORM_BUFFER, 0));
188}
189
190const std::map<std::string, std::string> GCKernelLibrary::_shader_program_map =
191{
192 { "absdiff", "absdiff.cs" },
193 { "col2im", "convolution_layer.cs" },
194 { "direct_convolution1x1", "direct_convolution1x1.cs" },
195 { "direct_convolution3x3", "direct_convolution3x3.cs" },
196 { "direct_convolution5x5", "direct_convolution5x5.cs" },
197 { "pooling_layer_2", "pooling_layer.cs" },
198 { "pooling_layer_3", "pooling_layer.cs" },
199 { "pooling_layer_7", "pooling_layer.cs" },
200 { "pooling_layer_3_optimized", "pooling_layer.cs" },
201 { "pooling_layer_n", "pooling_layer.cs" },
202 { "fill_image_borders_replicate", "fill_border.cs" },
203 { "fill_image_borders_constant", "fill_border.cs" },
204 { "gemm_accumulate_biases", "gemm.cs" },
205 { "gemm_interleave4x4", "gemm.cs" },
206 { "gemm_ma", "gemm.cs" },
207 { "gemm_mm_interleaved_transposed", "gemm.cs" },
208 { "gemm_mm_floating_point", "gemm.cs" },
209 { "gemm_transpose1x4", "gemm.cs" },
210 { "im2col_kernel3x3_padx0_pady0", "convolution_layer.cs" },
211 { "im2col_generic", "convolution_layer.cs" },
212 { "im2col_reduced", "convolution_layer.cs" },
213 { "transpose", "transpose.cs" },
214 { "activation_layer", "activation_layer.cs" },
215 { "softmax_layer_max", "softmax_layer.cs" },
216 { "softmax_layer_shift_exp_sum", "softmax_layer.cs" },
217 { "softmax_layer_norm", "softmax_layer.cs" },
218 { "pixelwise_mul_float", "pixelwise_mul_float.cs" },
219 { "normalization_layer", "normalization_layer.cs" },
220 { "batchnormalization_layer", "batchnormalization_layer.cs" },
221 { "concatenate_depth", "concatenate.cs" },
222 { "dropout", "dropout.cs" },
zhenglin0fb6cf52017-12-12 15:56:09 +0800223 { "normalize_planar_yuv_layer", "normalize_planar_yuv_layer.cs" },
Frank Lei57a150a2017-12-19 10:14:57 +0800224 { "scale_nearest_neighbour", "scale.cs" },
zhenglin926d5e12017-12-21 15:36:50 +0800225 { "arithmetic_add", "arithmetic_add.cs" },
Frank Lei8cdfdb82018-01-02 16:49:33 +0800226 { "depthwise_convolution_3x3", "depthwise_convolution3x3.cs" },
Anthony Barbier7068f992017-10-26 15:23:08 +0100227};
228
229const std::map<std::string, std::string> GCKernelLibrary::_program_source_map =
230{
231#ifdef EMBEDDED_KERNELS
232 {
233 "absdiff.cs",
234#include "./cs_shaders/absdiff.csembed"
235 },
236 {
237 "convolution_layer.cs",
238#include "./cs_shaders/convolution_layer.csembed"
239 },
240 {
241 "direct_convolution1x1.cs",
242#include "./cs_shaders/direct_convolution1x1.csembed"
243 },
244 {
245 "direct_convolution3x3.cs",
246#include "./cs_shaders/direct_convolution3x3.csembed"
247 },
248 {
249 "direct_convolution5x5.cs",
250#include "./cs_shaders/direct_convolution5x5.csembed"
251 },
252 {
253 "pooling_layer.cs",
254#include "./cs_shaders/pooling_layer.csembed"
255 },
256 {
257 "fill_border.cs",
258#include "./cs_shaders/fill_border.csembed"
259 },
260 {
261 "gemm.cs",
262#include "./cs_shaders/gemm.csembed"
263 },
264 {
265 "transpose.cs",
266#include "./cs_shaders/transpose.csembed"
267 },
268 {
269 "activation_layer.cs",
270#include "./cs_shaders/activation_layer.csembed"
271 },
272 {
273 "softmax_layer.cs",
274#include "./cs_shaders/softmax_layer.csembed"
275 },
276 {
277 "pixelwise_mul_float.cs",
278#include "./cs_shaders/pixelwise_mul_float.csembed"
279 },
280 {
281 "normalization_layer.cs",
282#include "./cs_shaders/normalization_layer.csembed"
283 },
284 {
285 "batchnormalization_layer.cs",
286#include "./cs_shaders/batchnormalization_layer.csembed"
287 },
288 {
289 "concatenate.cs",
290#include "./cs_shaders/concatenate.csembed"
291 },
292 {
293 "dropout.cs",
294#include "./cs_shaders/dropout.csembed"
295 },
zhenglin0fb6cf52017-12-12 15:56:09 +0800296 {
297 "normalize_planar_yuv_layer.cs",
298#include "./cs_shaders/normalize_planar_yuv_layer.csembed"
299 },
Frank Lei57a150a2017-12-19 10:14:57 +0800300 {
301 "scale.cs",
302#include "./cs_shaders/scale.csembed"
303 },
zhenglin926d5e12017-12-21 15:36:50 +0800304 {
305 "arithmetic_add.cs",
306#include "./cs_shaders/arithmetic_add.csembed"
307 },
Frank Lei8cdfdb82018-01-02 16:49:33 +0800308 {
309 "depthwise_convolution3x3.cs",
310#include "./cs_shaders/depthwise_convolution3x3.csembed"
311 },
Anthony Barbier7068f992017-10-26 15:23:08 +0100312#endif /* EMBEDDED_KERNELS */
313};
314
315GCKernelLibrary::GCKernelLibrary()
Ioan-Cristian Szabo77eb21f2017-12-22 17:32:17 +0000316 : _display(EGL_NO_DISPLAY), _context(EGL_NO_CONTEXT), _frame_buffer(0), _tex_rt(0), _shader_path("./"), _programs_map(), _built_programs_map()
Anthony Barbier7068f992017-10-26 15:23:08 +0100317{
318}
319
320GCKernelLibrary &GCKernelLibrary::get()
321{
322 static GCKernelLibrary _kernel_library;
323 return _kernel_library;
324}
325
326GCKernel GCKernelLibrary::create_kernel(const std::string &shader_name, const StringSet &build_options_set) const
327{
328 // Find which program contains the kernel
329 auto shader_program_it = _shader_program_map.find(shader_name);
330
331 if(_shader_program_map.end() == shader_program_it)
332 {
333 ARM_COMPUTE_ERROR("Shader %s not found in the GCKernelLibrary", shader_name.c_str());
334 }
335
336 // Check if the program has been built before with same build options.
337 const std::string program_name = shader_program_it->second;
338 const std::string build_options = stringify_set(build_options_set);
339 const std::string built_program_name = program_name + "_" + build_options;
340 auto built_program_it = _built_programs_map.find(built_program_name);
341
342 GCKernel kernel;
343
344 if(_built_programs_map.end() != built_program_it)
345 {
346 // If program has been built, retrieve to create kernel from it
347 kernel = built_program_it->second;
Anthony Barbier7068f992017-10-26 15:23:08 +0100348 }
349 else
350 {
351 GCProgram program = load_program(program_name);
352
353 std::string source_name = _shader_path + shader_program_it->second;
354
355 // load shader
356 GLuint shader = program.compile_shader(build_options);
357
358 // Build program
359 GLuint gles_program = program.link_program(shader);
360
361 // Create GCKernel
362 kernel = GCKernel(shader_name, gles_program);
363
364 // Add built program to internal map
365 _built_programs_map.emplace(built_program_name, kernel);
366 }
367
Joel Liangf1f3ebd2017-11-10 09:59:19 +0800368 kernel.use();
369 kernel.clear_arguments();
370 // set shader params binding point
371 kernel.set_shader_params_binding_point(0);
372
Anthony Barbier7068f992017-10-26 15:23:08 +0100373 return kernel;
374}
375
376const std::string GCKernelLibrary::preprocess_shader(const std::string &shader_source) const
377{
378 enum class ParserStage
379 {
380 FIRST,
381 SKIP_COMMENTS = FIRST,
382 RESOLVE_INCLUDES,
Anthony Barbier7068f992017-10-26 15:23:08 +0100383 LAST
384 };
385
Anthony Barbier7068f992017-10-26 15:23:08 +0100386 // Define a GLES compute shader parser function
387 std::function<std::string(const std::string &, ParserStage, int)> cs_parser;
388 cs_parser = [&](const std::string & src, ParserStage stage, int nested_level) -> std::string
389 {
390 std::string dst;
391
392 if(stage == ParserStage::LAST || std::regex_match(src, std::regex(R"(\s*)")))
393 {
394 return src;
395 }
396 auto next_stage = static_cast<ParserStage>(static_cast<int>(stage) + 1);
397
398 std::string search_pattern;
399 switch(stage)
400 {
401 case ParserStage::SKIP_COMMENTS:
402 search_pattern = R"((/\*([^*]|\n|(\*+([^*/]|\n)))*\*+/)|(//.*))";
403 break;
404 case ParserStage::RESOLVE_INCLUDES:
405 search_pattern = R"rgx((?:^|\n)[ \t]*#include "(.*)")rgx";
406 break;
Anthony Barbier7068f992017-10-26 15:23:08 +0100407 default:
408 break;
409 }
410
411 std::regex search_regex(search_pattern);
412 std::smatch match;
413 ptrdiff_t parsed_pos = 0;
414 if(std::regex_search(src, match, search_regex))
415 {
416 // Pass the content before the match to the next stage
417 dst.append(cs_parser(src.substr(0, match.position()), next_stage, 0));
418 parsed_pos = match.position() + match.length();
419
420 // Deal with the matched content
421 switch(stage)
422 {
423 case ParserStage::RESOLVE_INCLUDES:
424 {
425 // Replace with the included file contents
426 // And parse the content from the first stage
427 const std::string source_name = _shader_path + match.str(1);
428 dst.append(cs_parser(read_file(source_name, false), ParserStage::FIRST, 0));
429 break;
430 }
Anthony Barbier7068f992017-10-26 15:23:08 +0100431 case ParserStage::SKIP_COMMENTS:
Anthony Barbier7068f992017-10-26 15:23:08 +0100432 default:
433 dst.append(match.str());
434 break;
435 }
436 next_stage = stage;
437 }
438 dst.append(cs_parser(src.substr(parsed_pos, src.length() - parsed_pos), next_stage, 0));
439
440 return dst;
441 };
442
443 return cs_parser(shader_source, ParserStage::FIRST, 0);
444}
445
446const GCProgram &GCKernelLibrary::load_program(const std::string &program_name) const
447{
448 const auto program_it = _programs_map.find(program_name);
449
450 if(program_it != _programs_map.end())
451 {
452 return program_it->second;
453 }
454
455 GCProgram program;
456
457#ifdef EMBEDDED_KERNELS
458 const auto program_source_it = _program_source_map.find(program_name);
459
460 if(_program_source_map.end() == program_source_it)
461 {
462 ARM_COMPUTE_ERROR("Embedded program for %s does not exist.", program_name.c_str());
463 }
464
Joel Liangabd03cf2018-01-08 15:20:48 +0800465 program = GCProgram(program_name, program_source_it->second);
Anthony Barbier7068f992017-10-26 15:23:08 +0100466#else /* EMBEDDED_KERNELS */
467 // Check for binary
468 std::string source_name = _shader_path + program_name;
469 if(std::ifstream(source_name).is_open())
470 {
471 program = GCProgram(program_name, preprocess_shader(read_file(source_name, false)));
472 }
473 else
474 {
475 ARM_COMPUTE_ERROR("Shader file %s does not exist.", source_name.c_str());
476 }
477#endif /* EMBEDDED_KERNELS */
478
479 // Insert program to program map
480 const auto new_program = _programs_map.emplace(program_name, std::move(program));
481
482 return new_program.first->second;
483}
484
Anthony Barbier7068f992017-10-26 15:23:08 +0100485void GCKernelLibrary::setup_dummy_fbo()
486{
487 ARM_COMPUTE_GL_CHECK(glGenFramebuffers(1, &_frame_buffer));
488 ARM_COMPUTE_GL_CHECK(glBindFramebuffer(GL_FRAMEBUFFER, _frame_buffer));
489 ARM_COMPUTE_GL_CHECK(glGenTextures(1, &_tex_rt));
490 ARM_COMPUTE_GL_CHECK(glBindTexture(GL_TEXTURE_2D, _tex_rt));
491 ARM_COMPUTE_GL_CHECK(glTexImage2D(GL_TEXTURE_2D, 0, GL_RGB, 1, 1, 0, GL_RGB, GL_UNSIGNED_BYTE, nullptr));
492 ARM_COMPUTE_GL_CHECK(glFramebufferTexture2D(GL_FRAMEBUFFER, GL_COLOR_ATTACHMENT0, GL_TEXTURE_2D, _tex_rt, 0));
493}
494
495GCKernelLibrary::~GCKernelLibrary()
496{
497 for(auto &program : _built_programs_map)
498 {
499 static_cast<GCKernel>(program.second).cleanup();
500 }
501
502 ARM_COMPUTE_GL_CHECK(glBindTexture(GL_TEXTURE_2D, 0));
503 ARM_COMPUTE_GL_CHECK(glBindFramebuffer(GL_FRAMEBUFFER, 0));
504 ARM_COMPUTE_GL_CHECK(glDeleteTextures(1, &_tex_rt));
505 ARM_COMPUTE_GL_CHECK(glDeleteFramebuffers(1, &_frame_buffer));
Anthony Barbier7068f992017-10-26 15:23:08 +0100506}
507
508std::string GCKernelLibrary::stringify_set(const StringSet &s) const
509{
510 std::string concat_set;
511
512 // Concatenate set
513 for(const auto &el : s)
514 {
515 concat_set += el + "\n";
516 }
517
518 return concat_set;
519}