/*
 * Copyright (c) 2016, 2017 ARM Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
24#ifndef __ARM_COMPUTE_CLSCHEDULER_H__
25#define __ARM_COMPUTE_CLSCHEDULER_H__
26
27#include "arm_compute/core/CL/CLHelpers.h"
28#include "arm_compute/core/CL/CLKernelLibrary.h"
29#include "arm_compute/core/CL/CLTypes.h"
30#include "arm_compute/core/CL/OpenCL.h"
31#include "arm_compute/core/Error.h"
32#include "arm_compute/core/Types.h"
Gian Marcode691f02017-09-08 16:13:11 +010033#include "arm_compute/runtime/CL/CLTuner.h"
Anthony Barbier6ff3b192017-09-04 18:44:23 +010034
steniu01f01f9de2017-09-27 17:00:11 +010035#if defined(ARM_COMPUTE_DEBUG_ENABLED)
namespace
{
/** Callback that echoes a chunk of printf output to stdout.
 *
 * It is installed on the debug OpenCL context through the CL_PRINTF_CALLBACK_ARM property.
 *
 * @param[in] buffer    Characters to print; at most @p len of them are written.
 * @param[in] len       Number of characters available in @p buffer.
 * @param[in] complete  Unused by this implementation.
 * @param[in] user_data Unused by this implementation.
 *
 * NOTE(review): the cl_arm_printf extension appears to declare @p len as size_t - confirm against the
 * extension specification before changing the signature.
 */
void printf_callback(const char *buffer, unsigned int len, size_t complete, void *user_data)
{
    // Neither argument is needed here; reference them so unused-parameter warnings stay quiet.
    static_cast<void>(complete);
    static_cast<void>(user_data);

    // "%.*s" reads its precision as an int. A length that does not fit in an int would turn into a
    // negative precision, which printf treats as "no precision" and would read past the buffer,
    // so such a length (and an empty or missing buffer) is skipped instead.
    const int precision = static_cast<int>(len);
    if(buffer == nullptr || precision <= 0)
    {
        return;
    }

    printf("%.*s", precision, buffer);
}
}
43#endif /* defined(ARM_COMPUTE_DEBUG_ENABLED) */
44
Anthony Barbier6ff3b192017-09-04 18:44:23 +010045namespace arm_compute
46{
47class ICLKernel;
48
49/** Provides global access to a CL context and command queue. */
50class CLScheduler
51{
52private:
53 /** Constructor */
54 CLScheduler();
Gian Marcode691f02017-09-08 16:13:11 +010055 /** Prevent instances of this class from being copied (As this class contains pointers) */
56 CLScheduler(const CLScheduler &) = delete;
57 /** Prevent instances of this class from being copied (As this class contains pointers) */
58 CLScheduler &operator=(const CLScheduler &) = delete;
Anthony Barbier6ff3b192017-09-04 18:44:23 +010059
60public:
61 /** Access the scheduler singleton.
62 *
63 * @return The scheduler
64 */
65 static CLScheduler &get();
66 /** Initialises the context and command queue used by the scheduler to default values
67 * and sets a default device and kernel path for the @ref CLKernelLibrary.
Gian Marcode691f02017-09-08 16:13:11 +010068 *
69 * @param[in] cl_tuner (Optional) Pointer to ICLTuner (default=nullptr)
Anthony Barbier6ff3b192017-09-04 18:44:23 +010070 */
Gian Marcode691f02017-09-08 16:13:11 +010071 void default_init(ICLTuner *cl_tuner = nullptr)
Anthony Barbier6ff3b192017-09-04 18:44:23 +010072 {
steniu01f01f9de2017-09-27 17:00:11 +010073#if defined(ARM_COMPUTE_DEBUG_ENABLED)
Anthony Barbiera9e15332017-12-22 16:37:30 +000074 // Create a cl_context with a printf_callback and user specified buffer size.
75 cl_context_properties properties[] =
76 {
77 // Enable a printf callback function for this context.
78 CL_PRINTF_CALLBACK_ARM, reinterpret_cast<cl_context_properties>(printf_callback),
79 // Request a minimum printf buffer size of 4MB for devices in the
80 // context that support this extension.
81 CL_PRINTF_BUFFERSIZE_ARM, static_cast<cl_context_properties>(0x100000),
82 CL_CONTEXT_PLATFORM, reinterpret_cast<cl_context_properties>(cl::Platform::get()()),
83 0
84 };
steniu01f01f9de2017-09-27 17:00:11 +010085 cl::Context::setDefault(cl::Context(CL_DEVICE_TYPE_DEFAULT, properties));
86#endif // defined(ARM_COMPUTE_DEBUG_ENABLED)
87
Anthony Barbier6ff3b192017-09-04 18:44:23 +010088 CLKernelLibrary::get().init("./cl_kernels/", cl::Context::getDefault(), cl::Device::getDefault());
Gian Marcode691f02017-09-08 16:13:11 +010089 init(cl::Context::getDefault(), cl::CommandQueue::getDefault(), cl::Device::getDefault(), cl_tuner);
Anthony Barbier6ff3b192017-09-04 18:44:23 +010090 }
91 /** Schedule the execution of the passed kernel if possible.
92 *
93 * @param[in] kernel Kernel to execute.
94 * @param[in] flush (Optional) Specifies if the command queue will be flushed after running the kernel.
95 */
96 void enqueue(ICLKernel &kernel, bool flush = true);
97
98 /** Initialises the context and command queue to be used by the scheduler.
99 *
Gian Marcode691f02017-09-08 16:13:11 +0100100 * @param[in] context A CL context.
101 * @param[in] queue A CL command queue.
102 * @param[in] device A CL device.
103 * @param[in] cl_tuner (Optional) Pointer to OpenCL tuner (default=nullptr)
104 * Note: It is caller's responsibility to release the allocated memory for CLTuner
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100105 */
106 void init(cl::Context context = cl::Context::getDefault(), cl::CommandQueue queue = cl::CommandQueue::getDefault(),
Gian Marcode691f02017-09-08 16:13:11 +0100107 cl::Device device = cl::Device::getDefault(), ICLTuner *cl_tuner = nullptr)
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100108 {
steniu0134702472017-07-11 09:22:58 +0100109 _context = std::move(context);
110 _queue = std::move(queue);
111 _target = get_target_from_device(device);
112 _is_initialised = true;
Gian Marcode691f02017-09-08 16:13:11 +0100113 _cl_tuner = cl_tuner;
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100114 }
115
116 /** Accessor for the associated CL context.
117 *
118 * @return A CL context.
119 */
120 cl::Context &context()
121 {
steniu0134702472017-07-11 09:22:58 +0100122 ARM_COMPUTE_ERROR_ON(!_is_initialised);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100123 return _context;
124 }
125
126 /** Accessor to set the CL context to be used by the scheduler.
127 *
128 * @param[in] context A CL context.
129 */
130 void set_context(cl::Context context)
131 {
132 _context = std::move(context);
133 }
134
135 /** Accessor for the associated CL command queue.
136 *
137 * @return A CL command queue.
138 */
139 cl::CommandQueue &queue()
140 {
steniu0134702472017-07-11 09:22:58 +0100141 ARM_COMPUTE_ERROR_ON(!_is_initialised);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100142 return _queue;
143 }
144
145 /** Get the target GPU.
146 *
147 * @return The target GPU.
148 */
149 GPUTarget target() const
150 {
151 return _target;
152 }
153
154 /** Accessor to set the CL command queue to be used by the scheduler.
155 *
156 * @param[in] queue A CL command queue.
157 */
158 void set_queue(cl::CommandQueue queue)
159 {
160 _queue = std::move(queue);
161 }
162
163 /** Accessor to set target GPU to be used by the scheduler.
164 *
165 * @param[in] target The target GPU.
166 */
167 void set_target(GPUTarget target)
168 {
169 _target = target;
170 }
171
172 /** Blocks until all commands in the associated command queue have finished. */
173 void sync()
174 {
175 _queue.finish();
176 }
177
178 /** Enqueues a marker into the associated command queue and return the event.
179 *
180 * @return An event that can be waited on to block the executing thread.
181 */
182 cl::Event enqueue_sync_event()
183 {
184 cl::Event event;
185 _queue.enqueueMarker(&event);
186
187 return event;
188 }
189
190private:
Gian Marcode691f02017-09-08 16:13:11 +0100191 /** Tune OpenCL kernel
192 *
193 * @note This method uses a brute force approach to find the optimal LWS
194 *
195 * @param[in] kernel Kernel to tune
196 *
197 * @return The optimal LWS for the specified kernel
198 */
199 cl::NDRange tune_kernel(ICLKernel &kernel);
200
Ioan-Cristian Szabo77eb21f2017-12-22 17:32:17 +0000201 /** Flag to ensure symbols initialisation is happening before Scheduler creation */
202 static std::once_flag _initialize_symbols;
203
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100204 cl::Context _context;
205 cl::CommandQueue _queue;
206 GPUTarget _target;
steniu0134702472017-07-11 09:22:58 +0100207 bool _is_initialised;
Gian Marcode691f02017-09-08 16:13:11 +0100208 ICLTuner *_cl_tuner;
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100209};
210}
211#endif /* __ARM_COMPUTE_CLSCHEDULER_H__ */