Compute Library
 23.05
CLScheduler.h
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2016-2022 Arm Limited.
3  *
4  * SPDX-License-Identifier: MIT
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a copy
7  * of this software and associated documentation files (the "Software"), to
8  * deal in the Software without restriction, including without limitation the
9  * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10  * sell copies of the Software, and to permit persons to whom the Software is
11  * furnished to do so, subject to the following conditions:
12  *
13  * The above copyright notice and this permission notice shall be included in all
14  * copies or substantial portions of the Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22  * SOFTWARE.
23  */
24 #ifndef ARM_COMPUTE_CLSCHEDULER_H
25 #define ARM_COMPUTE_CLSCHEDULER_H
26 
30 #include "arm_compute/core/Error.h"
31 #include "arm_compute/core/Types.h"
37 
38 namespace arm_compute
39 {
40 class ICLKernel;
41 class ICLTuner;
42 /** Provides global access to a CL context and command queue. */
43 class CLScheduler final
44 {
45 public:
46  /** Constructor */
47  CLScheduler();
48  /** Prevent instances of this class from being copied (As this class contains pointers) */
49  CLScheduler(const CLScheduler &) = delete;
50  /** Prevent instances of this class from being copied (As this class contains pointers) */
51  CLScheduler &operator=(const CLScheduler &) = delete;
52  /** Default destructor */
53  ~CLScheduler() = default;
54  /** Access the scheduler singleton.
55  * This method has been deprecated and will be removed in future releases
56  * @return The scheduler
57  */
58  static CLScheduler &get();
59  /** Initialises the context and command queue used by the scheduler to default values
60  * and sets a default device and kernel path for the @ref CLKernelLibrary.
61  *
62  * @param[in] cl_tuner (Optional) Pointer to ICLTuner (default=nullptr)
63  * @param[in] gemm_h (Optional) Pointer to CLGEMMHeuristicsHandle (default = nullptr)
64  * @param[in] cl_backend_type (Optional) Type of backend to use (default = CLBackendType::Native)
65  */
66  void default_init(ICLTuner *cl_tuner = nullptr, CLGEMMHeuristicsHandle *gemm_h = nullptr, CLBackendType cl_backend_type = CLBackendType::Native);
67  /** Initialises the scheduler with context and device provided by the user
68  *
69  * @param[in] device OpenCL device to be used
70  * @param[in] ctx OpenCL context to be used
71  * @param[in] cl_tuner (Optional) Pointer to ICLTuner (default=nullptr)
72  * @param[in] gemm_h (Optional) Pointer to CLGEMMHeuristicsHandle (default = nullptr)
73  */
74  void default_init_with_context(cl::Device &device, cl::Context &ctx, ICLTuner *cl_tuner = nullptr, CLGEMMHeuristicsHandle *gemm_h = nullptr);
75 
76  /** Re-initializes the context and command queue used by the scheduler to default values
77  * and sets a default device and kernel path for the @ref CLKernelLibrary.
78  *
79  * @param[in] cl_tuner (Optional) Pointer to ICLTuner (default=nullptr)
80  * @param[in] gemm_h (Optional) Pointer to CLGEMMHeuristicsHandle (default = nullptr)
81  * @param[in] cl_backend_type (Optional) Type of backend to use (default = CLBackendType::Native)
82  */
83  void default_reinit(ICLTuner *cl_tuner = nullptr, CLGEMMHeuristicsHandle *gemm_h = nullptr, CLBackendType cl_backend_type = CLBackendType::Native);
84 
85  /** Schedule the execution of the passed kernel if possible.
86  *
87  * @param[in] kernel Kernel to execute.
88  * @param[in] flush (Optional) Specifies if the command queue will be flushed after running the kernel. This will be ignored if job chaining is enabled.
89  */
90  void enqueue(ICLKernel &kernel, bool flush = true);
91  /** Schedule the execution of the passed kernel if possible.
92  *
93  * @param[in] kernel Kernel to execute.
94  * @param[in] tensors Vector containing the tensors to operate on.
95  * @param[in] flush (Optional) Specifies if the command queue will be flushed after running the kernel. This will be ignored if job chaining is enabled.
96  */
97  void enqueue_op(ICLKernel &kernel, ITensorPack &tensors, bool flush = true);
98  /** Initialises the context and command queue to be used by the scheduler.
99  *
100  * @param[in] context A CL context.
101  * @param[in] queue A CL command queue.
102  * @param[in] device A CL device.
103  * @param[in] cl_tuner (Optional) Pointer to OpenCL tuner (default=nullptr)
104  * Note: It is the caller's responsibility to release the allocated memory for CLTuner
105  * @param[in] gemm_h (Optional) Pointer to CLGEMMHeuristicsHandle (default = nullptr)
106  * @param[in] cl_backend_type (Optional) Type of backend to use (default = CLBackendType::Native)
107  */
108  void init(cl::Context context, cl::CommandQueue queue, const cl::Device &device, ICLTuner *cl_tuner = nullptr, CLGEMMHeuristicsHandle *gemm_h = nullptr,
109  CLBackendType cl_backend_type = CLBackendType::Native);
110 
111  /** Accessor for the associated CL context.
112  *
113  * @return A CL context.
114  */
115  cl::Context &context();
116 
117  /** Accessor for the associated CL command queue.
118  *
119  * @return A CL command queue.
120  */
121  cl::CommandQueue &queue();
122 
123  /** Get the target GPU.
124  *
125  * @return The target GPU.
126  */
127  GPUTarget target() const;
128 
129  /** Accessor for the associated CLGEMMHeuristicsHandle
130  *
131  * @return Pointer to CLGEMMHeuristicsHandle
132  */
133  CLGEMMHeuristicsHandle *gemm_heuristics() const;
134 
135  /** Accessor to set the CL context to be used by the scheduler.
136  *
137  * @param[in] context A CL context.
138  */
139  void set_context(cl::Context context);
140 
141  /** Accessor to set the CL command queue to be used by the scheduler.
142  *
143  * @param[in] queue A CL command queue.
144  */
145  void set_queue(cl::CommandQueue queue);
146 
147  /** Accessor to set target GPU to be used by the scheduler.
148  *
149  * @param[in] target The target GPU.
150  */
151  void set_target(GPUTarget target);
152 
153  /** Accessor to set the CL tuner to be used by the scheduler.
154  *
155  * @param[in] tuner A CL tuner
156  */
157  void set_tuner(ICLTuner *tuner);
158 
159  /** Blocks until all commands in the associated command queue have finished. */
160  void sync();
161 
162  /** Enqueues a marker into the associated command queue and returns the event.
163  *
164  * @return An event that can be waited on to block the executing thread.
165  */
166  cl::Event enqueue_sync_event();
167 
168  /** Tunes OpenCL kernel
169  *
170  * @param[in] kernel Kernel to tune
171  */
172  void tune_kernel_static(ICLKernel &kernel);
173 
174  /** Enable job chaining. The command queue will only be flushed when @p job_chaining_size kernels have been enqueued.
175  *
176  * @param[in] job_chaining_size Kernels to enqueue before flushing
177  */
178  void enable_job_chaining(int job_chaining_size);
179 
180  bool is_initialised() const;
181 
182 private:
183  void enqueue_common(ICLKernel &kernel, ITensorPack &tensors, bool flush);
184  /** If job chaining is disabled, flush the command queue according to @p flush. Otherwise @p flush is ignored and the queue is only flushed when the job chaining count exceeds the configured job chaining size.
185  *
186  * @param[in] flush Flush the command queue. Ignored when job chain is enabled.
187  */
188  void flush_queue(bool flush);
189 
190  /** Flag to ensure symbols initialisation happens before Scheduler creation */
191  static std::once_flag _initialize_symbols;
192 
193  cl::Context _context;
194  cl::CommandQueue _queue;
195  GPUTarget _target;
196  bool _is_initialised;
197  ICLTuner *_cl_tuner;
198  CLGEMMHeuristicsHandle *_gemm_heuristics;
199  CLBackendType _backend_type;
200  bool _job_chaining_enabled;
201  int _job_chaining_size;
202  int _job_chaining_count;
203 };
204 } // namespace arm_compute
205 #endif /* ARM_COMPUTE_CLSCHEDULER_H */
void set_target(GPUTarget target)
Accessor to set target GPU to be used by the scheduler.
Definition: CLScheduler.cpp:60
void default_reinit(ICLTuner *cl_tuner=nullptr, CLGEMMHeuristicsHandle *gemm_h=nullptr, CLBackendType cl_backend_type=CLBackendType::Native)
Re-initializes the context and command queue used by the scheduler to default values and sets a default device and kernel path for the CLKernelLibrary.
void enable_job_chaining(int job_chaining_size)
Enable job chaining.
GPUTarget target() const
Get the target GPU.
Definition: CLScheduler.cpp:45
void set_context(cl::Context context)
Accessor to set the CL context to be used by the scheduler.
void default_init_with_context(cl::Device &device, cl::Context &ctx, ICLTuner *cl_tuner=nullptr, CLGEMMHeuristicsHandle *gemm_h=nullptr)
Initialises the scheduler with context and device provided by the user.
void default_init(ICLTuner *cl_tuner=nullptr, CLGEMMHeuristicsHandle *gemm_h=nullptr, CLBackendType cl_backend_type=CLBackendType::Native)
Initialises the context and command queue used by the scheduler to default values and sets a default device and kernel path for the CLKernelLibrary.
OpenCL native backend.
CLScheduler & operator=(const CLScheduler &)=delete
Prevent instances of this class from being copied (As this class contains pointers) ...
~CLScheduler()=default
Default destructor.
bool is_initialised() const
Definition: CLScheduler.cpp:90
Common interface for all the OpenCL kernels.
Definition: ICLKernel.h:67
CLGEMMHeuristicsHandle * gemm_heuristics() const
Accessor for the associated CLGEMMHeuristicsHandle.
Definition: CLScheduler.cpp:50
Copyright (c) 2017-2023 Arm Limited.
cl::Context & context()
Accessor for the associated CL context.
Definition: CLScheduler.cpp:32
cl::Event enqueue_sync_event()
Enqueues a marker into the associated command queue and returns the event.
Definition: CLScheduler.cpp:75
Interface used to tune the local work-group size of OpenCL kernels.
void enqueue_op(ICLKernel &kernel, ITensorPack &tensors, bool flush=true)
Schedule the execution of the passed kernel if possible.
void set_tuner(ICLTuner *tuner)
Accessor to set the CL tuner to be used by the scheduler.
Definition: CLScheduler.cpp:65
cl::CommandQueue & queue()
Accessor for the associated CL command queue.
Definition: CLScheduler.cpp:39
void enqueue(ICLKernel &kernel, bool flush=true)
Schedule the execution of the passed kernel if possible.
void set_queue(cl::CommandQueue queue)
Accessor to set the CL command queue to be used by the scheduler.
Definition: CLScheduler.cpp:55
CLScheduler()
Constructor.
Definition: CLScheduler.cpp:97
void sync()
Blocks until all commands in the associated command queue have finished.
Definition: CLScheduler.cpp:70
Handle for loading and retrieving GEMM heuristics.
CLBackendType
List the possible OpenCL backends.
Definition: CLTypes.h:55
GPUTarget
Available GPU Targets.
Definition: GPUTarget.h:34
Provides global access to a CL context and command queue.
Definition: CLScheduler.h:43
Wrapper to configure the Khronos OpenCL C++ header.
Tensor packing service.
Definition: ITensorPack.h:39
Basic interface for tuning the OpenCL kernels.
Definition: ICLTuner.h:34
void tune_kernel_static(ICLKernel &kernel)
Tunes OpenCL kernel.
Definition: CLScheduler.cpp:82
void init(cl::Context context, cl::CommandQueue queue, const cl::Device &device, ICLTuner *cl_tuner=nullptr, CLGEMMHeuristicsHandle *gemm_h=nullptr, CLBackendType cl_backend_type=CLBackendType::Native)
Initialises the context and command queue to be used by the scheduler.