aboutsummaryrefslogtreecommitdiff
path: root/src
diff options
context:
space:
mode:
authorsteniu01 <steven.niu@arm.com>2017-07-11 09:22:58 +0100
committerAnthony Barbier <anthony.barbier@arm.com>2018-09-17 14:15:39 +0100
commit34702479adcf3559e8ebe27915179af509b070d2 (patch)
tree683b6d81396a6515281f0575f9761efc50d538e8 /src
parentbb4a79b1667eaf9bdb30853c595e6d22d2589f82 (diff)
downloadComputeLibrary-34702479adcf3559e8ebe27915179af509b070d2.tar.gz
COMPMID-417 Checking CL non uniform support at runtime.
What have been done in the ticket are: 1. Add support to check whether cl-non-unform-workgroup is supported at runtime 2. Add helper function to check the CL version at runtime 3. Add boolen to check whether CLSecheduler's init has been called. Change-Id: I6e6df8eb5cebfac7229aa406242bb183477fd191 Reviewed-on: http://mpd-gerrit.cambridge.arm.com/80265 Tested-by: Kaizen <jeremy.johnson+kaizengerrit@arm.com> Reviewed-by: Anthony Barbier <anthony.barbier@arm.com>
Diffstat (limited to 'src')
-rw-r--r--src/core/CL/CLHelpers.cpp53
-rw-r--r--src/core/CL/CLKernelLibrary.cpp23
-rw-r--r--src/runtime/CL/CLScheduler.cpp6
3 files changed, 78 insertions, 4 deletions
diff --git a/src/core/CL/CLHelpers.cpp b/src/core/CL/CLHelpers.cpp
index 835260d35a..dd87e778d7 100644
--- a/src/core/CL/CLHelpers.cpp
+++ b/src/core/CL/CLHelpers.cpp
@@ -166,4 +166,57 @@ GPUTarget get_arch_from_target(GPUTarget target)
{
return (target & GPUTarget::GPU_ARCH_MASK);
}
+
+bool non_uniform_workgroup_support(const cl::Device &device)
+{
+ std::vector<char> extension;
+ size_t extension_size = 0;
+ cl_int err = clGetDeviceInfo(device.get(), CL_DEVICE_EXTENSIONS, 0, nullptr, &extension_size);
+ ARM_COMPUTE_ERROR_ON_MSG((err != 0) || (extension_size == 0), "clGetDeviceInfo failed to return valid information");
+ // Resize vector
+ extension.resize(extension_size);
+ // Query extension
+ err = clGetDeviceInfo(device.get(), CL_DEVICE_EXTENSIONS, extension_size, extension.data(), nullptr);
+ ARM_COMPUTE_ERROR_ON_MSG(err != 0, "clGetDeviceInfo failed to return valid information");
+ ARM_COMPUTE_UNUSED(err);
+
+ std::string extension_str(extension.begin(), extension.end());
+ auto pos = extension_str.find("cl_arm_non_uniform_work_group_size");
+ return (pos != std::string::npos);
+}
+
+CLVersion get_cl_version(const cl::Device &device)
+{
+ std::vector<char> version;
+ size_t version_size = 0;
+ cl_int err = clGetDeviceInfo(device.get(), CL_DEVICE_VERSION, 0, nullptr, &version_size);
+ ARM_COMPUTE_ERROR_ON_MSG((err != 0) || (version_size == 0), "clGetDeviceInfo failed to return valid information");
+ // Resize vector
+ version.resize(version_size);
+ // Query version
+ err = clGetDeviceInfo(device.get(), CL_DEVICE_VERSION, version_size, version.data(), nullptr);
+ ARM_COMPUTE_ERROR_ON_MSG(err != 0, "clGetDeviceInfo failed to return valid information");
+ ARM_COMPUTE_UNUSED(err);
+
+ std::string version_str(version.begin(), version.end());
+ if(version_str.find("OpenCL 2") != std::string::npos)
+ {
+ return CLVersion::CL20;
+ }
+ else if(version_str.find("OpenCL 1.2") != std::string::npos)
+ {
+ return CLVersion::CL12;
+ }
+ else if(version_str.find("OpenCL 1.1") != std::string::npos)
+ {
+ return CLVersion::CL11;
+ }
+ else if(version_str.find("OpenCL 1.0") != std::string::npos)
+ {
+ return CLVersion::CL10;
+ }
+
+ return CLVersion::UNKNOWN;
+}
+
} // namespace arm_compute
diff --git a/src/core/CL/CLKernelLibrary.cpp b/src/core/CL/CLKernelLibrary.cpp
index 72230435d8..769d50992d 100644
--- a/src/core/CL/CLKernelLibrary.cpp
+++ b/src/core/CL/CLKernelLibrary.cpp
@@ -23,6 +23,7 @@
*/
#include "arm_compute/core/CL/CLKernelLibrary.h"
+#include "arm_compute/core/CL/CLHelpers.h"
#include "arm_compute/core/Error.h"
#include "arm_compute/core/Utils.h"
@@ -514,9 +515,25 @@ Kernel CLKernelLibrary::create_kernel(const std::string &kernel_name, const Stri
ARM_COMPUTE_ERROR("Kernel %s not found in the CLKernelLibrary", kernel_name.c_str());
}
+ std::string concat_str;
+
+ if(non_uniform_workgroup_support(_device))
+ {
+ concat_str += " -cl-arm-non-uniform-work-group-size ";
+ }
+ else if(get_cl_version(_device) == CLVersion::CL20)
+ {
+ concat_str += " -cl-std=CL2.0 ";
+ }
+ else
+ {
+ ARM_COMPUTE_ERROR("Non uniform workgroup size is not supported!!");
+ }
+
// Check if the program has been built before with same build options.
- const std::string program_name = kernel_program_it->second;
- const std::string build_options = stringify_set(build_options_set);
+ const std::string program_name = kernel_program_it->second;
+ const std::string build_options = stringify_set(build_options_set) + concat_str;
+
const std::string built_program_name = program_name + "_" + build_options;
auto built_program_it = _built_programs_map.find(built_program_name);
@@ -591,7 +608,7 @@ const Program &CLKernelLibrary::load_program(const std::string &program_name) co
std::string CLKernelLibrary::stringify_set(const StringSet &s) const
{
- std::string concat_set = "-cl-arm-non-uniform-work-group-size ";
+ std::string concat_set;
#ifndef EMBEDDED_KERNELS
concat_set += "-I" + _kernel_path + " ";
diff --git a/src/runtime/CL/CLScheduler.cpp b/src/runtime/CL/CLScheduler.cpp
index fe25ce534c..f413f626eb 100644
--- a/src/runtime/CL/CLScheduler.cpp
+++ b/src/runtime/CL/CLScheduler.cpp
@@ -28,7 +28,7 @@
using namespace arm_compute;
CLScheduler::CLScheduler()
- : _context(), _queue(), _target(GPUTarget::MIDGARD)
+ : _context(), _queue(), _target(GPUTarget::MIDGARD), _is_initialised(false)
{
}
@@ -40,6 +40,10 @@ CLScheduler &CLScheduler::get()
void CLScheduler::enqueue(ICLKernel &kernel, bool flush)
{
+ ARM_COMPUTE_ERROR_ON_MSG(!_is_initialised,
+ "The CLScheduler is not initialised yet! Please call the CLScheduler::get().default_init(), \
+ or CLScheduler::get()::init() and CLKernelLibrary::get()::init() function before running functions!");
+
kernel.run(kernel.window(), _queue);
if(flush)