diff options
author | Gary Antcliffe <gary.antcliffe@arm.com> | 2019-05-28 11:40:21 +0100 |
---|---|---|
committer | Gary Antcliffe <gary.antcliffe@arm.com> | 2019-06-27 14:09:00 +0000 |
commit | fffbdbcc52ae2f30b9c51637d82e5e1f5d604e71 (patch) | |
tree | ac2c43d7b69d61aed29a6ee3151806797e87f739 /src/core/CL/kernels/CLGaussianPyramidKernel.cpp | |
parent | d8a468f90030edf7be512c00fce7230065456f61 (diff) | |
download | ComputeLibrary-fffbdbcc52ae2f30b9c51637d82e5e1f5d604e71.tar.gz |
COMPUTE-10611: CL: Set config_id to enabling LWS tuning
Change-Id: Ie457ab751e1527841c3e2881a25eac889435a26e
Signed-off-by: Gary Antcliffe <gary.antcliffe@arm.com>
Reviewed-on: https://review.mlplatform.org/c/1408
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Georgios Pinitas <georgios.pinitas@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/core/CL/kernels/CLGaussianPyramidKernel.cpp')
-rw-r--r-- | src/core/CL/kernels/CLGaussianPyramidKernel.cpp | 32 |
1 files changed, 30 insertions, 2 deletions
diff --git a/src/core/CL/kernels/CLGaussianPyramidKernel.cpp b/src/core/CL/kernels/CLGaussianPyramidKernel.cpp index c9c7bf39a9..27b73b6d32 100644 --- a/src/core/CL/kernels/CLGaussianPyramidKernel.cpp +++ b/src/core/CL/kernels/CLGaussianPyramidKernel.cpp @@ -56,7 +56,8 @@ void CLGaussianPyramidHorKernel::configure(const ICLTensor *input, ICLTensor *ou _output = output; // Create kernel - _kernel = static_cast<cl::Kernel>(CLKernelLibrary::get().create_kernel("gaussian1x5_sub_x")); + const std::string kernel_name = std::string("gaussian1x5_sub_x"); + _kernel = static_cast<cl::Kernel>(CLKernelLibrary::get().create_kernel(kernel_name)); // Configure kernel window constexpr unsigned int num_elems_processed_per_iteration = 16; @@ -96,6 +97,19 @@ void CLGaussianPyramidHorKernel::configure(const ICLTensor *input, ICLTensor *ou output->info()->set_valid_region(ValidRegion(Coordinates(), output->info()->tensor_shape())); ICLKernel::configure_internal(win); + + // Set config_id for enabling LWS tuning + _config_id = kernel_name; + _config_id += "_"; + _config_id += lower_string(string_from_data_type(input->info()->data_type())); + _config_id += "_"; + _config_id += support::cpp11::to_string(input->info()->dimension(0)); + _config_id += "_"; + _config_id += support::cpp11::to_string(input->info()->dimension(1)); + _config_id += "_"; + _config_id += support::cpp11::to_string(output->info()->dimension(0)); + _config_id += "_"; + _config_id += support::cpp11::to_string(output->info()->dimension(1)); } void CLGaussianPyramidHorKernel::run(const Window &window, cl::CommandQueue &queue) @@ -148,7 +162,8 @@ void CLGaussianPyramidVertKernel::configure(const ICLTensor *input, ICLTensor *o _output = output; // Create kernel - _kernel = static_cast<cl::Kernel>(CLKernelLibrary::get().create_kernel("gaussian5x1_sub_y")); + const std::string kernel_name = std::string("gaussian5x1_sub_y"); + _kernel = static_cast<cl::Kernel>(CLKernelLibrary::get().create_kernel("gaussian5x1_sub_y")); // Configure kernel window constexpr unsigned int num_elems_processed_per_iteration = 8; @@ -178,6 +193,19 @@ void CLGaussianPyramidVertKernel::configure(const ICLTensor *input, ICLTensor *o output->info()->set_valid_region(ValidRegion(Coordinates(), output->info()->tensor_shape())); ICLKernel::configure_internal(win); + + // Set config_id for enabling LWS tuning + _config_id = kernel_name; + _config_id += "_"; + _config_id += lower_string(string_from_data_type(input->info()->data_type())); + _config_id += "_"; + _config_id += support::cpp11::to_string(input->info()->dimension(0)); + _config_id += "_"; + _config_id += support::cpp11::to_string(input->info()->dimension(1)); + _config_id += "_"; + _config_id += support::cpp11::to_string(output->info()->dimension(0)); + _config_id += "_"; + _config_id += support::cpp11::to_string(output->info()->dimension(1)); } void CLGaussianPyramidVertKernel::run(const Window &window, cl::CommandQueue &queue) |