From 562deffa6ff7630aa517ab37fefab1936e9f4b1e Mon Sep 17 00:00:00 2001
From: Gian Marco
Date: Wed, 7 Feb 2018 10:18:06 +0000
Subject: COMPMID-765 - Added LWS hint in CLIm2Col

The LWS hint has been applied for optimized cases 1x1 and 3x3

Change-Id: I6b4bfe2f9f7da627052336889b8a18d279fe2675
Reviewed-on: https://eu-gerrit-1.euhpc.arm.com/119162
Reviewed-by: Michalis Spyrou
Reviewed-by: Georgios Pinitas
Tested-by: Jenkins
---
 src/core/CL/kernels/CLIm2ColKernel.cpp | 3 +++
 1 file changed, 3 insertions(+)

(limited to 'src/core/CL/kernels/CLIm2ColKernel.cpp')

diff --git a/src/core/CL/kernels/CLIm2ColKernel.cpp b/src/core/CL/kernels/CLIm2ColKernel.cpp
index d1fc50365e..b75d2646c6 100644
--- a/src/core/CL/kernels/CLIm2ColKernel.cpp
+++ b/src/core/CL/kernels/CLIm2ColKernel.cpp
@@ -135,12 +135,15 @@ void CLIm2ColKernel::configure(const ICLTensor *input, ICLTensor *output, const
                     // Optimized im2col1x1 if stride_x = 1 and conv_info.has_padding() = false
                     if(conv_info.stride().first == 1 && !conv_info.has_padding())
                     {
+                        // Set hint for LWS
+                        _lws_hint = cl::NDRange(1, 1, 8);
                         _num_elems_processed_per_iteration = 4;
                         is_optimized_path = true;
                         kernel_name = "im2col1x1_stridex1_dchw";
                     }
                     break;
                 case 3:
+                    _lws_hint = cl::NDRange(1, 1, 8);
                     _num_elems_processed_per_iteration = 1;
                     is_optimized_path = true;
                     kernel_name = "im2col3x3_dchw";
--
cgit v1.2.1