diff options
author | Anthony Barbier <anthony.barbier@arm.com> | 2017-11-28 10:31:43 +0000 |
---|---|---|
committer | Anthony Barbier <anthony.barbier@arm.com> | 2018-11-02 16:41:58 +0000 |
commit | fcd52fbc578a2f5e6a1df4c823284621cc55645a (patch) | |
tree | b6e7430b2e69fa26fa2405723f827a7e7dc73447 /src/core/CL/kernels/CLCol2ImKernel.cpp | |
parent | 666635c68ebbb182d1db4a85f33ed5325d472a65 (diff) | |
download | ComputeLibrary-fcd52fbc578a2f5e6a1df4c823284621cc55645a.tar.gz |
COMPMID-661: Vectorize im2col and add lws heuristics for convolution kernels #46
Change-Id: Idaab987384d6a12a114f609abd50446fd94536b2
Reviewed-on: https://eu-gerrit-1.euhpc.arm.com/110879
Tested-by: BSG Visual Compute Jenkins server to access repositories on http://mpd-gerrit.cambridge.arm.com <bsgcomp@arm.com>
Reviewed-by: Anthony Barbier <anthony.barbier@arm.com>
Diffstat (limited to 'src/core/CL/kernels/CLCol2ImKernel.cpp')
-rw-r--r-- | src/core/CL/kernels/CLCol2ImKernel.cpp | 15 |
1 files changed, 15 insertions, 0 deletions
diff --git a/src/core/CL/kernels/CLCol2ImKernel.cpp b/src/core/CL/kernels/CLCol2ImKernel.cpp
index 31cc6448c9..f2886c569a 100644
--- a/src/core/CL/kernels/CLCol2ImKernel.cpp
+++ b/src/core/CL/kernels/CLCol2ImKernel.cpp
@@ -72,6 +72,21 @@ void CLCol2ImKernel::configure(const ICLTensor *input, ICLTensor *output, std::p
     _kernel = static_cast<cl::Kernel>(CLKernelLibrary::get().create_kernel("col2im", build_opts));
 
+    // Configure the local work size for Bifrost with a value obtained
+    // via exhaustive autotuning over 30 representative tensor shapes.
+    const GPUTarget gpu_target = get_arch_from_target(get_target());
+    if(gpu_target == GPUTarget::BIFROST)
+    {
+        if((_convolved_dims.first == 7) || (_convolved_dims.first == 14))
+        {
+            _lws_hint = cl::NDRange(1, 7, 1);
+        }
+        else
+        {
+            _lws_hint = cl::NDRange(1, 8, 1);
+        }
+    }
+
     // Configure window
     Window win = calculate_max_window(*input->info(), Steps());