aboutsummaryrefslogtreecommitdiff
path: root/src/core/gpu/cl/kernels/ClDirectConvolutionKernel.cpp
diff options
context:
space:
mode:
author Michalis Spyrou <michalis.spyrou@arm.com> 2021-03-19 15:06:07 +0000
committer Georgios Pinitas <georgios.pinitas@arm.com> 2021-03-29 19:48:22 +0000
commit 702dc0c71f2b2830b63e3b4079ede0ef76377f0a (patch)
tree afb0dacd74a8650350802aea8043822503c2f8b2 /src/core/gpu/cl/kernels/ClDirectConvolutionKernel.cpp
parent 26c5c0fc10cbee1b523af0b27f884719dc50820a (diff)
download ComputeLibrary-702dc0c71f2b2830b63e3b4079ede0ef76377f0a.tar.gz
Remove usage of valid window region CL - NHWC
Resolves: COMPMID-4153
Change-Id: Ib0d60c9acaac8aaf3946c62fc2d740b5ec6cee5c
Signed-off-by: Michalis Spyrou <michalis.spyrou@arm.com>
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/5301
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Michele Di Giorgio <michele.digiorgio@arm.com>
Reviewed-by: Georgios Pinitas <georgios.pinitas@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/core/gpu/cl/kernels/ClDirectConvolutionKernel.cpp')
-rw-r--r-- src/core/gpu/cl/kernels/ClDirectConvolutionKernel.cpp 11
1 files changed, 4 insertions, 7 deletions
diff --git a/src/core/gpu/cl/kernels/ClDirectConvolutionKernel.cpp b/src/core/gpu/cl/kernels/ClDirectConvolutionKernel.cpp
index 72801fa6c8..c6ca084386 100644
--- a/src/core/gpu/cl/kernels/ClDirectConvolutionKernel.cpp
+++ b/src/core/gpu/cl/kernels/ClDirectConvolutionKernel.cpp
@@ -279,11 +279,8 @@ std::pair<Status, Window> validate_and_configure_window(ITensorInfo *src, ITenso
const unsigned int num_rows = dst->tensor_shape()[0] > 16 ? 2u : 1U;
// Create window and update padding
- Window win = calculate_max_window(*dst, Steps(vec_size, num_rows));
- dst->set_valid_region(ValidRegion(Coordinates(), dst->tensor_shape()));
-
- Status err = Status{};
- return std::make_pair(err, win);
+ Window win = calculate_max_window(output_shape, Steps(vec_size, num_rows));
+ return std::make_pair(Status{}, win);
}
else if(data_layout == DataLayout::NCHW)
{
@@ -368,8 +365,8 @@ void ClDirectConvolutionKernel::configure(const CLCompileContext &compile_contex
kernel_name << "direct_convolution_nhwc";
- const unsigned int n0 = win_config.second.x().step();
- const unsigned int m0 = win_config.second.y().step();
+ const unsigned int n0 = win_config.second.x().step();
+ const unsigned int m0 = win_config.second.y().step();
const unsigned int k0 = adjust_vec_size(8u, src->dimension(channel_idx));
const unsigned int partial_store_n0 = dst->dimension(channel_idx) % n0;