about | summary | refs | log | tree | commit | diff
path: root/src/core/CL/cl_kernels/depthwise_convolution_quantized.cl
diff options
context:
space:
mode:
author Giorgio Arena <giorgio.arena@arm.com> 2018-04-23 12:01:33 +0100
committer Anthony Barbier <anthony.barbier@arm.com> 2018-11-02 16:49:39 +0000
commit fda901f0485371e8b6a807c8dd9614560a924793 (patch)
tree d41f01633fb3d7ecb39472d1c897f9ff1bfb84bd /src/core/CL/cl_kernels/depthwise_convolution_quantized.cl
parent f485a100e3f11911d25a16b4ccc286c6c0816061 (diff)
download ComputeLibrary-fda901f0485371e8b6a807c8dd9614560a924793.tar.gz
COMPMID-1078 Fix CL DepthwiseConvolutionLayer QASYMM8 failing validation
Change-Id: Id540490e5faf11c466ff039a20880eeedd6e5ec7
Reviewed-on: https://eu-gerrit-1.euhpc.arm.com/128612
Tested-by: Jenkins <bsgcomp@arm.com>
Reviewed-by: Michalis Spyrou <michalis.spyrou@arm.com>
Reviewed-by: Isabella Gottardi <isabella.gottardi@arm.com>
Diffstat (limited to 'src/core/CL/cl_kernels/depthwise_convolution_quantized.cl')
-rw-r--r-- src/core/CL/cl_kernels/depthwise_convolution_quantized.cl 5
1 files changed, 2 insertions, 3 deletions
diff --git a/src/core/CL/cl_kernels/depthwise_convolution_quantized.cl b/src/core/CL/cl_kernels/depthwise_convolution_quantized.cl
index 635bc9d50b..a0c0a8b1fb 100644
--- a/src/core/CL/cl_kernels/depthwise_convolution_quantized.cl
+++ b/src/core/CL/cl_kernels/depthwise_convolution_quantized.cl
@@ -333,7 +333,7 @@ __kernel void depthwise_convolution_3x3_quantized_nhwc_stride1(
const int src_offs2 = src_offs1 + src_stride_z;
const int cond_top = z - CONV_PAD_TOP < 0;
- const int cond_bottom = z * (src_step_z / src_stride_z) + 2 >= SRC_DEPTH;
+ const int cond_bottom = z * (src_step_z / src_stride_z) + 2 > SRC_DEPTH;
__global uchar *src_addr0 = first_elem + select(src_offs0, pad_offs, cond_top);
__global uchar *src_addr1 = first_elem + src_offs1;
@@ -580,8 +580,7 @@ __kernel void depthwise_convolution_3x3_quantized_nhwc_stride2(
const int src_offs2 = src_offs1 + src_stride_z;
const int cond_top = z - CONV_PAD_TOP < 0;
- const int cond_bottom = z * (src_step_z / src_stride_z) + 2 >= SRC_DEPTH;
- ;
+ const int cond_bottom = z * (src_step_z / src_stride_z) + 2 > SRC_DEPTH;
__global uchar *src_addr0 = first_elem + select(src_offs0, pad_offs, cond_top);
__global uchar *src_addr1 = first_elem + src_offs1;