aboutsummaryrefslogtreecommitdiff
path: root/src/core/CL/cl_kernels/direct_convolution_1x1_3x3_5x5_quantized.cl
diff options
context:
space:
mode:
author: Georgios Pinitas <georgios.pinitas@arm.com> 2018-02-19 12:15:22 +0000
committer: Anthony Barbier <anthony.barbier@arm.com> 2018-11-02 16:47:18 +0000
commit: 3cfd237ec976d109989c530f5aa726d1e94963e9 (patch)
tree: 4eb36a7330b1646e077fd1cac7f6196cb3b5cac4 /src/core/CL/cl_kernels/direct_convolution_1x1_3x3_5x5_quantized.cl
parent: f6c572ce404c8ac99b0b00c65b757fbadab33dc1 (diff)
download: ComputeLibrary-3cfd237ec976d109989c530f5aa726d1e94963e9.tar.gz
COMPMID-938: OCLgrind: Mismatches in depthwise convolution on Bifrost
oclgrind reports invalid conversions when clamp is used. Removed the call to clamp in the CL kernel and replaced it with a saturating conversion (convert_sat).
Change-Id: I3cd9b87dc10c65d307fbf6eb0aec1b671fba6e97
Reviewed-on: https://eu-gerrit-1.euhpc.arm.com/121062
Tested-by: Jenkins <bsgcomp@arm.com>
Reviewed-by: Anthony Barbier <anthony.barbier@arm.com>
Diffstat (limited to 'src/core/CL/cl_kernels/direct_convolution_1x1_3x3_5x5_quantized.cl')
-rw-r--r-- src/core/CL/cl_kernels/direct_convolution_1x1_3x3_5x5_quantized.cl 3
1 file changed, 1 insertion, 2 deletions
diff --git a/src/core/CL/cl_kernels/direct_convolution_1x1_3x3_5x5_quantized.cl b/src/core/CL/cl_kernels/direct_convolution_1x1_3x3_5x5_quantized.cl
index 533bc75bcb..b58dc7af72 100644
--- a/src/core/CL/cl_kernels/direct_convolution_1x1_3x3_5x5_quantized.cl
+++ b/src/core/CL/cl_kernels/direct_convolution_1x1_3x3_5x5_quantized.cl
@@ -302,8 +302,7 @@ __kernel void output_stage_quantized(
vals = ASYMM_MULT_BY_QUANT_MULTIPLIER_LESS_THAN_ONE(vals, output_multiplier, output_shift, 16);
vals = vals + output_offset;
- vals = clamp(vals, 0, 255);
// Store result in dst
- vstore16(convert_uchar16(vals), 0, (__global uchar *)dst.ptr);
+ vstore16(convert_uchar16_sat(vals), 0, (__global uchar *)dst.ptr);
}