aboutsummaryrefslogtreecommitdiff
path: root/src/core/CL/cl_kernels/gemm.cl
diff options
context:
space:
mode:
author: Gian Marco Iodice <gianmarco.iodice@arm.com> 2018-03-29 10:29:36 +0100
committer: Anthony Barbier <anthony.barbier@arm.com> 2018-11-02 16:49:16 +0000
commit: 81b28c423cf864727df0199f3c66837ed3c436ef (patch)
tree: eb8a63f31a357cf962be6bc1cffde47e6d37c7f1 /src/core/CL/cl_kernels/gemm.cl
parent: 61b4fca1dc3102a97087fb0d2d99fd4a3d8fd575 (diff)
download: ComputeLibrary-81b28c423cf864727df0199f3c66837ed3c436ef.tar.gz
COMPMID-1032 - Fixing bug in CLGEMM when is_interleaved_transposed=true
The bug concerned the collapse of the window in CLGEMMMatrixMultiplyKernel.
Change-Id: I5043bf37b72eeb615ebe7fb3f2c8e72d006bf341
Reviewed-on: https://eu-gerrit-1.euhpc.arm.com/126262
Tested-by: Jenkins <bsgcomp@arm.com>
Reviewed-by: Anthony Barbier <anthony.barbier@arm.com>
Diffstat (limited to 'src/core/CL/cl_kernels/gemm.cl')
-rw-r--r-- src/core/CL/cl_kernels/gemm.cl | 3
1 files changed, 3 insertions, 0 deletions
diff --git a/src/core/CL/cl_kernels/gemm.cl b/src/core/CL/cl_kernels/gemm.cl
index a5b0acbe9c..00b130f5a9 100644
--- a/src/core/CL/cl_kernels/gemm.cl
+++ b/src/core/CL/cl_kernels/gemm.cl
@@ -1851,6 +1851,9 @@ __kernel void gemm_mm_qs16(IMAGE_DECLARATION(src0),
// Compute dst address
__global uchar *dst_addr = offset(&dst, 0, 0);
+ // Add offset for batched GEMM
+ dst_addr += get_global_id(2) * dst_stride_z;
+
// Multiply by the weight of matrix product and store the result
short8 acc_qs16;
acc_qs16 = convert_short8_sat(acc0);