From 81b28c423cf864727df0199f3c66837ed3c436ef Mon Sep 17 00:00:00 2001
From: Gian Marco Iodice
Date: Thu, 29 Mar 2018 10:29:36 +0100
Subject: COMPMID-1032 - Fixing bug in CLGEMM when is_interleaved_transposed=true

The bug concerned the collapse of the window in CLGEMMMatrixMultiplyKernel

Change-Id: I5043bf37b72eeb615ebe7fb3f2c8e72d006bf341
Reviewed-on: https://eu-gerrit-1.euhpc.arm.com/126262
Tested-by: Jenkins
Reviewed-by: Anthony Barbier
---
 src/core/CL/cl_kernels/gemm.cl | 3 +++
 1 file changed, 3 insertions(+)

(limited to 'src/core/CL/cl_kernels')

diff --git a/src/core/CL/cl_kernels/gemm.cl b/src/core/CL/cl_kernels/gemm.cl
index a5b0acbe9c..00b130f5a9 100644
--- a/src/core/CL/cl_kernels/gemm.cl
+++ b/src/core/CL/cl_kernels/gemm.cl
@@ -1851,6 +1851,9 @@ __kernel void gemm_mm_qs16(IMAGE_DECLARATION(src0),
     // Compute dst address
     __global uchar *dst_addr = offset(&dst, 0, 0);
 
+    // Add offset for batched GEMM
+    dst_addr += get_global_id(2) * dst_stride_z;
+
     // Multiply by the weight of matrix product and store the result
     short8 acc_qs16;
     acc_qs16 = convert_short8_sat(acc0);
-- 
cgit v1.2.1