aboutsummaryrefslogtreecommitdiff
path: root/src/core/CL/cl_kernels/helpers.h
diff options
context:
space:
mode:
author Adnan AlSinan <adnan.alsinan@arm.com> 2021-12-10 12:34:02 +0000
committer SiCong Li <sicong.li@arm.com> 2021-12-23 17:01:14 +0000
commit 3e155a52f19db046f83e30c25182460b00d108c7 (patch)
tree f3ec747af21c8ee7b95d6dc88bf6ea4b4aa44659 /src/core/CL/cl_kernels/helpers.h
parent f76a502a73ca628e2a2556abeaa60ed17bb68d97 (diff)
download ComputeLibrary-3e155a52f19db046f83e30c25182460b00d108c7.tar.gz
Rework gemm_reshape_lhs_ with new macros
Resolves COMPMID-4892
Signed-off-by: Adnan AlSinan <adnan.alsinan@arm.com>
Change-Id: I52f23ca293506fc693ae829daccc6e889a050752
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/6833
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: SiCong Li <sicong.li@arm.com>
Reviewed-by: Giorgio Arena <giorgio.arena@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/core/CL/cl_kernels/helpers.h')
-rw-r--r-- src/core/CL/cl_kernels/helpers.h | 8
1 files changed, 4 insertions, 4 deletions
diff --git a/src/core/CL/cl_kernels/helpers.h b/src/core/CL/cl_kernels/helpers.h
index 88a7665eeb..bfb693e376 100644
--- a/src/core/CL/cl_kernels/helpers.h
+++ b/src/core/CL/cl_kernels/helpers.h
@@ -392,18 +392,18 @@
#define vload_partial_12(DATA, OFFSET, PTR) \
vload_partial_8(DATA.s01234567, OFFSET, PTR); \
vload_partial_4(DATA.s89AB, OFFSET, PTR + 8);
-
+// For vload_partial_{13,14,15}, an 8-element vector is passed, because vectors of size 5, 6 and 7 are not supported
#define vload_partial_13(DATA, OFFSET, PTR) \
vload_partial_8(DATA.s01234567, OFFSET, PTR); \
- vload_partial_5(DATA.s89ABC, OFFSET, PTR + 8);
+ vload_partial_5(DATA.s89ABCDEF, OFFSET, PTR + 8);
#define vload_partial_14(DATA, OFFSET, PTR) \
vload_partial_8(DATA.s01234567, OFFSET, PTR); \
- vload_partial_6(DATA.s89ABCD, OFFSET, PTR + 8);
+ vload_partial_6(DATA.s89ABCDEF, OFFSET, PTR + 8);
#define vload_partial_15(DATA, OFFSET, PTR) \
vload_partial_8(DATA.s01234567, OFFSET, PTR); \
- vload_partial_7(DATA.s89ABCDE, OFFSET, PTR + 8);
+ vload_partial_7(DATA.s89ABCDEF, OFFSET, PTR + 8);
#define vload_partial_16(DATA, OFFSET, PTR) \
DATA = vload16(OFFSET, PTR);