diff options
author | Giorgio Arena <giorgio.arena@arm.com> | 2021-09-08 12:26:27 +0100 |
---|---|---|
committer | Giorgio Arena <giorgio.arena@arm.com> | 2021-09-08 13:05:24 +0000 |
commit | 88bd35d68575aca77ab6c44c50bed8f94212b729 (patch) | |
tree | 56bc844e2cebf077955bfce7fa5fbe5e383d167e /src/core/CL/cl_kernels/helpers.h | |
parent | bde2f3536a33e1d018d03c266cc9cd557f50e3e8 (diff) | |
download | ComputeLibrary-88bd35d68575aca77ab6c44c50bed8f94212b729.tar.gz |
Fix vload_partial macros on OpenCL
When calling vload_partial, the macros were overriding the first values with a hidden double assignment
Resolve COMPMID-4792
Signed-off-by: Giorgio Arena <giorgio.arena@arm.com>
Change-Id: I96bca60ae546fc34a71e69d5c471581a472d8ddf
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/6231
Reviewed-by: Gian Marco Iodice <gianmarco.iodice@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/core/CL/cl_kernels/helpers.h')
-rw-r--r-- | src/core/CL/cl_kernels/helpers.h | 60 |
1 files changed, 30 insertions, 30 deletions
diff --git a/src/core/CL/cl_kernels/helpers.h b/src/core/CL/cl_kernels/helpers.h index fae15b2347..88a7665eeb 100644 --- a/src/core/CL/cl_kernels/helpers.h +++ b/src/core/CL/cl_kernels/helpers.h @@ -362,48 +362,48 @@ #define vload_partial_4(DATA, OFFSET, PTR) \ DATA.s0123 = vload4(OFFSET, PTR); -#define vload_partial_5(DATA, OFFSET, PTR) \ - DATA.s0123 = vload_partial_4(DATA, OFFSET, PTR); \ - DATA.s4 = vload1(OFFSET, PTR + 4); +#define vload_partial_5(DATA, OFFSET, PTR) \ + vload_partial_4(DATA.s0123, OFFSET, PTR); \ + DATA.s4 = vload1(OFFSET, PTR + 4); -#define vload_partial_6(DATA, OFFSET, PTR) \ - DATA.s0123 = vload_partial_4(DATA, OFFSET, PTR); \ - DATA.s45 = vload_partial_2(DATA, OFFSET, PTR + 4); +#define vload_partial_6(DATA, OFFSET, PTR) \ + vload_partial_4(DATA.s0123, OFFSET, PTR); \ + vload_partial_2(DATA.s45, OFFSET, PTR + 4); -#define vload_partial_7(DATA, OFFSET, PTR) \ - DATA.s0123 = vload_partial_4(DATA, OFFSET, PTR); \ - DATA.s456 = vload_partial_3(DATA, OFFSET, PTR + 4); +#define vload_partial_7(DATA, OFFSET, PTR) \ + vload_partial_4(DATA.s0123, OFFSET, PTR); \ + vload_partial_3(DATA.s456, OFFSET, PTR + 4); #define vload_partial_8(DATA, OFFSET, PTR) \ DATA.s01234567 = vload8(OFFSET, PTR); -#define vload_partial_9(DATA, OFFSET, PTR) \ - DATA.s01234567 = vload_partial_8(DATA, OFFSET, PTR); \ - DATA.s8 = vload1(OFFSET, PTR + 8); +#define vload_partial_9(DATA, OFFSET, PTR) \ + vload_partial_8(DATA.s01234567, OFFSET, PTR); \ + DATA.s8 = vload1(OFFSET, PTR + 8); -#define vload_partial_10(DATA, OFFSET, PTR) \ - DATA.s01234567 = vload_partial_8(DATA, OFFSET, PTR); \ - DATA.s89 = vload_partial_2(DATA, OFFSET, PTR + 8); +#define vload_partial_10(DATA, OFFSET, PTR) \ + vload_partial_8(DATA.s01234567, OFFSET, PTR); \ + vload_partial_2(DATA.s89, OFFSET, PTR + 8); -#define vload_partial_11(DATA, OFFSET, PTR) \ - DATA.s01234567 = vload_partial_8(DATA, OFFSET, PTR); \ - DATA.s89A = vload_partial_3(DATA, OFFSET, PTR + 8); +#define vload_partial_11(DATA, OFFSET, PTR) \ + vload_partial_8(DATA.s01234567, OFFSET, PTR); \ + vload_partial_3(DATA.s89A, OFFSET, PTR + 8); -#define vload_partial_12(DATA, OFFSET, PTR) \ - DATA.s01234567 = vload_partial_8(DATA, OFFSET, PTR); \ - DATA.s89AB = vload_partial_4(DATA, OFFSET, PTR + 8); +#define vload_partial_12(DATA, OFFSET, PTR) \ + vload_partial_8(DATA.s01234567, OFFSET, PTR); \ + vload_partial_4(DATA.s89AB, OFFSET, PTR + 8); -#define vload_partial_13(DATA, OFFSET, PTR) \ - DATA.s01234567 = vload_partial_8(DATA, OFFSET, PTR); \ - DATA.s89ABC = vload_partial_5(DATA, OFFSET, PTR + 8); +#define vload_partial_13(DATA, OFFSET, PTR) \ + vload_partial_8(DATA.s01234567, OFFSET, PTR); \ + vload_partial_5(DATA.s89ABC, OFFSET, PTR + 8); -#define vload_partial_14(DATA, OFFSET, PTR) \ - DATA.s01234567 = vload_partial_8(DATA, OFFSET, PTR); \ - DATA.s89ABCD = vload_partial_6(DATA, OFFSET, PTR + 8); +#define vload_partial_14(DATA, OFFSET, PTR) \ + vload_partial_8(DATA.s01234567, OFFSET, PTR); \ + vload_partial_6(DATA.s89ABCD, OFFSET, PTR + 8); -#define vload_partial_15(DATA, OFFSET, PTR) \ - DATA.s01234567 = vload_partial_8(DATA, OFFSET, PTR); \ - DATA.s89ABCDE = vload_partial_7(DATA, OFFSET, PTR + 8); +#define vload_partial_15(DATA, OFFSET, PTR) \ + vload_partial_8(DATA.s01234567, OFFSET, PTR); \ + vload_partial_7(DATA.s89ABCDE, OFFSET, PTR + 8); #define vload_partial_16(DATA, OFFSET, PTR) \ DATA = vload16(OFFSET, PTR); |