aboutsummaryrefslogtreecommitdiff
path: root/src/core/CL/cl_kernels/direct_convolution3x3.cl
diff options
context:
space:
mode:
Diffstat (limited to 'src/core/CL/cl_kernels/direct_convolution3x3.cl')
-rw-r--r-- src/core/CL/cl_kernels/direct_convolution3x3.cl 10
1 files changed, 5 insertions, 5 deletions
diff --git a/src/core/CL/cl_kernels/direct_convolution3x3.cl b/src/core/CL/cl_kernels/direct_convolution3x3.cl
index 4da7c39e26..28da544f89 100644
--- a/src/core/CL/cl_kernels/direct_convolution3x3.cl
+++ b/src/core/CL/cl_kernels/direct_convolution3x3.cl
@@ -50,8 +50,8 @@ MULQ_SAT_IMPL(qs32x8, qs32x8)
#define CONVOLUTION1x3_STRIDE1(acc, src_row_ptr, weights_row_ptr) \
({ \
- VEC_DATA_TYPE(DATA_TYPE, 4) \
- weights_values0 = vload4(0, weights_row_ptr); \
+ VEC_DATA_TYPE(DATA_TYPE, 3) \
+ weights_values0 = vload3(0, weights_row_ptr); \
VEC_DATA_TYPE(DATA_TYPE, 8) \
src0 = vload8(0, src_row_ptr); \
VEC_DATA_TYPE(DATA_TYPE, 2) \
@@ -64,8 +64,8 @@ MULQ_SAT_IMPL(qs32x8, qs32x8)
#define CONVOLUTION1x3_STRIDE2(acc, src_row_ptr, weights_row_ptr) \
({ \
- VEC_DATA_TYPE(DATA_TYPE, 4) \
- weights_values0 = vload4(0, weights_row_ptr); \
+ VEC_DATA_TYPE(DATA_TYPE, 3) \
+ weights_values0 = vload3(0, weights_row_ptr); \
VEC_DATA_TYPE(DATA_TYPE, 16) \
src0 = vload16(0, src_row_ptr); \
DATA_TYPE src1 = *(src_row_ptr + 16); \
@@ -152,4 +152,4 @@ __kernel void direct_convolution3x3(
vstore8(CONVERT_SAT(pixels0, VEC_DATA_TYPE(DATA_TYPE, 8)), 0, (__global DATA_TYPE *)dst.ptr);
}
-#endif // defined(DATA_TYPE) && defined(STRIDE_X) && defined(WEIGHTS_DEPTH)
\ No newline at end of file
+#endif // defined(DATA_TYPE) && defined(STRIDE_X) && defined(WEIGHTS_DEPTH)