APPBROWSER-298, APPBROWSER-306: Reimplement the common code of compute shader

The new common code of compute shader is in file helpers_cs.h Rewrite the direct_convolution1x1.cs and softmax_layer.cs to use the new common code. It will also remove the dependence of the token pasting operator (##). We'll remove the "##" support after we rewrite all of the compute shader code. Change-Id: Icd8553ef6b61ad484a8507590ac8ed499bd47061 Reviewed-on: http://mpd-gerrit.cambridge.arm.com/95455 Tested-by: Kaizen <jeremy.johnson+kaizengerrit@arm.com> Reviewed-by: Georgios Pinitas <georgios.pinitas@arm.com> Reviewed-by: Frank Lei <frank.lei@arm.com> (cherry picked from commit 0a4f83570d261f839d9866b68979efe8d7a95883) Reviewed-on: http://mpd-gerrit.cambridge.arm.com/95601 Reviewed-by: Jim He <jim.he@arm.com>
author: Joel Liang <joel.liang@arm.com> 2017-11-10 09:59:19 +0800
committer: Anthony Barbier <anthony.barbier@arm.com> 2018-11-02 16:35:24 +0000
commit: f1f3ebd517089e934cf3f06e64d90619a395ad87 (patch)
tree: 8dac05909b5f522a1c78e0ac4423cb6f65254391 /src/core/GLES_COMPUTE/IGCKernel.cpp
parent: 283c1790da45ab562ecfb2aa7741297191886d85 (diff)
download: ComputeLibrary-f1f3ebd517089e934cf3f06e64d90619a395ad87.tar.gz
1 files changed, 14 insertions, 5 deletions
diff --git a/src/core/GLES_COMPUTE/IGCKernel.cpp b/src/core/GLES_COMPUTE/IGCKernel.cpp
index 154a2c0c66..d6ad6c47d9 100644
--- a/src/core/GLES_COMPUTE/IGCKernel.cpp
+++ b/src/core/GLES_COMPUTE/IGCKernel.cpp
@@ -74,7 +74,8 @@ GCKernel &IGCKernel::kernel()
 template <unsigned int dimension_size>
 unsigned int           IGCKernel::num_arguments_per_tensor() const
 {
-    return 2 + 2 * dimension_size;
+    // Rounding up the tensor attributes structure in compute shader to a multiple of a vec4
+    return ceil_to_multiple(1 + 2 * dimension_size, 4);
 }
 
 template <unsigned int dimension_size>
@@ -97,12 +98,20 @@ void IGCKernel::add_tensor_argument(unsigned int &idx, const IGCTensor *tensor,
 
     for(unsigned int dimension = 0; dimension < dimension_size; dimension++)
     {
-        _kernel.set_params(idx++, strides[dimension]);
-        _kernel.set_params(idx++, strides[dimension] * window[dimension].step());
+        _kernel.set_argument(idx++, strides[dimension]);
+        _kernel.set_argument(idx++, strides[dimension] * window[dimension].step());
     }
 
-    _kernel.set_params(idx++, offset_first_element);
-    _kernel.set_params(idx++, param.buffer_data_type_shift);
+    _kernel.set_argument(idx++, offset_first_element);
+    _kernel.set_argument(idx++, param.buffer_data_type_shift);
+
+    // Rounding up the tensor attributes structure in compute shader to a multiple of a vec4
+    unsigned int idx_end = ceil_to_multiple(idx, 4);
+    for(unsigned int i = idx; i < idx_end; ++i)
+    {
+        _kernel.set_argument(i, 0);
+    }
+    idx = idx_end;
 
     ARM_COMPUTE_GL_CHECK(glBindBufferBase(GL_SHADER_STORAGE_BUFFER, param.binding_point, tensor->gc_buffer()));
author	Joel Liang <joel.liang@arm.com>	2017-11-10 09:59:19 +0800
committer	Anthony Barbier <anthony.barbier@arm.com>	2018-11-02 16:35:24 +0000
commit	f1f3ebd517089e934cf3f06e64d90619a395ad87 (patch)
tree	8dac05909b5f522a1c78e0ac4423cb6f65254391 /src/core/GLES_COMPUTE/IGCKernel.cpp
parent	283c1790da45ab562ecfb2aa7741297191886d85 (diff)
download	ComputeLibrary-f1f3ebd517089e934cf3f06e64d90619a395ad87.tar.gz