aboutsummaryrefslogtreecommitdiff
path: root/arm_compute/core/GLES_COMPUTE
diff options
context:
space:
mode:
authorsteli01 <stephen.li@arm.com>2018-01-02 14:56:06 +0800
committerAnthony Barbier <anthony.barbier@arm.com>2018-11-02 16:42:33 +0000
commitd064389293e4a71781984b2b24f3d44964812949 (patch)
tree7a74f8351d0b255ad9e25bd5b364654b9f0dc74d /arm_compute/core/GLES_COMPUTE
parent1d08a310b7316f2b731e60ac36dc68989d15b546 (diff)
downloadComputeLibrary-d064389293e4a71781984b2b24f3d44964812949.tar.gz
APPBROWSER-357: Fix Transpose performance issue by tuning lws
Change-Id: Ia71435f6e5c5610e2b76d6d4eb61a8847ca42305 Reviewed-on: https://eu-gerrit-1.euhpc.arm.com/114829 Reviewed-by: Pablo Tello <pablo.tello@arm.com> Reviewed-by: Gian Marco Iodice <gianmarco.iodice@arm.com> Tested-by: Anthony Barbier <anthony.barbier@arm.com>
Diffstat (limited to 'arm_compute/core/GLES_COMPUTE')
-rw-r--r--arm_compute/core/GLES_COMPUTE/IGCKernel.h14
1 files changed, 13 insertions, 1 deletions
diff --git a/arm_compute/core/GLES_COMPUTE/IGCKernel.h b/arm_compute/core/GLES_COMPUTE/IGCKernel.h
index 11b2b17e51..ee1e166424 100644
--- a/arm_compute/core/GLES_COMPUTE/IGCKernel.h
+++ b/arm_compute/core/GLES_COMPUTE/IGCKernel.h
@@ -140,6 +140,17 @@ public:
*/
virtual void run(const Window &window) = 0;
+ /** Set the Local-Workgroup-Size hint
+ *
+ * @note This method should be called after the configuration of the kernel
+ *
+ * @param[in] lws_hint Local-Workgroup-Size to use. The value is copied into the kernel, so const objects and temporaries are accepted.
+ */
+ void set_lws_hint(const gles::NDRange &lws_hint)
+ {
+ _lws_hint = lws_hint;
+ }
+
private:
/** Add the passed tensor's parameters to the object's kernel's arguments starting from the index idx.
*
@@ -159,7 +170,8 @@ private:
unsigned int num_arguments_per_tensor() const;
protected:
- GCKernel _kernel; /**< GLES kernel to run */
+ GCKernel _kernel; /**< GLES kernel to run */
+ gles::NDRange _lws_hint; /**< Local workgroup size hint for the GLES kernel */
};
/** Add the kernel to the command queue with the given window.