aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
author Gian Marco Iodice <gianmarco.iodice@arm.com> 2021-02-08 17:34:40 +0000
committer Sheri Zhang <sheri.zhang@arm.com> 2021-02-09 10:52:25 +0000
commit f5aad5166e430819ce8592e0e322d084c4b69d91 (patch)
tree 42b7dee51fffa922fba7f6e55b5ad7fc626dc5df
parent 70858d8eb178532b0e728e6a7d09a77d27605020 (diff)
download ComputeLibrary-f5aad5166e430819ce8592e0e322d084c4b69d91.tar.gz
Report WBSM feature support in the documentation
This extension of the OpenCL tuner is still in an experimental phase and allows controlling the size of the batches of workgroups distributed to compute units. Resolves COMPMID-3938 Change-Id: I8e55db6877717ef5d50bc7eee24b248b5a2f9414 Signed-off-by: Gian Marco Iodice <gianmarco.iodice@arm.com> Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/5027 Reviewed-by: Giorgio Arena <giorgio.arena@arm.com> Comments-Addressed: Arm Jenkins <bsgcomp@arm.com> Tested-by: Arm Jenkins <bsgcomp@arm.com>
-rw-r--r-- arm_compute/runtime/CL/CLTunerTypes.h 2
-rw-r--r-- docs/00_introduction.dox 2
2 files changed, 3 insertions, 1 deletions
diff --git a/arm_compute/runtime/CL/CLTunerTypes.h b/arm_compute/runtime/CL/CLTunerTypes.h
index e93ef5b2b3..508cafac95 100644
--- a/arm_compute/runtime/CL/CLTunerTypes.h
+++ b/arm_compute/runtime/CL/CLTunerTypes.h
@@ -45,7 +45,7 @@ struct CLTuningInfo
CLTunerMode tuner_mode = CLTunerMode::NORMAL; /**< Parameter to select the level (granularity) of the tuning */
bool tune_wbsm = false; /**< Flag to tune the batches of work groups distributed to compute units.
Internally, the library will check if this feature is available on
- the target platform */
+ the target platform. This OpenCL tuner extension is still in an experimental phase */
};
/** Converts a string to a strong types enumeration @ref CLTunerMode
diff --git a/docs/00_introduction.dox b/docs/00_introduction.dox
index 2f239960c3..4c1112f2d1 100644
--- a/docs/00_introduction.dox
+++ b/docs/00_introduction.dox
@@ -123,6 +123,8 @@ v21.02 Public major release
- NEGEMMMatrixVectorMultiplyKernel
- NELocallyConnectedMatrixMultiplyKernel / CLLocallyConnectedMatrixMultiplyKernel
- NEUpsampleLayerKernel / CLUpsampleLayerKernel
+ - Extend OpenCL tuner with workgroup batch size support
+ - Experimental extension for the OpenCL tuner to tune the batches of work groups distributed to compute units
v20.11 Public major release
- Various bug fixes.