From f5aad5166e430819ce8592e0e322d084c4b69d91 Mon Sep 17 00:00:00 2001 From: Gian Marco Iodice Date: Mon, 8 Feb 2021 17:34:40 +0000 Subject: Report WBSM feature support in the documentation This extension of the OpenCL tuner is still in experimental phase and allows to control the size of batches of workgroups distributed to compute units Resolves COMPMID-3938 Change-Id: I8e55db6877717ef5d50bc7eee24b248b5a2f9414 Signed-off-by: Gian Marco Iodice Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/5027 Reviewed-by: Giorgio Arena Comments-Addressed: Arm Jenkins Tested-by: Arm Jenkins --- arm_compute/runtime/CL/CLTunerTypes.h | 2 +- docs/00_introduction.dox | 2 ++ 2 files changed, 3 insertions(+), 1 deletion(-) diff --git a/arm_compute/runtime/CL/CLTunerTypes.h b/arm_compute/runtime/CL/CLTunerTypes.h index e93ef5b2b3..508cafac95 100644 --- a/arm_compute/runtime/CL/CLTunerTypes.h +++ b/arm_compute/runtime/CL/CLTunerTypes.h @@ -45,7 +45,7 @@ struct CLTuningInfo CLTunerMode tuner_mode = CLTunerMode::NORMAL; /**< Parameter to select the level (granularity) of the tuning */ bool tune_wbsm = false; /**< Flag to tune the batches of work groups distributed to compute units. Internally, the library will check if this feature is available on - the target platform */ + the target platform. 
This OpenCL tuner extension is still in an experimental phase */ }; /** Converts a string to a strong types enumeration @ref CLTunerMode diff --git a/docs/00_introduction.dox b/docs/00_introduction.dox index 2f239960c3..4c1112f2d1 100644 --- a/docs/00_introduction.dox +++ b/docs/00_introduction.dox @@ -123,6 +123,8 @@ v21.02 Public major release - NEGEMMMatrixVectorMultiplyKernel - NELocallyConnectedMatrixMultiplyKernel / CLLocallyConnectedMatrixMultiplyKernel - NEUpsampleLayerKernel / CLUpsampleLayerKernel + - Extend OpenCL tuner with workgroup batch size support + - Experimental extension for the OpenCL tuner to tune the batches of work groups distributed to compute units v20.11 Public major release - Various bug fixes. -- cgit v1.2.1