aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
author: Gian Marco Iodice <gianmarco.iodice@arm.com> 2020-05-06 11:27:08 +0100
committer: Gian Marco Iodice <gianmarco.iodice@arm.com> 2020-05-06 15:36:33 +0000
commit: 2cfd3f754ec707c25f129c0026686035a0dcfc54 (patch)
tree: 2a25167f0a55cce182c93117920d5ea1b7cc6c06
parent: 36a551f32c69dfa4583395eca607afe7fcf40f75 (diff)
download: ComputeLibrary-2cfd3f754ec707c25f129c0026686035a0dcfc54.tar.gz
COMPMID-3459: Update the heuristic for GEMV for F16 on Mali-G77
Change-Id: I10020cd5c88ec1926087531c4c4ce0a1cfaf43c9
Signed-off-by: Gian Marco Iodice <gianmarco.iodice@arm.com>
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/3151
Reviewed-by: Georgios Pinitas <georgios.pinitas@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
-rw-r--r-- src/core/CL/gemm/reshaped_only_rhs/CLGEMMReshapedOnlyRHSKernelConfigurationValhall.cpp | 14
1 files changed, 11 insertions, 3 deletions
diff --git a/src/core/CL/gemm/reshaped_only_rhs/CLGEMMReshapedOnlyRHSKernelConfigurationValhall.cpp b/src/core/CL/gemm/reshaped_only_rhs/CLGEMMReshapedOnlyRHSKernelConfigurationValhall.cpp
index 5526616001..d93a912c0d 100644
--- a/src/core/CL/gemm/reshaped_only_rhs/CLGEMMReshapedOnlyRHSKernelConfigurationValhall.cpp
+++ b/src/core/CL/gemm/reshaped_only_rhs/CLGEMMReshapedOnlyRHSKernelConfigurationValhall.cpp
@@ -109,13 +109,21 @@ std::pair<GEMMLHSMatrixInfo, GEMMRHSMatrixInfo> CLGEMMReshapedOnlyRHSKernelConfi
if(m == 1)
{
- const int h0 = std::max(std::min(static_cast<int>(n / 4), static_cast<int>(256)), static_cast<int>(1));
- return configure_lhs_rhs_info(m, n, 1, 4, 4, 1, h0, false, true, false, true);
+ if(n > 2048)
+ {
+ const unsigned int h0 = std::max(n / 4, 1U);
+ return configure_lhs_rhs_info(m, n, 1, 4, 4, 1, h0, false, true, false, true);
+ }
+ else
+ {
+ const unsigned int h0 = std::max(n / 2, 1U);
+ return configure_lhs_rhs_info(m, n, 1, 2, 8, 1, h0, false, true, false, true);
+ }
}
else if (m < 128)
{
const int h0 = std::max(std::min(static_cast<int>(n / 4), static_cast<int>(256)), static_cast<int>(1));
- if(k > 512)
+ if(k >= 512)
{
return configure_lhs_rhs_info(m, n, 2, 4, 16, 1, h0, false, true, false, false);
}