From 695ad6913563b5d910f9fca0f5e2822f083456b6 Mon Sep 17 00:00:00 2001 From: Giorgio Arena Date: Fri, 7 Feb 2020 10:28:45 +0000 Subject: COMPMID-2964 ~10-15% Regression of DeepSpeech v1 F16 on hikey960 on G71 (CL) ++performance on few other networks Change-Id: I2e1ec3f34543d43da649c3fb07f4a8e75d25a10b Signed-off-by: Giorgio Arena Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/2716 Reviewed-by: Georgios Pinitas Comments-Addressed: Arm Jenkins Tested-by: Arm Jenkins --- src/runtime/CL/functions/CLGEMM.cpp | 11 +++++++++-- 1 file changed, 9 insertions(+), 2 deletions(-) diff --git a/src/runtime/CL/functions/CLGEMM.cpp b/src/runtime/CL/functions/CLGEMM.cpp index 8d460142e5..fc56a0bd6b 100644 --- a/src/runtime/CL/functions/CLGEMM.cpp +++ b/src/runtime/CL/functions/CLGEMM.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2017-2019 ARM Limited. + * Copyright (c) 2017-2020 ARM Limited. * * SPDX-License-Identifier: MIT * @@ -109,7 +109,14 @@ CLGEMM::GEMMType CLGEMM::select_gemm_type(unsigned int m, unsigned int n, unsign { if((m == 1) || (!reshape_b_only_on_first_run)) { - gemm_type = GEMMType::RESHAPED_ONLY_RHS; + if((n > k) && gpu_target_is_in(gpu_target, GPUTarget::G71)) + { + gemm_type = GEMMType::NATIVE; + } + else + { + gemm_type = GEMMType::RESHAPED_ONLY_RHS; + } } else { -- cgit v1.2.1