From 4bfc70e31766587c951204c93a127a486e007d0c Mon Sep 17 00:00:00 2001
From: Gunes Bayir
Date: Fri, 10 Dec 2021 16:17:56 +0000
Subject: Add Gemm MMUL Reshaped Only Rhs Support for FP32/FP16

This patch introduces a GEMM routine that is optimized for
Arm(R) Mali(TM)-G715 and Arm(R) Mali(TM)-G615

Resolves: COMPMID-5216
Signed-off-by: Gunes Bayir
Change-Id: I2e5d7806f5904347185bb3e250f73d73d6669dba
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/7914
Reviewed-by: SiCong Li
Tested-by: Arm Jenkins
Comments-Addressed: Arm Jenkins
Benchmark: Arm Jenkins
---
 src/gpu/cl/ClKernelLibrary.cpp | 6 ++++++
 1 file changed, 6 insertions(+)

(limited to 'src/gpu/cl/ClKernelLibrary.cpp')

diff --git a/src/gpu/cl/ClKernelLibrary.cpp b/src/gpu/cl/ClKernelLibrary.cpp
index 1bf7f2b3ac..52661d6d79 100644
--- a/src/gpu/cl/ClKernelLibrary.cpp
+++ b/src/gpu/cl/ClKernelLibrary.cpp
@@ -272,6 +272,8 @@ const std::map ClKernelLibrary::_kernel_program_map =
     { "gemm_mv", "common/gemv.cl" },
     { "gemm_mv_quantized", "common/gemv.cl" },
     { "gemm_mm_native", "common/gemm.cl" },
+    { "gemm_mm_reshaped_only_rhs_nt_mmul", "common/gemm_reshaped_only_rhs_mmul.cl" },
+    { "gemm_mm_reshaped_only_rhs_nt_mmul_texture", "common/gemm_reshaped_only_rhs_mmul.cl" },
     { "gemm_mm_native_post_act_eltwise_op_act", "common/experimental/gemm_fused_post_ops/act_eltwise_op_act/gemm_mm_native.cl" },
     { "gemm_mm_reshaped_lhs_nt_rhs_t", "common/gemm.cl" },
     { "gemm_mm_reshaped_lhs_nt_rhs_t_texture", "common/gemm.cl" },
@@ -582,6 +584,10 @@ const std::map ClKernelLibrary::_program_source_map =
     {
         "common/gemm.cl",
 #include "./cl_kernels/common/gemm.clembed"
+    },
+    {
+        "common/gemm_reshaped_only_rhs_mmul.cl",
+#include "./cl_kernels/common/gemm_reshaped_only_rhs_mmul.clembed"
     },
     {
         "common/gemm_utils.cl",
-- 
cgit v1.2.1