aboutsummaryrefslogtreecommitdiff
path: root/src/gpu/cl/ClKernelLibrary.cpp
diff options
context:
space:
mode:
author: Freddie Liardet <frederick.liardet@arm.com> 2022-05-16 14:09:10 +0100
committer: Gunes Bayir <gunes.bayir@arm.com> 2022-07-22 10:18:41 +0000
commit: e572dff7adc334a98ac4a0326d66037451d5d079 (patch)
tree: 9c4db3d743078de9bda67dfed674e3f371a4e238 /src/gpu/cl/ClKernelLibrary.cpp
parent: e87120731ca65c54b082734af07f748ac9651427 (diff)
download: ComputeLibrary-e572dff7adc334a98ac4a0326d66037451d5d079.tar.gz
Add GemmLowp MMUL Reshaped Only Rhs Support for QASYMM8/QASYMM8_SIGNED
This patch introduces a GEMMLowp routine that is optimized for Arm(R) Mali(TM)-G715 and Arm(R) Mali(TM)-G615

Resolves: COMPMID-5398

Signed-off-by: Freddie Liardet <frederick.liardet@arm.com>
Signed-off-by: Gunes Bayir <gunes.bayir@arm.com>
Change-Id: I8d06453645688f3658b6c7c06f1ebc25a2505661
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/7932
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: SiCong Li <sicong.li@arm.com>
Reviewed-by: Pablo Marquez Tello <pablo.tello@arm.com>
Benchmark: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/gpu/cl/ClKernelLibrary.cpp')
-rw-r--r-- src/gpu/cl/ClKernelLibrary.cpp 5
1 files changed, 5 insertions, 0 deletions
diff --git a/src/gpu/cl/ClKernelLibrary.cpp b/src/gpu/cl/ClKernelLibrary.cpp
index 52661d6d79..0f08f5d044 100644
--- a/src/gpu/cl/ClKernelLibrary.cpp
+++ b/src/gpu/cl/ClKernelLibrary.cpp
@@ -303,6 +303,7 @@ const std::map<std::string, std::string> ClKernelLibrary::_kernel_program_map =
{ "gemmlowp_mm_reshaped_lhs_nt_rhs_t", "common/gemmlowp.cl" },
{ "gemmlowp_mm_reshaped_only_rhs_t", "common/gemmlowp.cl" },
{ "gemmlowp_mm_reshaped_only_rhs_t_fused_output_stage_fixedpoint", "common/gemmlowp.cl" },
+ { "gemmlowp_mm_reshaped_only_rhs_mmul", "common/gemmlowp_reshaped_only_rhs_mmul.cl" },
{ "gemmlowp_offset_contribution", "common/gemmlowp.cl" },
{ "gemmlowp_offset_contribution_quantize_down", "common/gemmlowp.cl" },
{ "gemmlowp_offset_contribution_quantize_down_fixedpoint", "common/gemmlowp.cl" },
@@ -618,6 +619,10 @@ const std::map<std::string, std::string> ClKernelLibrary::_program_source_map =
#include "./cl_kernels/common/gemmlowp.clembed"
},
{
+ "common/gemmlowp_reshaped_only_rhs_mmul.cl",
+#include "./cl_kernels/common/gemmlowp_reshaped_only_rhs_mmul.clembed"
+ },
+ {
"common/gemv.cl",
#include "./cl_kernels/common/gemv.clembed"
},