diff options
author | Georgios Pinitas <georgios.pinitas@arm.com> | 2020-01-22 18:36:27 +0000 |
---|---|---|
committer | Georgios Pinitas <georgios.pinitas@arm.com> | 2020-01-31 11:36:14 +0000 |
commit | 94672fb2af6535adc6ea7fe8b8498580ad8cf3f4 (patch) | |
tree | 189c68e7ff2c29d7800e09239da6d9a6364d5b05 /src/core/NEON/kernels/arm_gemm/gemm_int8.cpp | |
parent | 6a342648ae50beb8457871862f14fc9baef6b74f (diff) | |
download | ComputeLibrary-94672fb2af6535adc6ea7fe8b8498580ad8cf3f4.tar.gz |
COMPMID-3003: Integrate assembly kernels utilizing the MMLA instruction.
MMLA is a matrix-multiply instruction introduced in Armv8.6-A.
Signed-off-by: Georgios Pinitas <georgios.pinitas@arm.com>
Change-Id: I572a54981d48f5a1e0e9e51102cb7ae28ad87806
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/2663
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Michalis Spyrou <michalis.spyrou@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/core/NEON/kernels/arm_gemm/gemm_int8.cpp')
-rw-r--r-- | src/core/NEON/kernels/arm_gemm/gemm_int8.cpp | 20 |
1 file changed, 20 insertions, 0 deletions
diff --git a/src/core/NEON/kernels/arm_gemm/gemm_int8.cpp b/src/core/NEON/kernels/arm_gemm/gemm_int8.cpp
index a3446b9ddc..f7d8f65aea 100644
--- a/src/core/NEON/kernels/arm_gemm/gemm_int8.cpp
+++ b/src/core/NEON/kernels/arm_gemm/gemm_int8.cpp
@@ -34,10 +34,12 @@
 #include "kernels/a64_gemm_s8_12x8.hpp"
 #include "kernels/a64_gemm_s8_4x4.hpp"
 #include "kernels/a64_hybrid_s8s32_dot_16x4.hpp"
+#include "kernels/a64_interleaved_s8s32_mmla_12x8.hpp"
 #include "kernels/a64_smallK_hybrid_s8s32_dot_4x6.hpp"
 #include "kernels/a64_smallK_hybrid_s8s32_dot_4x8.hpp"
 #include "kernels/sve_hybrid_s8s32_dot_4VLx4.hpp"
 #include "kernels/sve_interleaved_s8s32_dot_3VLx8.hpp"
+#include "kernels/sve_interleaved_s8s32_mmla_3VLx8.hpp"
 #include "kernels/sve_native_s8s32_dot_4VLx4.hpp"
 #include "kernels/sve_smallK_hybrid_s8s32_dot_1VLx8.hpp"
 
@@ -45,6 +47,15 @@ namespace arm_gemm {
 
 static const GemmImplementation<int8_t, int32_t> gemm_s8_methods[] = {
 #ifdef __ARM_FEATURE_SVE
+#ifdef V8P6
+{
+    GemmMethod::GEMM_INTERLEAVED,
+    "interleaved_s8s32_mmla_3VLx8",
+    [](const GemmArgs &args) { return (args._Ksize>8); },
+    nullptr,
+    [](const GemmArgs &args) { return new GemmInterleaved<interleaved_s8s32_mmla_3VLx8, int8_t, int32_t>(args); }
+},
+#endif
 {
     GemmMethod::GEMM_HYBRID,
     "smallK_hybrid_s8s32_dot_1VLx8",
@@ -74,6 +85,15 @@ static const GemmImplementation<int8_t, int32_t> gemm_s8_methods[] = {
     [](const GemmArgs &args) { return new GemmInterleaved<interleaved_s8s32_dot_3VLx8, int8_t, int32_t>(args); }
 },
 #endif
+#ifdef V8P6
+{
+    GemmMethod::GEMM_INTERLEAVED,
+    "interleaved_s8s32_mmla_12x8",
+    [](const GemmArgs &args) { return (args._Ksize>8); },
+    nullptr,
+    [](const GemmArgs &args) { return new GemmInterleaved<interleaved_s8s32_mmla_12x8, int8_t, int32_t>(args); }
+},
+#endif
 {
     GemmMethod::GEMM_HYBRID,
     "smallK_hybrid_s8s32_dot_4x8",