aboutsummaryrefslogtreecommitdiff
path: root/src/core/NEON/kernels/arm_gemm/gemv_pretransposed.hpp
diff options
context:
space:
mode:
author Viet-Hoa Do <viet-hoa.do@arm.com> 2022-06-01 11:47:14 +0100
committer Viet-Hoa Do <viet-hoa.do@arm.com> 2022-11-28 16:57:42 +0000
commit 03b2971ac69a86f10a1566938d1a25afee15746c (patch)
tree aec7cfc047e1da278b4b71a706cda7b1b0faa158 /src/core/NEON/kernels/arm_gemm/gemv_pretransposed.hpp
parent 7dc0234331f2150a6b4ac5c2b49de419870f7cf5 (diff)
download ComputeLibrary-03b2971ac69a86f10a1566938d1a25afee15746c.tar.gz
Integrate SME2 kernels
* Add SME/SME2 detection.
* Integrate SME2 implementation for:
  - Normal convolution
  - Winograd
  - Depthwise convolution
  - Pooling

Resolves: COMPMID-5700
Signed-off-by: Viet-Hoa Do <viet-hoa.do@arm.com>
Change-Id: I2f1ca1d05f8cfeee9309ed1c0a36096a4a6aad5c
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/8692
Reviewed-by: Gunes Bayir <gunes.bayir@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/core/NEON/kernels/arm_gemm/gemv_pretransposed.hpp')
-rw-r--r-- src/core/NEON/kernels/arm_gemm/gemv_pretransposed.hpp 14
1 files changed, 7 insertions, 7 deletions
diff --git a/src/core/NEON/kernels/arm_gemm/gemv_pretransposed.hpp b/src/core/NEON/kernels/arm_gemm/gemv_pretransposed.hpp
index f0b4e5db9e..86b33d081f 100644
--- a/src/core/NEON/kernels/arm_gemm/gemv_pretransposed.hpp
+++ b/src/core/NEON/kernels/arm_gemm/gemv_pretransposed.hpp
@@ -1,5 +1,5 @@
/*
- * Copyright (c) 2017-2021 Arm Limited.
+ * Copyright (c) 2017-2022 Arm Limited.
*
* SPDX-License-Identifier: MIT
*
@@ -41,10 +41,10 @@ namespace {
template<typename OutputStage>
class run_gemv_kernel {
public:
- template<typename strategy, typename To, typename Tr>
+ template<typename strategy, typename Tlo, typename Tro, typename Tr>
static void run (
const strategy &strat,
- const To *A_ptr, const To *B_ptr, Tr *c_ptr,
+ const Tlo *A_ptr, const Tro *B_ptr, Tr *c_ptr,
size_t N, size_t K,
const Tr *bias, const Activation &act, bool Accumulate,
const OutputStage &os, const int32_t *col_bias, unsigned int col_base
@@ -52,10 +52,10 @@ public:
};
template<>
-template<typename strategy, typename To, typename Tr>
+template<typename strategy, typename Tlo, typename Tro, typename Tr>
void run_gemv_kernel<Nothing>::run(
const strategy &strat,
- const To *A_ptr, const To *B_ptr, Tr *C_ptr,
+ const Tlo *A_ptr, const Tro *B_ptr, Tr *C_ptr,
size_t N, size_t K,
const Tr *bias, const Activation &act, bool Accumulate,
const Nothing &, const int32_t *, unsigned int
@@ -65,10 +65,10 @@ void run_gemv_kernel<Nothing>::run(
}
template<>
-template<typename strategy, typename To, typename Tr>
+template<typename strategy, typename Tlo, typename Tro, typename Tr>
void run_gemv_kernel<Requantize32>::run(
const strategy &strat,
- const To *A_ptr, const To *B_ptr, Tr *C_ptr,
+ const Tlo *A_ptr, const Tro *B_ptr, Tr *C_ptr,
size_t N, size_t K,
const Tr *, const Activation &, bool,
const Requantize32 &qp, const int32_t *col_bias, unsigned int col_base