aboutsummaryrefslogtreecommitdiff
path: root/src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4.hpp
diff options
context:
space:
mode:
Diffstat (limited to 'src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4.hpp')
-rw-r--r-- src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4.hpp 22
1 files changed, 17 insertions, 5 deletions
diff --git a/src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4.hpp b/src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4.hpp
index 23f4c1d84f..2da3ecd4f8 100644
--- a/src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4.hpp
+++ b/src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4.hpp
@@ -25,6 +25,8 @@
#ifdef __aarch64__
+#include "../std_transforms_fixed.hpp"
+
namespace arm_gemm {
// Kernel definition
@@ -48,14 +50,24 @@ public:
static const bool B_transpose = true;
/* Kernel blocking parameters */
- static const int out_width = 4;
- static const int out_height = 4;
- static const int k_unroll = 16;
+ static int out_width() {
+ return 4;
+ }
+
+ static int out_height() {
+ return 4;
+ }
+
+ static int k_unroll() {
+ return 16;
+ }
+
+ // Use the standard fixed size transforms.
+ StdTransformsFixed<operand_type, result_type, 4, 4, 16> transforms = {};
- kern_type kernel = nullptr;
+ kern_type kernel = a64_gemm_u8_4x4;
gemm_u8_4x4(const CPUInfo *ci) {
- kernel = a64_gemm_u8_4x4;
}
};