diff options
Diffstat (limited to 'src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_12x8.hpp')
-rw-r--r-- | src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_12x8.hpp | 27 |
1 files changed, 15 insertions, 12 deletions
diff --git a/src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_12x8.hpp b/src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_12x8.hpp
index c91d50469f..10d1069417 100644
--- a/src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_12x8.hpp
+++ b/src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_12x8.hpp
@@ -25,6 +25,8 @@
 
 #ifdef __aarch64__
 
+#include "../std_transforms_fixed.hpp"
+
 namespace arm_gemm {
 
 // Actual kernel implementations
@@ -48,20 +50,21 @@ public:
 
     typedef void (*kern_type)(const float *, const float *, float *, int, int, int);
 
-    /* Describes the data layout for A input */
-    static const int A_interleave = 8;
-    static const int A_block = 1;
-    static const int A_transpose = 0;
+    /* Kernel blocking parameters */
+    static int out_width() {
+        return 12;
+    }
 
-    /* Same for B input */
-    static const int B_interleave = 12;
-    static const int B_block = 1;
-    static const int B_transpose = 1;
+    static int out_height() {
+        return 8;
+    }
 
-    /* Kernel blocking parameters */
-    static const int out_width = 12;
-    static const int out_height = 8;
-    static const int k_unroll = 1;
+    static int k_unroll() {
+        return 1;
+    }
+
+    // Use the standard fixed size transforms.
+    StdTransformsFixed<operand_type, result_type, 8, 12> transforms = {};
 
     kern_type kernel=a64_sgemm_asimd_12x8;
 
|