diff options
Diffstat (limited to 'src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4.hpp')
-rw-r--r-- | src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4.hpp | 28 |
1 files changed, 13 insertions, 15 deletions
diff --git a/src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4.hpp b/src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4.hpp
index 5aa5291a29..23f4c1d84f 100644
--- a/src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4.hpp
+++ b/src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4.hpp
@@ -25,38 +25,36 @@
 
 #ifdef __aarch64__
 
-namespace arm_gemm
-{
+namespace arm_gemm {
+
 // Kernel definition
 void a64_gemm_u8_4x4(const uint8_t *Apanel, const uint8_t *Bpanel, uint32_t *Cpanel, int ablocks, int bblocks, int K);
 
-class gemm_u8_4x4
-{
+class gemm_u8_4x4 {
 public:
-    typedef uint8_t operand_type;
+    typedef uint8_t operand_type;
     typedef uint32_t result_type;
 
     typedef void (*kern_type)(const uint8_t *, const uint8_t *, uint32_t *, int, int, int);
 
     /* Describes the data layout for A input */
-    static const int A_interleave = 4;
-    static const int A_block = 16;
-    static const bool A_transpose = false;
+    static const int A_interleave = 4;
+    static const int A_block = 16;
+    static const bool A_transpose = false;
 
     /* Same for B input */
-    static const int B_interleave = 4;
-    static const int B_block = 16;
-    static const bool B_transpose = true;
+    static const int B_interleave = 4;
+    static const int B_block = 16;
+    static const bool B_transpose = true;
 
     /* Kernel blocking parameters */
-    static const int out_width = 4;
+    static const int out_width = 4;
     static const int out_height = 4;
-    static const int k_unroll = 16;
+    static const int k_unroll = 16;
 
     kern_type kernel = nullptr;
 
-    gemm_u8_4x4(const CPUInfo *ci)
-    {
+    gemm_u8_4x4(const CPUInfo *ci) {
         kernel = a64_gemm_u8_4x4;
     }
 };