aboutsummaryrefslogtreecommitdiff
path: root/src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_fp16_mla_8x24.hpp
diff options
context:
space:
mode:
Diffstat (limited to 'src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_fp16_mla_8x24.hpp')
-rw-r--r--src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_fp16_mla_8x24.hpp110
1 files changed, 0 insertions, 110 deletions
diff --git a/src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_fp16_mla_8x24.hpp b/src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_fp16_mla_8x24.hpp
deleted file mode 100644
index ce63600424..0000000000
--- a/src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_fp16_mla_8x24.hpp
+++ /dev/null
@@ -1,110 +0,0 @@
-/*
- * Copyright (c) 2021 Arm Limited.
- *
- * SPDX-License-Identifier: MIT
- *
- * Permission is hereby granted, free of charge, to any person obtaining a copy
- * of this software and associated documentation files (the "Software"), to
- * deal in the Software without restriction, including without limitation the
- * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
- * sell copies of the Software, and to permit persons to whom the Software is
- * furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice shall be included in
- * all copies or substantial portions of the Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
- * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
- * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
- * IN THE SOFTWARE.
- */
-#pragma once
-
-#ifdef __aarch64__
-#include "../std_transforms_fixed.hpp"
-#include "../performance_parameters.hpp"
-
-#define ARGLIST \
- const __fp16 *, const __fp16 *, \
- __fp16 *, int, int, int
-
-namespace arm_gemm
-{
-// Actual kernel implementations
-void a64_interleaved_fp16_mla_8x24( ARGLIST );
-void a64_interleaved_fp16_mla_8x24_a55( ARGLIST );
-void a64_interleaved_fp16_mla_8x24_x1( ARGLIST );
-
-class cls_a64_interleaved_fp16_mla_8x24
-{
-public:
- typedef __fp16 operand_type;
- typedef __fp16 result_type;
-
- typedef void (*kern_type)( ARGLIST );
-
- /* Kernel blocking parameters */
- static constexpr unsigned int out_height()
- {
- return 8;
- }
-
- static unsigned int out_width()
- {
- return 24;
- }
-
- static unsigned int stripe_width()
- {
- return 8;
- }
-
- static constexpr unsigned int k_unroll()
- {
- return 1;
- }
-
-
- StdTransformsFixed<operand_type, result_type, 8, 24, 1> transforms = {};
- StdTransformsFixed<operand_type, result_type, 8, 24, 1, true> transforms_quantized = {};
- template<typename T>
- static inline PerformanceParameters get_performance_parameters(const CPUInfo *ci)
- {
-
- if (std::is_same<T, __fp16>::value) {
- switch (ci->get_cpu_model()) {
- case CPUModel::A55r1:
- return { 7.16, 1.14, 0.67 };
- default:
- return { 12.67, 3.98, 1.16 };
- }
- }
-
- return { 1.0 };
- }
-
- // Default to the generic kernel
- kern_type kernel=a64_interleaved_fp16_mla_8x24;
- cls_a64_interleaved_fp16_mla_8x24(const CPUInfo *ci)
- {
- switch(ci->get_cpu_model()) {
- default:
- break;
- case CPUModel::A55r1:
- kernel=a64_interleaved_fp16_mla_8x24_a55;
- break;
- case CPUModel::X1:
- kernel=a64_interleaved_fp16_mla_8x24_x1;
- break;
- }
- }
-};
-
-} // namespace arm_gemm
-
-#undef ARGLIST
-
-#endif // __aarch64__