aboutsummaryrefslogtreecommitdiff
path: root/src/cpu/kernels/CpuActivationKernel.cpp
diff options
context:
space:
mode:
authorMohammed Suhail Munshi <MohammedSuhail.Munshi@arm.com>2023-12-05 14:27:31 +0000
committerMohmun02 <MohammedSuhail.Munshi@arm.com>2024-01-10 09:56:39 +0000
commit7467ba8fac0afb19d750b3bdda9ba95002634038 (patch)
treee47d4989251f03d13590e6b22d9bd228fd1efe34 /src/cpu/kernels/CpuActivationKernel.cpp
parent7fe7791468978429ab02343a8485b51b39832027 (diff)
downloadComputeLibrary-7467ba8fac0afb19d750b3bdda9ba95002634038.tar.gz
Use look up table for fp16 activation
- Enables FP16 lut for logistic activation - Adds LUTManager to re-use lut where appropriate. Signed-off-by: Mohammed Suhail Munshi <MohammedSuhail.Munshi@arm.com> Change-Id: I94667b63b452a8e58a1eb59cb0b5866178954523 Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/10864 Tested-by: Arm Jenkins <bsgcomp@arm.com> Reviewed-by: Gunes Bayir <gunes.bayir@arm.com> Comments-Addressed: Arm Jenkins <bsgcomp@arm.com> Benchmark: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/cpu/kernels/CpuActivationKernel.cpp')
-rw-r--r--src/cpu/kernels/CpuActivationKernel.cpp17
1 files changed, 17 insertions, 0 deletions
diff --git a/src/cpu/kernels/CpuActivationKernel.cpp b/src/cpu/kernels/CpuActivationKernel.cpp
index 3f3d72e8df..7cfa39b286 100644
--- a/src/cpu/kernels/CpuActivationKernel.cpp
+++ b/src/cpu/kernels/CpuActivationKernel.cpp
@@ -83,6 +83,13 @@ static const std::vector<CpuActivationKernel::ActivationKernel> available_kernel
data.f != ActivationLayerInfo::ActivationFunction::GELU;
},
REGISTER_QSYMM16_SVE2(arm_compute::cpu::sve2_qsymm16_activation)},
+ {"sve_fp16_activation_lut",
+ [](const ActivationDataTypeISASelectorData &data)
+ {
+ return data.dt == DataType::F16 && data.isa.fp16 && data.isa.sve &&
+ data.f == ActivationLayerInfo::ActivationFunction::LOGISTIC;
+ },
+ REGISTER_FP16_SVE(arm_compute::cpu::sve_fp16_activation_lut)},
{"sve_fp16_activation",
[](const ActivationDataTypeISASelectorData &data)
{
@@ -279,6 +286,9 @@ void CpuActivationKernel::configure(const ITensorInfo *src, ITensorInfo *dst, Ac
_name = std::string("CpuActivationKernel").append("/").append(uk->name);
#ifdef __aarch64__
+ // Initialise lut_manager
+ LUTManager &lut_manager = LUTManager::get_instance();
+
if ((src->data_type() == DataType::QASYMM8 || src->data_type() == DataType::QASYMM8_SIGNED) &&
activation_info.activation() != ActivationFunction::RELU)
{
@@ -288,6 +298,13 @@ void CpuActivationKernel::configure(const ITensorInfo *src, ITensorInfo *dst, Ac
activation_info.a(), activation_info.b());
activation_info.setLookupTable256(tmp_lut);
}
+
+ if (src->data_type() == DataType::F16 &&
+ activation_info.activation() == ActivationLayerInfo::ActivationFunction::LOGISTIC)
+ {
+ const LUTInfo info = {activation_info.activation(), src->data_type(), src->quantization_info()};
+ activation_info.setLookupTable65536((lut_manager.get_lut_table(info)));
+ }
#endif // __aarch64__
_act_info = activation_info;