aboutsummaryrefslogtreecommitdiff
path: root/src/cpu/kernels/add/generic/neon/integer.cpp
diff options
context:
space:
mode:
author Gunes Bayir <gunes.bayir@arm.com> 2022-07-28 17:44:00 +0100
committer Gunes Bayir <gunes.bayir@arm.com> 2022-08-01 20:13:56 +0000
commit 9b921be1ff7283050eb39d9ce1b10b5c8bfc1300 (patch)
tree 0cb274a6c529717b8ef987aa3e270647927e9d89 /src/cpu/kernels/add/generic/neon/integer.cpp
parent 385dad2bffecbf395aa9aad257809de81c727ac7 (diff)
download ComputeLibrary-9b921be1ff7283050eb39d9ce1b10b5c8bfc1300.tar.gz
Optimize add layer by considering the input tensors as 1D array
Resolves: COMPMID-5108
Change-Id: I544f8160fbe5b4ffbef348d1fbd3dd626a6e1bdb
Signed-off-by: Gunes Bayir <gunes.bayir@arm.com>
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/8002
Reviewed-by: Gian Marco Iodice <gianmarco.iodice@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Benchmark: Arm Jenkins <bsgcomp@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/cpu/kernels/add/generic/neon/integer.cpp')
-rw-r--r-- src/cpu/kernels/add/generic/neon/integer.cpp 17
1 files changed, 16 insertions, 1 deletions
diff --git a/src/cpu/kernels/add/generic/neon/integer.cpp b/src/cpu/kernels/add/generic/neon/integer.cpp
index 62c19e66b1..ffead03474 100644
--- a/src/cpu/kernels/add/generic/neon/integer.cpp
+++ b/src/cpu/kernels/add/generic/neon/integer.cpp
@@ -1,5 +1,5 @@
/*
- * Copyright (c) 2021 Arm Limited.
+ * Copyright (c) 2021-2022 Arm Limited.
*
* SPDX-License-Identifier: MIT
*
@@ -42,5 +42,20 @@ void add_s32_neon(const ITensor *src0, const ITensor *src1, ITensor *dst, const
{
return add_same_neon<int32_t>(src0, src1, dst, policy, window);
}
+
+/** NEON add entry point for uint8_t data, using the "as 1D array" code path.
+ *
+ * Thin non-template wrapper: every argument is passed through untouched to
+ * add_same_neon_as_1d_array<uint8_t>; no other work is done here.
+ *
+ * @param[in]  src0   First source tensor.
+ * @param[in]  src1   Second source tensor.
+ * @param[out] dst    Destination tensor.
+ * @param[in]  policy Conversion policy handed to the template
+ *                    (presumably selects overflow handling - confirm against the template).
+ * @param[in]  window Execution window handed to the template.
+ */
+void add_u8_neon_as_1d_array(const ITensor       *src0,
+                             const ITensor       *src1,
+                             ITensor             *dst,
+                             const ConvertPolicy &policy,
+                             const Window        &window)
+{
+    // A void function may only `return` a void expression, so a plain call is equivalent.
+    add_same_neon_as_1d_array<uint8_t>(src0, src1, dst, policy, window);
+}
+
+/** NEON add entry point for int16_t data, using the "as 1D array" code path.
+ *
+ * Thin non-template wrapper: every argument is passed through untouched to
+ * add_same_neon_as_1d_array<int16_t>; no other work is done here.
+ *
+ * @param[in]  src0   First source tensor.
+ * @param[in]  src1   Second source tensor.
+ * @param[out] dst    Destination tensor.
+ * @param[in]  policy Conversion policy handed to the template
+ *                    (presumably selects overflow handling - confirm against the template).
+ * @param[in]  window Execution window handed to the template.
+ */
+void add_s16_neon_as_1d_array(const ITensor       *src0,
+                              const ITensor       *src1,
+                              ITensor             *dst,
+                              const ConvertPolicy &policy,
+                              const Window        &window)
+{
+    // A void function may only `return` a void expression, so a plain call is equivalent.
+    add_same_neon_as_1d_array<int16_t>(src0, src1, dst, policy, window);
+}
+
+/** NEON add entry point for int32_t data, using the "as 1D array" code path.
+ *
+ * Thin non-template wrapper: every argument is passed through untouched to
+ * add_same_neon_as_1d_array<int32_t>; no other work is done here.
+ *
+ * @param[in]  src0   First source tensor.
+ * @param[in]  src1   Second source tensor.
+ * @param[out] dst    Destination tensor.
+ * @param[in]  policy Conversion policy handed to the template
+ *                    (presumably selects overflow handling - confirm against the template).
+ * @param[in]  window Execution window handed to the template.
+ */
+void add_s32_neon_as_1d_array(const ITensor       *src0,
+                              const ITensor       *src1,
+                              ITensor             *dst,
+                              const ConvertPolicy &policy,
+                              const Window        &window)
+{
+    // A void function may only `return` a void expression, so a plain call is equivalent.
+    add_same_neon_as_1d_array<int32_t>(src0, src1, dst, policy, window);
+}
}
} // namespace arm_compute