about | summary | refs | log | tree | commit | diff
path: root/src/core/NEON/kernels/arm_gemm/merges
diff options
context:
space:
mode:
author Georgios Pinitas <georgios.pinitas@arm.com> 2020-03-06 18:12:09 +0000
committer Georgios Pinitas <georgios.pinitas@arm.com> 2020-03-12 12:12:30 +0000
commit c7b183ab741650653289f8ce3bdeb4926521fdbd (patch)
tree 991e9f20340c91c288d52d8f9a64a3729e4a40b0 /src/core/NEON/kernels/arm_gemm/merges
parent 6800117df3be825f0ec5c6cc71c4377322f51b99 (diff)
download ComputeLibrary-c7b183ab741650653289f8ce3bdeb4926521fdbd.tar.gz
COMPMID-3160: Add Bfloat16 support in NEGEMMConvolutionLayer
Signed-off-by: Georgios Pinitas <georgios.pinitas@arm.com>
Change-Id: I0e449306c138a562ffc1455e76ec44b2fd059d85
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/2860
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Michele Di Giorgio <michele.digiorgio@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/core/NEON/kernels/arm_gemm/merges')
-rw-r--r-- src/core/NEON/kernels/arm_gemm/merges/a64_merge_fp16_24x8.hpp | 2
-rw-r--r-- src/core/NEON/kernels/arm_gemm/merges/a64_merge_fp32_12x8.hpp | 2
-rw-r--r-- src/core/NEON/kernels/arm_gemm/merges/a64_merge_s32_12x8.hpp | 2
-rw-r--r-- src/core/NEON/kernels/arm_gemm/merges/a64_merge_s32_4x4.hpp | 2
-rw-r--r-- src/core/NEON/kernels/arm_gemm/merges/a64_merge_u32_12x8.hpp | 2
-rw-r--r-- src/core/NEON/kernels/arm_gemm/merges/a64_merge_u32_4x4.hpp | 2
-rw-r--r-- src/core/NEON/kernels/arm_gemm/merges/sve_merge_fp16_3VLx8.hpp | 2
-rw-r--r-- src/core/NEON/kernels/arm_gemm/merges/sve_merge_fp32_3VLx8.hpp | 2
-rw-r--r-- src/core/NEON/kernels/arm_gemm/merges/sve_merge_s32_3VLx8.hpp | 2
-rw-r--r-- src/core/NEON/kernels/arm_gemm/merges/sve_merge_u32_3VLx8.hpp | 2
10 files changed, 10 insertions, 10 deletions
diff --git a/src/core/NEON/kernels/arm_gemm/merges/a64_merge_fp16_24x8.hpp b/src/core/NEON/kernels/arm_gemm/merges/a64_merge_fp16_24x8.hpp
index f82e7b4e47..5d8eae4866 100644
--- a/src/core/NEON/kernels/arm_gemm/merges/a64_merge_fp16_24x8.hpp
+++ b/src/core/NEON/kernels/arm_gemm/merges/a64_merge_fp16_24x8.hpp
@@ -29,7 +29,7 @@ template<>
void MergeResults<24, 8, false>(__fp16 *out, const __fp16 *in, const int ldout, const int y0, const int ymax, const int x0, const int xmax, const __fp16 *bias, Activation act, bool append)
{
const __fp16 *inptr = in;
- __fp16 nullbias[24] = { 0 };
+ __fp16 nullbias[24];
__fp16 minval = - static_cast<__fp16>(std::numeric_limits<float>::infinity());
__fp16 maxval = static_cast<__fp16>(std::numeric_limits<float>::infinity());
diff --git a/src/core/NEON/kernels/arm_gemm/merges/a64_merge_fp32_12x8.hpp b/src/core/NEON/kernels/arm_gemm/merges/a64_merge_fp32_12x8.hpp
index 0c5aa7eae8..088353e5f3 100644
--- a/src/core/NEON/kernels/arm_gemm/merges/a64_merge_fp32_12x8.hpp
+++ b/src/core/NEON/kernels/arm_gemm/merges/a64_merge_fp32_12x8.hpp
@@ -29,7 +29,7 @@ template<>
void MergeResults<12, 8, false>(float *out, const float *in, const int ldout, const int y0, const int ymax, const int x0, const int xmax, const float *bias, Activation act, bool append)
{
const float *inptr = in;
- float nullbias[12] = { 0 };
+ float nullbias[12];
float minval = - std::numeric_limits<float>::infinity();
float maxval = std::numeric_limits<float>::infinity();
diff --git a/src/core/NEON/kernels/arm_gemm/merges/a64_merge_s32_12x8.hpp b/src/core/NEON/kernels/arm_gemm/merges/a64_merge_s32_12x8.hpp
index 313f8295ff..2e45d8b5d1 100644
--- a/src/core/NEON/kernels/arm_gemm/merges/a64_merge_s32_12x8.hpp
+++ b/src/core/NEON/kernels/arm_gemm/merges/a64_merge_s32_12x8.hpp
@@ -31,7 +31,7 @@ void MergeResults<12, 8, false>(int32_t *out, const int32_t *in, const int ldout
UNUSED(act);
const int32_t *inptr = in;
- int32_t nullbias[12] = { 0 };
+ int32_t nullbias[12];
if (!append && !bias)
diff --git a/src/core/NEON/kernels/arm_gemm/merges/a64_merge_s32_4x4.hpp b/src/core/NEON/kernels/arm_gemm/merges/a64_merge_s32_4x4.hpp
index a93060fa5a..6d869af803 100644
--- a/src/core/NEON/kernels/arm_gemm/merges/a64_merge_s32_4x4.hpp
+++ b/src/core/NEON/kernels/arm_gemm/merges/a64_merge_s32_4x4.hpp
@@ -31,7 +31,7 @@ void MergeResults<4, 4, false>(int32_t *out, const int32_t *in, const int ldout,
UNUSED(act);
const int32_t *inptr = in;
- int32_t nullbias[4] = { 0 };
+ int32_t nullbias[4];
if (!append && !bias)
diff --git a/src/core/NEON/kernels/arm_gemm/merges/a64_merge_u32_12x8.hpp b/src/core/NEON/kernels/arm_gemm/merges/a64_merge_u32_12x8.hpp
index 5569f5157b..0a05944102 100644
--- a/src/core/NEON/kernels/arm_gemm/merges/a64_merge_u32_12x8.hpp
+++ b/src/core/NEON/kernels/arm_gemm/merges/a64_merge_u32_12x8.hpp
@@ -31,7 +31,7 @@ void MergeResults<12, 8, false>(uint32_t *out, const uint32_t *in, const int ldo
UNUSED(act);
const uint32_t *inptr = in;
- uint32_t nullbias[12] = { 0 };
+ uint32_t nullbias[12];
if (!append && !bias)
diff --git a/src/core/NEON/kernels/arm_gemm/merges/a64_merge_u32_4x4.hpp b/src/core/NEON/kernels/arm_gemm/merges/a64_merge_u32_4x4.hpp
index fd01bb2392..efb17dc9e9 100644
--- a/src/core/NEON/kernels/arm_gemm/merges/a64_merge_u32_4x4.hpp
+++ b/src/core/NEON/kernels/arm_gemm/merges/a64_merge_u32_4x4.hpp
@@ -31,7 +31,7 @@ void MergeResults<4, 4, false>(uint32_t *out, const uint32_t *in, const int ldou
UNUSED(act);
const uint32_t *inptr = in;
- uint32_t nullbias[4] = { 0 };
+ uint32_t nullbias[4];
if (!append && !bias)
diff --git a/src/core/NEON/kernels/arm_gemm/merges/sve_merge_fp16_3VLx8.hpp b/src/core/NEON/kernels/arm_gemm/merges/sve_merge_fp16_3VLx8.hpp
index e5efc09b52..a44ef55a86 100644
--- a/src/core/NEON/kernels/arm_gemm/merges/sve_merge_fp16_3VLx8.hpp
+++ b/src/core/NEON/kernels/arm_gemm/merges/sve_merge_fp16_3VLx8.hpp
@@ -29,7 +29,7 @@ template<>
void MergeResults<3, 8, true>(__fp16 *out, const __fp16 *in, const int ldout, const int y0, const int ymax, const int x0, const int xmax, const __fp16 *bias, Activation act, bool append)
{
const __fp16 *inptr = in;
- __fp16 nullbias[384] = { 0 };
+ __fp16 nullbias[384];
__fp16 minval = - static_cast<__fp16>(std::numeric_limits<float>::infinity());
__fp16 maxval = static_cast<__fp16>(std::numeric_limits<float>::infinity());
diff --git a/src/core/NEON/kernels/arm_gemm/merges/sve_merge_fp32_3VLx8.hpp b/src/core/NEON/kernels/arm_gemm/merges/sve_merge_fp32_3VLx8.hpp
index f7feec4d83..bb073e4868 100644
--- a/src/core/NEON/kernels/arm_gemm/merges/sve_merge_fp32_3VLx8.hpp
+++ b/src/core/NEON/kernels/arm_gemm/merges/sve_merge_fp32_3VLx8.hpp
@@ -29,7 +29,7 @@ template<>
void MergeResults<3, 8, true>(float *out, const float *in, const int ldout, const int y0, const int ymax, const int x0, const int xmax, const float *bias, Activation act, bool append)
{
const float *inptr = in;
- float nullbias[192] = { 0 };
+ float nullbias[192];
float minval = - std::numeric_limits<float>::infinity();
float maxval = std::numeric_limits<float>::infinity();
diff --git a/src/core/NEON/kernels/arm_gemm/merges/sve_merge_s32_3VLx8.hpp b/src/core/NEON/kernels/arm_gemm/merges/sve_merge_s32_3VLx8.hpp
index 03a28241fd..d4c5073f8d 100644
--- a/src/core/NEON/kernels/arm_gemm/merges/sve_merge_s32_3VLx8.hpp
+++ b/src/core/NEON/kernels/arm_gemm/merges/sve_merge_s32_3VLx8.hpp
@@ -31,7 +31,7 @@ void MergeResults<3, 8, true>(int32_t *out, const int32_t *in, const int ldout,
UNUSED(act);
const int32_t *inptr = in;
- int32_t nullbias[192] = { 0 };
+ int32_t nullbias[192];
if (!append && !bias)
{
diff --git a/src/core/NEON/kernels/arm_gemm/merges/sve_merge_u32_3VLx8.hpp b/src/core/NEON/kernels/arm_gemm/merges/sve_merge_u32_3VLx8.hpp
index 67a6eb32bb..f2a28fa004 100644
--- a/src/core/NEON/kernels/arm_gemm/merges/sve_merge_u32_3VLx8.hpp
+++ b/src/core/NEON/kernels/arm_gemm/merges/sve_merge_u32_3VLx8.hpp
@@ -31,7 +31,7 @@ void MergeResults<3, 8, true>(uint32_t *out, const uint32_t *in, const int ldout
UNUSED(act);
const uint32_t *inptr = in;
- uint32_t nullbias[192] = { 0 };
+ uint32_t nullbias[192];
if (!append && !bias)
{