about | summary | refs | log | tree | commit | diff
path: root/arm_compute/core/NEON/kernels/NEBatchNormalizationLayerKernel.h
diff options
context:
space:
mode:
author Georgios Pinitas <georgios.pinitas@arm.com> 2020-06-03 20:16:46 +0100
committer Georgios Pinitas <georgios.pinitas@arm.com> 2020-06-09 11:58:01 +0000
commit 980a9168b81d778f4902973b4920b54c103907e0 (patch)
tree d2e8bf3527db8fe39cec8c51c6a914b721c35b03 /arm_compute/core/NEON/kernels/NEBatchNormalizationLayerKernel.h
parent 2d10f186aacfc56b601b3cdaffa942cc6e6d1f53 (diff)
download ComputeLibrary-980a9168b81d778f4902973b4920b54c103907e0.tar.gz
COMPMID-3177: Remove padding from NEBatchNormalizationLayer
Signed-off-by: Georgios Pinitas <georgios.pinitas@arm.com>
Change-Id: I9be23e6ef1f552eb159e39fda16c82fa20124094
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/3307
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Gian Marco Iodice <gianmarco.iodice@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'arm_compute/core/NEON/kernels/NEBatchNormalizationLayerKernel.h')
-rw-r--r-- arm_compute/core/NEON/kernels/NEBatchNormalizationLayerKernel.h 29
1 files changed, 8 insertions, 21 deletions
diff --git a/arm_compute/core/NEON/kernels/NEBatchNormalizationLayerKernel.h b/arm_compute/core/NEON/kernels/NEBatchNormalizationLayerKernel.h
index d59ed7baf0..7371e3c177 100644
--- a/arm_compute/core/NEON/kernels/NEBatchNormalizationLayerKernel.h
+++ b/arm_compute/core/NEON/kernels/NEBatchNormalizationLayerKernel.h
@@ -1,5 +1,5 @@
/*
- * Copyright (c) 2017-2019 ARM Limited.
+ * Copyright (c) 2017-2020 ARM Limited.
*
* SPDX-License-Identifier: MIT
*
@@ -28,6 +28,7 @@
namespace arm_compute
{
+// Forward declarations
class ITensor;
/** Interface for the batch normalization layer kernel.
@@ -97,40 +98,26 @@ private:
/** Configure execution function in case of fused activation **/
void configure_fused();
- /** Template function to run batch normalization on fp16
- *
- * @tparam fused_activation Boolean that flags if its a fused activation or not
- *
- * @param[in] window Region on which to execute the kernel. (Must be a valid region of the window returned by window()).
- */
- template <bool fused_activation, typename F>
- void batch_normalization_fp16_nchw(const Window &window);
- /** Template function to run batch normalization on fp16 on tensors with NHWC format
- *
- * @tparam fused_activation Boolean that flags if its a fused activation or not
- *
- * @param[in] window Region on which to execute the kernel. (Must be a valid region of the window returned by window()).
- */
- template <bool fused_activation, typename F>
- void batch_normalization_fp16_nhwc(const Window &window);
/** Template function to run batch normalization on fp32
*
+ * @tparam T Specialization data type
* @tparam fused_activation Boolean that flags if its a fused activation or not
* @tparam F Activation function functor to run
*
* @param[in] window Region on which to execute the kernel. (Must be a valid region of the window returned by window()).
*/
- template <bool fused_activation, typename F>
- void batch_normalization_fp32_nchw(const Window &window);
+ template <typename T, bool fused_activation, typename F>
+ void batch_normalization_nchw(const Window &window);
/** Template function to run batch normalization on fp32 on tensors with NHWC format
*
+ * @tparam T Specialization data type
* @tparam fused_activation Boolean that flags if its a fused activation or not
* @tparam F Activation function functor to run
*
* @param[in] window Region on which to execute the kernel. (Must be a valid region of the window returned by window()).
*/
- template <bool fused_activation, typename F>
- void batch_normalization_fp32_nhwc(const Window &window);
+ template <typename T, bool fused_activation, typename F>
+ void batch_normalization_nhwc(const Window &window);
/** Common signature for all the batch normalization functions
*
* @param[in] window Region on which to execute the kernel.