aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
author Pablo Tello <pablo.tello@arm.com> 2019-07-26 13:45:48 +0100
committer Pablo Tello <pablo.tello@arm.com> 2019-07-26 17:04:50 +0100
commit b38ed40d34b6c176dc47884419e9d367452b7fe0 (patch)
tree aba0ba5cb2b0df0e033e06460cfd1a5fd59e2224
parent 3b9383548309a8f9121668826a628ec250c57a1c (diff)
download armnn-b38ed40d34b6c176dc47884419e9d367452b7fe0.tar.gz
MLCE-130: Enabled optimized path for DepthwiseConv 5x5
Change-Id: I5cd90121e5fe1b49b394ee6f5a87e86520a30119
Signed-off-by: Pablo Tello <pablo.tello@arm.com>
-rw-r--r-- src/backends/neon/workloads/NeonDepthwiseConvolutionWorkload.cpp 6
1 files changed, 4 insertions, 2 deletions
diff --git a/src/backends/neon/workloads/NeonDepthwiseConvolutionWorkload.cpp b/src/backends/neon/workloads/NeonDepthwiseConvolutionWorkload.cpp
index bfe4ddaea7..400ae18807 100644
--- a/src/backends/neon/workloads/NeonDepthwiseConvolutionWorkload.cpp
+++ b/src/backends/neon/workloads/NeonDepthwiseConvolutionWorkload.cpp
@@ -114,8 +114,10 @@ NeonDepthwiseConvolutionWorkload::NeonDepthwiseConvolutionWorkload(
arm_compute::PadStrideInfo padStrideInfo = BuildArmComputePadStrideInfo(m_Data.m_Parameters);
// Check for optimisation opportunities.
- bool use3x3Optimisation = (weightInfo.GetShape()[2] == 3) && (weightInfo.GetShape()[3] == 3);
- if (use3x3Optimisation)
+ const bool use3x3Optimisation = (weightInfo.GetShape()[2] == 3) && (weightInfo.GetShape()[3] == 3);
+ const bool use5x5Optimisation = (weightInfo.GetShape()[2] == 5) && (weightInfo.GetShape()[3] == 5);
+
+ if (use3x3Optimisation||use5x5Optimisation)
{
m_pDepthwiseConvolutionLayer = std::make_unique<arm_compute::NEDepthwiseConvolutionLayerOptimized>();
static_cast<arm_compute::NEDepthwiseConvolutionLayerOptimized*>(