aboutsummaryrefslogtreecommitdiff
path: root/src/armnn/Network.cpp
diff options
context:
space:
mode:
author Rob Hughes <robert.hughes@arm.com> 2019-09-24 16:59:56 +0100
committer Áron Virginás-Tar <aron.virginas-tar@arm.com> 2019-09-27 10:17:26 +0000
commit 3a7d3a70d99cbe22f5e4711d5dbbea2a245da7ed (patch)
tree 445967fa35016374657b5c7e38b2715773a25e02 /src/armnn/Network.cpp
parent 83239f995e7b86062450794b85bfe4c4c387fda0 (diff)
download armnn-3a7d3a70d99cbe22f5e4711d5dbbea2a245da7ed.tar.gz
NNXSW-1826 Add an optimization step which combines Permute and BatchToSpace into DepthToSpace
This is only possible in some limited cases, but it removes an extra layer from the graph and so should improve performance in all cases where it applies.
Change-Id: I7b3e6ba5dacb4fdb816ad270edaecda1436ab4cf
Signed-off-by: Rob Hughes <robert.hughes@arm.com>
Diffstat (limited to 'src/armnn/Network.cpp')
-rw-r--r-- src/armnn/Network.cpp 3
1 file changed, 2 insertions, 1 deletion
diff --git a/src/armnn/Network.cpp b/src/armnn/Network.cpp
index a668274c4d..cf9a138084 100644
--- a/src/armnn/Network.cpp
+++ b/src/armnn/Network.cpp
@@ -818,7 +818,8 @@ IOptimizedNetworkPtr Optimize(const INetwork& inNetwork,
MovePermuteUp(),
PermuteAsReshape(),
OptimizeConsecutiveReshapes(),
- FoldPadIntoConvolution2d()));
+ FoldPadIntoConvolution2d(),
+ PermuteAndBatchToSpaceAsDepthToSpace()));
// Infer the tensor infos for all output slots. Throws an exception on failure
optGraph.InferTensorInfos();