FoldPadTests.cpp
//
// Copyright © 2022 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//

#include "LayersFwd.hpp"
#include <Network.hpp>
#include <TestUtils.hpp>
#include <doctest/doctest.h>
#include <armnn/backends/TensorHandle.hpp> // for ScopedTensorHandle
#include <Optimizer.hpp>

TEST_SUITE("Optimizer")
{
using namespace armnn;
using namespace armnn::optimizations;

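// Each graph-level test below follows the same pattern: build a Graph by hand,
// check the initial layer sequence, run a single optimization over the graph,
// then check whether the Pad layer has been absorbed. The driving call,
// sketched here with the convolution fold as the example (the concrete
// optimization differs per test):
//
//     armnn::Optimizer::Pass(graph, MakeOptimizations(FoldPadIntoConvolution2d()));
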
TEST_CASE("FoldPadLayerIntoConvolution2dLayer")
{
    Graph graph;
    const unsigned int inputShape[]   = {1, 2, 2, 3};
    const unsigned int paddedShape[]  = {1, 6, 6, 3};
    const unsigned int weightsShape[] = {1, 2, 3, 3};
    const unsigned int outputShape[]  = {1, 2, 1, 1};

    TensorInfo inputInfo(4, inputShape, DataType::Float32);
    TensorInfo paddedInfo(4, paddedShape, DataType::Float32);
    TensorInfo weightsInfo(4, weightsShape, DataType::Float32, 1.0f, 0, true);
    TensorInfo outputInfo(4, outputShape, DataType::Float32);

    Layer* input = graph.AddLayer<InputLayer>(0, "input");
    input->GetOutputSlot().SetTensorInfo(inputInfo);

    PadDescriptor padDescriptor({{0, 0},
                                 {2, 2},
                                 {2, 2},
                                 {0, 0}});

    PadLayer* padLayer = graph.AddLayer<PadLayer>(padDescriptor, "pad");
    padLayer->GetOutputSlot().SetTensorInfo(paddedInfo);

    Convolution2dDescriptor convolution2dDescriptor;
    convolution2dDescriptor.m_BiasEnabled = false;
    convolution2dDescriptor.m_StrideX     = 1;
    convolution2dDescriptor.m_StrideY     = 1;
    convolution2dDescriptor.m_DataLayout  = DataLayout::NHWC;

    std::vector<float> weightsVector(18);
    ConstTensor weights(weightsInfo, weightsVector);

    ConstantLayer* weightsLayer = graph.AddLayer<ConstantLayer>("Weights");
    weightsLayer->m_LayerOutput = std::make_shared<ScopedTensorHandle>(weights);
    weightsLayer->GetOutputSlot(0).SetTensorInfo(weightsInfo);

    Convolution2dLayer* conv2dLayer = graph.AddLayer<Convolution2dLayer>(convolution2dDescriptor, "conv2d");
    conv2dLayer->GetOutputSlot().SetTensorInfo(outputInfo);

    Layer* output = graph.AddLayer<OutputLayer>(0, "output");

    // Connect up layers - input -> pad -> conv2d -> output
    input->GetOutputSlot().Connect(padLayer->GetInputSlot(0));
    padLayer->GetOutputSlot().Connect(conv2dLayer->GetInputSlot(0));
    weightsLayer->GetOutputSlot().Connect(conv2dLayer->GetInputSlot(1));
    conv2dLayer->GetOutputSlot().Connect(output->GetInputSlot(0));

    auto checkSimpleConv2d = [](const Layer* const layer) -> bool {
        const auto conv2dLayer       = static_cast<const Convolution2dLayer*>(layer);
        const auto conv2dLayerParams = conv2dLayer->GetParameters();
        return IsLayerOfType<Convolution2dLayer>(layer) && (layer->GetNameStr() == "conv2d") &&
               (conv2dLayerParams.m_PadLeft == 0) && (conv2dLayerParams.m_PadRight == 0) &&
               (conv2dLayerParams.m_PadTop == 0) && (conv2dLayerParams.m_PadBottom == 0) &&
               (conv2dLayerParams.m_StrideX == 1) && (conv2dLayerParams.m_StrideY == 1) &&
               (conv2dLayerParams.m_BiasEnabled == false) && (conv2dLayerParams.m_DataLayout == DataLayout::NHWC);
    };

    CHECK(CheckSequence(graph.cbegin(), graph.cend(),
                        &IsLayerOfType<InputLayer>,
                        &IsLayerOfType<ConstantLayer>,
                        &IsLayerOfType<PadLayer>,
                        checkSimpleConv2d,
                        &IsLayerOfType<OutputLayer>));

    armnn::Optimizer::Pass(graph, MakeOptimizations(FoldPadIntoConvolution2d()));

    auto checkPadFoldedIntoConv2d = [](const Layer* const layer) -> bool {
        const auto conv2dLayer       = static_cast<const Convolution2dLayer*>(layer);
        const auto conv2dLayerParams = conv2dLayer->GetParameters();
        return IsLayerOfType<Convolution2dLayer>(layer) && (layer->GetNameStr() == "folded-pad-into-conv2d") &&
               (conv2dLayerParams.m_PadLeft == 2) && (conv2dLayerParams.m_PadRight == 2) &&
               (conv2dLayerParams.m_PadTop == 2) && (conv2dLayerParams.m_PadBottom == 2) &&
               (conv2dLayerParams.m_StrideX == 1) && (conv2dLayerParams.m_StrideY == 1) &&
               (conv2dLayerParams.m_BiasEnabled == false) && (conv2dLayerParams.m_DataLayout == DataLayout::NHWC);
    };

    CHECK(CheckSequence(graph.cbegin(), graph.cend(),
                        &IsLayerOfType<InputLayer>,
                        &IsLayerOfType<ConstantLayer>,
                        checkPadFoldedIntoConv2d,
                        &IsLayerOfType<OutputLayer>));
}
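
// Sanity check on the fold above: padding the 2x2 spatial input by 2 on each
// side produces the 6x6 padded tensor, so a convolution reading the 6x6 pad
// output with m_Pad* == 0 sees exactly the same data as one reading the
// original 2x2 input with m_Pad* == 2. That equivalence is what lets the
// optimization delete the Pad layer and move its offsets into the descriptor.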

TEST_CASE("FoldPadLayerIntoDepthwiseConvolution2dLayer")
{
    Graph graph;
    const unsigned int inputShape[]   = {1, 2, 2, 3};
    const unsigned int paddedShape[]  = {1, 6, 6, 3};
    const unsigned int weightsShape[] = {1, 2, 3, 3};
    const unsigned int outputShape[]  = {1, 2, 1, 3};

    TensorInfo inputInfo(4, inputShape, DataType::Float32);
    TensorInfo paddedInfo(4, paddedShape, DataType::Float32);
    TensorInfo weightsInfo(4, weightsShape, DataType::Float32, 1.0f, 0, true);
    TensorInfo outputInfo(4, outputShape, DataType::Float32);

    Layer* input = graph.AddLayer<InputLayer>(0, "input");
    input->GetOutputSlot().SetTensorInfo(inputInfo);

    PadDescriptor padDescriptor({{0, 0},
                                 {2, 2},
                                 {2, 2},
                                 {0, 0}});

    PadLayer* padLayer = graph.AddLayer<PadLayer>(padDescriptor, "pad");
    padLayer->GetOutputSlot().SetTensorInfo(paddedInfo);

    DepthwiseConvolution2dDescriptor depthwiseConvolution2dDescriptor;
    depthwiseConvolution2dDescriptor.m_BiasEnabled = false;
    depthwiseConvolution2dDescriptor.m_StrideX     = 1;
    depthwiseConvolution2dDescriptor.m_StrideY     = 1;
    depthwiseConvolution2dDescriptor.m_DataLayout  = DataLayout::NHWC;

    std::vector<float> weightsVector(18);
    ConstTensor weights(weightsInfo, weightsVector);

    auto* weightsLayer = graph.AddLayer<ConstantLayer>("weights");
    weightsLayer->GetOutputSlot().SetTensorInfo(weightsInfo);
    weightsLayer->m_LayerOutput = std::make_shared<ScopedTensorHandle>(weights);

    auto* depthwiseConv2dLayer = graph.AddLayer<DepthwiseConvolution2dLayer>(depthwiseConvolution2dDescriptor,
                                                                             "depthwiseConv2d");
    depthwiseConv2dLayer->GetOutputSlot().SetTensorInfo(outputInfo);

    Layer* output = graph.AddLayer<OutputLayer>(0, "output");

    // Connect up layers - input -> pad -> depthwiseConv2d -> output
    input->GetOutputSlot().Connect(padLayer->GetInputSlot(0));
    padLayer->GetOutputSlot().Connect(depthwiseConv2dLayer->GetInputSlot(0));
    weightsLayer->GetOutputSlot().Connect(depthwiseConv2dLayer->GetInputSlot(1));
    depthwiseConv2dLayer->GetOutputSlot().Connect(output->GetInputSlot(0));

    auto checkSimpleDepthwiseConv2d = [](const Layer* const layer) -> bool {
        const auto depthwiseConv2dLayer       = static_cast<const DepthwiseConvolution2dLayer*>(layer);
        const auto depthwiseConv2dLayerParams = depthwiseConv2dLayer->GetParameters();
        return IsLayerOfType<DepthwiseConvolution2dLayer>(layer) && (layer->GetNameStr() == "depthwiseConv2d") &&
               (depthwiseConv2dLayerParams.m_PadLeft == 0) && (depthwiseConv2dLayerParams.m_PadRight == 0) &&
               (depthwiseConv2dLayerParams.m_PadTop == 0) && (depthwiseConv2dLayerParams.m_PadBottom == 0) &&
               (depthwiseConv2dLayerParams.m_StrideX == 1) && (depthwiseConv2dLayerParams.m_StrideY == 1) &&
               (depthwiseConv2dLayerParams.m_BiasEnabled == false) &&
               (depthwiseConv2dLayerParams.m_DataLayout == DataLayout::NHWC);
    };

    CHECK(CheckSequence(graph.cbegin(), graph.cend(),
                        &IsLayerOfType<InputLayer>,
                        &IsLayerOfType<ConstantLayer>,
                        &IsLayerOfType<PadLayer>,
                        checkSimpleDepthwiseConv2d,
                        &IsLayerOfType<OutputLayer>));

    armnn::Optimizer::Pass(graph, MakeOptimizations(FoldPadIntoDepthwiseConvolution2d()));

    auto checkPadFoldedIntoDepthwiseConv2d = [](const Layer* const layer) -> bool {
        const auto depthwiseConv2dLayer       = static_cast<const DepthwiseConvolution2dLayer*>(layer);
        const auto depthwiseConv2dLayerParams = depthwiseConv2dLayer->GetParameters();
        return IsLayerOfType<DepthwiseConvolution2dLayer>(layer) &&
               (layer->GetNameStr() == "folded-pad-into-depthwiseConv2d") &&
               (depthwiseConv2dLayerParams.m_PadLeft == 2) && (depthwiseConv2dLayerParams.m_PadRight == 2) &&
               (depthwiseConv2dLayerParams.m_PadTop == 2) && (depthwiseConv2dLayerParams.m_PadBottom == 2) &&
               (depthwiseConv2dLayerParams.m_StrideX == 1) && (depthwiseConv2dLayerParams.m_StrideY == 1) &&
               (depthwiseConv2dLayerParams.m_BiasEnabled == false) &&
               (depthwiseConv2dLayerParams.m_DataLayout == DataLayout::NHWC);
    };

    CHECK(CheckSequence(graph.cbegin(), graph.cend(),
                        &IsLayerOfType<InputLayer>,
                        &IsLayerOfType<ConstantLayer>,
                        checkPadFoldedIntoDepthwiseConv2d,
                        &IsLayerOfType<OutputLayer>));
}
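
// Note on the depthwise weights: ArmNN stores depthwise weights as
// [1, H, W, Cout] (see the "1HWCout" comment in the inference test further
// down), so the {1, 2, 3, 3} shape here is a 2x3 kernel over 3 output
// channels. The fold itself never touches the weight tensor - only the
// descriptor's padding fields change.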

TEST_CASE("FoldPadLayerIntoPooling2dLayer")
{
    Graph graph;
    const unsigned int inputShape[]  = {1, 2, 2, 3};
    const unsigned int paddedShape[] = {1, 4, 4, 3};
    const unsigned int outputShape[] = {1, 2, 2, 3};

    TensorInfo inputInfo(4, inputShape, DataType::Float32);
    TensorInfo paddedInfo(4, paddedShape, DataType::Float32);
    TensorInfo outputInfo(4, outputShape, DataType::Float32);

    Layer* input = graph.AddLayer<InputLayer>(0, "input");
    input->GetOutputSlot().SetTensorInfo(inputInfo);

    PadDescriptor padDescriptor({{0, 0},
                                 {1, 1},
                                 {1, 1},
                                 {0, 0}});

    PadLayer* padLayer = graph.AddLayer<PadLayer>(padDescriptor, "pad");
    padLayer->GetOutputSlot().SetTensorInfo(paddedInfo);

    Pooling2dDescriptor pooling2dDescriptor;
    pooling2dDescriptor.m_PoolType   = PoolingAlgorithm::Average;
    pooling2dDescriptor.m_PoolWidth  = 3;
    pooling2dDescriptor.m_PoolHeight = 3;
    pooling2dDescriptor.m_StrideX    = 1;
    pooling2dDescriptor.m_StrideY    = 1;
    pooling2dDescriptor.m_DataLayout = DataLayout::NHWC;

    Pooling2dLayer* pool2dLayer = graph.AddLayer<Pooling2dLayer>(pooling2dDescriptor, "pool2d");
    pool2dLayer->GetOutputSlot().SetTensorInfo(outputInfo);

    Layer* output = graph.AddLayer<OutputLayer>(0, "output");

    // Connect up layers - input -> pad -> pool2d -> output
    input->GetOutputSlot().Connect(padLayer->GetInputSlot(0));
    padLayer->GetOutputSlot().Connect(pool2dLayer->GetInputSlot(0));
    pool2dLayer->GetOutputSlot().Connect(output->GetInputSlot(0));

    auto checkSimplePool2d = [&](const Layer* const layer) {
        const auto pool2dLayer = static_cast<const Pooling2dLayer*>(layer);
        return IsLayerOfType<Pooling2dLayer>(layer) && (layer->GetNameStr() == "pool2d") &&
               (pool2dLayer->GetParameters() == pooling2dDescriptor);
    };

    CHECK(CheckSequence(graph.cbegin(), graph.cend(),
                        &IsLayerOfType<InputLayer>,
                        &IsLayerOfType<PadLayer>,
                        checkSimplePool2d,
                        &IsLayerOfType<OutputLayer>));

    armnn::Optimizer::Pass(graph, MakeOptimizations(FoldPadIntoPooling2d()));

    auto checkPadFoldedIntoPool2d = [&](const Layer* const layer) {
        if (!IsLayerOfType<Pooling2dLayer>(layer) || (layer->GetNameStr() != "folded-pad-into-pool2d"))
        {
            return false;
        }

        const auto pool2dLayer = static_cast<const Pooling2dLayer*>(layer);
        const Pooling2dDescriptor pool2dLayerParams = pool2dLayer->GetParameters();

        Pooling2dDescriptor pool2dLayerParamsNoPad = pool2dLayerParams;
        pool2dLayerParamsNoPad.m_PadLeft   = 0;
        pool2dLayerParamsNoPad.m_PadRight  = 0;
        pool2dLayerParamsNoPad.m_PadTop    = 0;
        pool2dLayerParamsNoPad.m_PadBottom = 0;
        // If we fold, the PaddingMethod is set to IgnoreValue; the original is Exclude.
        pool2dLayerParamsNoPad.m_PaddingMethod = PaddingMethod::Exclude;

        return (pool2dLayerParamsNoPad == pooling2dDescriptor) && (pool2dLayerParams.m_PadLeft == 1) &&
               (pool2dLayerParams.m_PadRight == 1) && (pool2dLayerParams.m_PadTop == 1) &&
               (pool2dLayerParams.m_PadBottom == 1) &&
               (pool2dLayerParams.m_PaddingMethod == PaddingMethod::IgnoreValue);
    };

    CHECK(CheckSequence(graph.cbegin(), graph.cend(),
                        &IsLayerOfType<InputLayer>,
                        checkPadFoldedIntoPool2d,
                        &IsLayerOfType<OutputLayer>));
}
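
// Why the folded descriptor switches to PaddingMethod::IgnoreValue: with the
// explicit Pad layer in place, a 3x3 average window overlapping one padded row
// reads three real zeros and divides by the full 9. After folding, those zeros
// come from the pooling layer's implicit padding instead; IgnoreValue keeps
// them in the divisor (still 9), whereas Exclude would divide by only the 6
// real elements and change the result.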

TEST_CASE("FoldPadLayerIntoPooling2d_PadWithMultipleOutputsShouldNotBeOptimized")
{
    // In this test case we set up a pad layer with two outputs: one goes to a
    // pooling layer and the other to an output layer. FoldPadLayerIntoPooling2d
    // should not optimize this graph, as it uses the OptimizeForExclusiveConnection
    // method.
    Graph graph;
    const unsigned int inputShape[]  = {1, 2, 2, 3};
    const unsigned int paddedShape[] = {1, 4, 4, 3};
    const unsigned int outputShape[] = {1, 2, 2, 3};

    TensorInfo inputInfo(4, inputShape, DataType::Float32);
    TensorInfo paddedInfo(4, paddedShape, DataType::Float32);
    TensorInfo outputInfo(4, outputShape, DataType::Float32);

    Layer* input = graph.AddLayer<InputLayer>(0, "input");
    input->GetOutputSlot().SetTensorInfo(inputInfo);

    PadDescriptor padDescriptor({{0, 0},
                                 {1, 1},
                                 {1, 1},
                                 {0, 0}});

    PadLayer* padLayer = graph.AddLayer<PadLayer>(padDescriptor, "pad");
    padLayer->GetOutputSlot().SetTensorInfo(paddedInfo);

    Pooling2dDescriptor pooling2dDescriptor;
    pooling2dDescriptor.m_PoolType   = PoolingAlgorithm::Average;
    pooling2dDescriptor.m_PoolWidth  = 3;
    pooling2dDescriptor.m_PoolHeight = 3;
    pooling2dDescriptor.m_StrideX    = 1;
    pooling2dDescriptor.m_StrideY    = 1;
    pooling2dDescriptor.m_DataLayout = DataLayout::NHWC;

    Pooling2dLayer* pool2dLayer = graph.AddLayer<Pooling2dLayer>(pooling2dDescriptor, "pool2d");
    pool2dLayer->GetOutputSlot().SetTensorInfo(outputInfo);

    Layer* output = graph.AddLayer<OutputLayer>(0, "output");

    // Connect up layers - input -> pad -> pool2d -> output
    input->GetOutputSlot().Connect(padLayer->GetInputSlot(0));
    padLayer->GetOutputSlot().Connect(pool2dLayer->GetInputSlot(0));
    pool2dLayer->GetOutputSlot().Connect(output->GetInputSlot(0));

    // Add the alternative branch from the pad layer to an output layer.
    Layer* secondOutput = graph.AddLayer<OutputLayer>(1, "dummy output");
    padLayer->GetOutputSlot().Connect(secondOutput->GetInputSlot(0));

    auto checkSimplePool2d = [&](const Layer* const layer) {
        const auto pool2dLayer = static_cast<const Pooling2dLayer*>(layer);
        return IsLayerOfType<Pooling2dLayer>(layer) && (layer->GetNameStr() == "pool2d") &&
               (pool2dLayer->GetParameters() == pooling2dDescriptor);
    };

    // Initial sequence.
    CHECK(CheckSequence(graph.cbegin(), graph.cend(),
                        &IsLayerOfType<InputLayer>,
                        &IsLayerOfType<PadLayer>,
                        checkSimplePool2d,
                        &IsLayerOfType<OutputLayer>,
                        &IsLayerOfType<OutputLayer>));

    armnn::Optimizer::Pass(graph, MakeOptimizations(FoldPadIntoPooling2d()));

    // The network should not change.
    CHECK(CheckSequence(graph.cbegin(), graph.cend(),
                        &IsLayerOfType<InputLayer>,
                        &IsLayerOfType<PadLayer>,
                        checkSimplePool2d,
                        &IsLayerOfType<OutputLayer>,
                        &IsLayerOfType<OutputLayer>));
}
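
// The guard exercised above is the "exclusive connection" requirement:
// OptimizeForExclusiveConnection only fires when the Pad layer's output feeds
// exactly one input slot. A rough way to state the failing precondition in
// this test (GetNumConnections() on OutputSlot is assumed here):
//
//     CHECK(padLayer->GetOutputSlot().GetNumConnections() == 2); // not exclusive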

TEST_CASE("FoldPadLayerIntoPooling2dLayer_PoolingLayerWithExcludePaddingShouldNotTakeMorePadding")
{
    // This test sets up input -> Pad -> pooling layer that already includes
    // padding -> output. The optimization should not fire, as the pooling layer
    // already has existing padding and specifies PaddingMethod::Exclude.
    Graph graph;
    const unsigned int inputShape[]  = {1, 2, 2, 3};
    const unsigned int paddedShape[] = {1, 4, 4, 3};
    const unsigned int outputShape[] = {1, 2, 2, 3};

    TensorInfo inputInfo(4, inputShape, DataType::Float32);
    TensorInfo paddedInfo(4, paddedShape, DataType::Float32);
    TensorInfo outputInfo(4, outputShape, DataType::Float32);

    Layer* input = graph.AddLayer<InputLayer>(0, "input");
    input->GetOutputSlot().SetTensorInfo(inputInfo);

    PadDescriptor padDescriptor({{0, 0},
                                 {1, 1},
                                 {1, 1},
                                 {0, 0}});

    PadLayer* padLayer = graph.AddLayer<PadLayer>(padDescriptor, "pad");
    padLayer->GetOutputSlot().SetTensorInfo(paddedInfo);

    Pooling2dDescriptor pooling2dDescriptor;
    pooling2dDescriptor.m_PoolType   = PoolingAlgorithm::Average;
    pooling2dDescriptor.m_PoolWidth  = 3;
    pooling2dDescriptor.m_PoolHeight = 3;
    pooling2dDescriptor.m_StrideX    = 1;
    pooling2dDescriptor.m_StrideY    = 1;
    pooling2dDescriptor.m_DataLayout = DataLayout::NHWC;
    // Include padding with the pooling layer. This should prevent the optimization from working.
    pooling2dDescriptor.m_PadLeft       = 1;
    pooling2dDescriptor.m_PadRight      = 1;
    pooling2dDescriptor.m_PadTop        = 1;
    pooling2dDescriptor.m_PadBottom     = 1;
    pooling2dDescriptor.m_PaddingMethod = PaddingMethod::Exclude;

    Pooling2dLayer* pool2dLayer = graph.AddLayer<Pooling2dLayer>(pooling2dDescriptor, "pool2d");
    pool2dLayer->GetOutputSlot().SetTensorInfo(outputInfo);

    Layer* output = graph.AddLayer<OutputLayer>(0, "output");

    // Connect up layers - input -> pad -> pool2d -> output
    input->GetOutputSlot().Connect(padLayer->GetInputSlot(0));
    padLayer->GetOutputSlot().Connect(pool2dLayer->GetInputSlot(0));
    pool2dLayer->GetOutputSlot().Connect(output->GetInputSlot(0));

    auto checkSimplePool2d = [&](const Layer* const layer) {
        const auto pool2dLayer = static_cast<const Pooling2dLayer*>(layer);
        return IsLayerOfType<Pooling2dLayer>(layer) && (layer->GetNameStr() == "pool2d") &&
               (pool2dLayer->GetParameters() == pooling2dDescriptor);
    };

    CHECK(CheckSequence(graph.cbegin(), graph.cend(),
                        &IsLayerOfType<InputLayer>,
                        &IsLayerOfType<PadLayer>,
                        checkSimplePool2d,
                        &IsLayerOfType<OutputLayer>));

    armnn::Optimizer::Pass(graph, MakeOptimizations(FoldPadIntoPooling2d()));

    // The optimization should not have modified the graph.
    CHECK(CheckSequence(graph.cbegin(), graph.cend(),
                        &IsLayerOfType<InputLayer>,
                        &IsLayerOfType<PadLayer>,
                        checkSimplePool2d,
                        &IsLayerOfType<OutputLayer>));
}

TEST_CASE("FoldPadLayerIntoPooling2dLayer_MaxPoolingLayerWithLargePadValueShouldNotBeFolded")
{
    // This test sets up input -> Pad (with a large pad value) -> max pooling -> output.
    // The optimization should not fire, as the pad value would modify the result
    // of the max pooling layer.
    Graph graph;
    const unsigned int inputShape[]  = {1, 2, 2, 3};
    const unsigned int paddedShape[] = {1, 4, 4, 3};
    const unsigned int outputShape[] = {1, 2, 2, 3};

    TensorInfo inputInfo(4, inputShape, DataType::Float32);
    TensorInfo paddedInfo(4, paddedShape, DataType::Float32);
    TensorInfo outputInfo(4, outputShape, DataType::Float32);

    Layer* input = graph.AddLayer<InputLayer>(0, "input");
    input->GetOutputSlot().SetTensorInfo(inputInfo);

    PadDescriptor padDescriptor({{0, 0},
                                 {1, 1},
                                 {1, 1},
                                 {0, 0}});
    // For max pooling of floats, a pad value of 0 is more than enough to stop the fold happening.
    // Set this to -std::numeric_limits<float>::infinity() to make the fold happen.
    padDescriptor.m_PadValue = 0;

    PadLayer* padLayer = graph.AddLayer<PadLayer>(padDescriptor, "pad");
    padLayer->GetOutputSlot().SetTensorInfo(paddedInfo);

    Pooling2dDescriptor pooling2dDescriptor;
    pooling2dDescriptor.m_PoolType   = PoolingAlgorithm::Max;
    pooling2dDescriptor.m_PoolWidth  = 3;
    pooling2dDescriptor.m_PoolHeight = 3;
    pooling2dDescriptor.m_StrideX    = 1;
    pooling2dDescriptor.m_StrideY    = 1;
    pooling2dDescriptor.m_DataLayout = DataLayout::NHWC;

    Pooling2dLayer* pool2dLayer = graph.AddLayer<Pooling2dLayer>(pooling2dDescriptor, "pool2d");
    pool2dLayer->GetOutputSlot().SetTensorInfo(outputInfo);

    Layer* output = graph.AddLayer<OutputLayer>(0, "output");

    // Connect up layers - input -> pad -> pool2d -> output
    input->GetOutputSlot().Connect(padLayer->GetInputSlot(0));
    padLayer->GetOutputSlot().Connect(pool2dLayer->GetInputSlot(0));
    pool2dLayer->GetOutputSlot().Connect(output->GetInputSlot(0));

    auto checkSimplePool2d = [&](const Layer* const layer) {
        const auto pool2dLayer = static_cast<const Pooling2dLayer*>(layer);
        return IsLayerOfType<Pooling2dLayer>(layer) && (layer->GetNameStr() == "pool2d") &&
               (pool2dLayer->GetParameters() == pooling2dDescriptor);
    };

    CHECK(CheckSequence(graph.cbegin(), graph.cend(),
                        &IsLayerOfType<InputLayer>,
                        &IsLayerOfType<PadLayer>,
                        checkSimplePool2d,
                        &IsLayerOfType<OutputLayer>));

    armnn::Optimizer::Pass(graph, MakeOptimizations(FoldPadIntoPooling2d()));

    // The optimization should not have modified the graph.
    CHECK(CheckSequence(graph.cbegin(), graph.cend(),
                        &IsLayerOfType<InputLayer>,
                        &IsLayerOfType<PadLayer>,
                        checkSimplePool2d,
                        &IsLayerOfType<OutputLayer>));
}
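
// Why a pad value of 0 blocks the max pooling fold: a pooling layer's implicit
// padding behaves as if the border were filled with the lowest representable
// value, so over an all-negative window a folded max pool would return a real
// input value, while the explicit Pad layer's zeros would win and return 0.
// The fold is therefore only safe when the pad value can never exceed any real
// input, e.g. -std::numeric_limits<float>::infinity().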

TEST_CASE("FoldPadLayerIntoPooling2dLayer_QuantizedAveragePoolingShouldNotBeFolded")
{
    Graph graph;
    const unsigned int inputShape[]  = {1, 2, 2, 3};
    const unsigned int paddedShape[] = {1, 4, 4, 3};
    const unsigned int outputShape[] = {1, 2, 2, 3};

    TensorInfo inputInfo(4, inputShape, DataType::QAsymmU8);
    TensorInfo paddedInfo(4, paddedShape, DataType::QAsymmU8);
    TensorInfo outputInfo(4, outputShape, DataType::QAsymmU8);

    Layer* input = graph.AddLayer<InputLayer>(0, "input");
    input->GetOutputSlot().SetTensorInfo(inputInfo);

    PadDescriptor padDescriptor({{0, 0},
                                 {1, 1},
                                 {1, 1},
                                 {0, 0}});

    PadLayer* padLayer = graph.AddLayer<PadLayer>(padDescriptor, "pad");
    padLayer->GetOutputSlot().SetTensorInfo(paddedInfo);

    Pooling2dDescriptor pooling2dDescriptor;
    pooling2dDescriptor.m_PoolType   = PoolingAlgorithm::Average;
    pooling2dDescriptor.m_PoolWidth  = 3;
    pooling2dDescriptor.m_PoolHeight = 3;
    pooling2dDescriptor.m_StrideX    = 1;
    pooling2dDescriptor.m_StrideY    = 1;
    pooling2dDescriptor.m_DataLayout = DataLayout::NHWC;

    Pooling2dLayer* pool2dLayer = graph.AddLayer<Pooling2dLayer>(pooling2dDescriptor, "pool2d");
    pool2dLayer->GetOutputSlot().SetTensorInfo(outputInfo);

    Layer* output = graph.AddLayer<OutputLayer>(0, "output");

    // Connect up layers - input -> pad -> pool2d -> output
    input->GetOutputSlot().Connect(padLayer->GetInputSlot(0));
    padLayer->GetOutputSlot().Connect(pool2dLayer->GetInputSlot(0));
    pool2dLayer->GetOutputSlot().Connect(output->GetInputSlot(0));

    auto checkSimplePool2d = [&](const Layer* const layer) {
        const auto pool2dLayer = static_cast<const Pooling2dLayer*>(layer);
        return IsLayerOfType<Pooling2dLayer>(layer) && (layer->GetNameStr() == "pool2d") &&
               (pool2dLayer->GetParameters() == pooling2dDescriptor);
    };

    CHECK(CheckSequence(graph.cbegin(), graph.cend(),
                        &IsLayerOfType<InputLayer>,
                        &IsLayerOfType<PadLayer>,
                        checkSimplePool2d,
                        &IsLayerOfType<OutputLayer>));

    armnn::Optimizer::Pass(graph, MakeOptimizations(FoldPadIntoPooling2d()));

    // The optimization should not have modified the graph.
    CHECK(CheckSequence(graph.cbegin(), graph.cend(),
                        &IsLayerOfType<InputLayer>,
                        &IsLayerOfType<PadLayer>,
                        checkSimplePool2d,
                        &IsLayerOfType<OutputLayer>));
}

#if defined(ARMNNREF_ENABLED)
TEST_CASE("FoldPadLayerIntoPooling2dLayer_ExecuteInferenceWithAndWithoutOptimization")
{
    // The idea of this test is to run a simple pad+pool2d network twice. Once
    // with FoldPadLayerIntoPooling2dLayer enabled and a second time with it
    // avoided. The output tensors of each should match.
    const unsigned int inputShape[]  = {1, 4, 4, 2};
    const unsigned int paddedShape[] = {1, 6, 6, 2};
    const unsigned int outputShape[] = {1, 4, 4, 2};
    std::vector<float> inputData({2.0f, 2.0f, 6.0f, 6.0f,
                                  4.0f, 4.0f, 8.0f, 8.0f,
                                  10.0f, 12.0f, 14.0f, 16.0f,
                                  10.0f, 12.0f, 16.0f, 14.0f,

                                  18.0f, 20.0f, 24.0f, 22.0f,
                                  20.0f, 18.0f, 22.0f, 24.0f,
                                  26.0f, 28.0f, 0.0f, 0.0f,
                                  26.0f, 28.0f, 0.0f, 0.0f,
                                 });
    try
    {
        // Create a network of input, pad, pooling 2D, output.
        INetworkPtr network = INetwork::Create();

        IConnectableLayer* inputLayer = network->AddInputLayer(0);
        TensorInfo inputInfo(4, inputShape, DataType::Float32);
        inputLayer->GetOutputSlot(0).SetTensorInfo(inputInfo);

        PadDescriptor padDescriptor({{0, 0},
                                     {1, 1},
                                     {1, 1},
                                     {0, 0}});
        IConnectableLayer* padLayer = network->AddPadLayer(padDescriptor, "Pad");
        TensorInfo paddedInfo(4, paddedShape, DataType::Float32);
        padLayer->GetOutputSlot(0).SetTensorInfo(paddedInfo);

        Pooling2dDescriptor pooling2dDescriptor;
        pooling2dDescriptor.m_PoolType   = PoolingAlgorithm::Average;
        pooling2dDescriptor.m_PoolWidth  = 3;
        pooling2dDescriptor.m_PoolHeight = 3;
        pooling2dDescriptor.m_StrideX    = 1;
        pooling2dDescriptor.m_StrideY    = 1;
        pooling2dDescriptor.m_DataLayout = DataLayout::NHWC;
        IConnectableLayer* pool2dLayer = network->AddPooling2dLayer(pooling2dDescriptor, "Pool2D");
        TensorInfo outputInfo(4, outputShape, DataType::Float32);
        pool2dLayer->GetOutputSlot(0).SetTensorInfo(outputInfo);

        IConnectableLayer* outputLayer = network->AddOutputLayer(0);

        // Connect layers
        inputLayer->GetOutputSlot(0).Connect(padLayer->GetInputSlot(0));
        padLayer->GetOutputSlot(0).Connect(pool2dLayer->GetInputSlot(0));
        pool2dLayer->GetOutputSlot(0).Connect(outputLayer->GetInputSlot(0));

        // Create ArmNN runtime
        IRuntimePtr run = IRuntime::Create(IRuntime::CreationOptions()); // default options
        // Optimise the network
        IOptimizedNetworkPtr optimizedNetwork = Optimize(*network, {Compute::CpuRef}, run->GetDeviceSpec());
        // Load network into runtime
        NetworkId networkIdentifier;
        CHECK(run->LoadNetwork(networkIdentifier, std::move(optimizedNetwork)) == Status::Success);

        TensorInfo inputTensorInfo = run->GetInputTensorInfo(networkIdentifier, 0);
        inputTensorInfo.SetConstant(true);
        InputTensors inputTensors{{0, ConstTensor(inputTensorInfo, inputData.data())}};

        // Initialise the output data to values different from the golden data, in case the inference fails.
        std::vector<float> optimizedData(32, -std::numeric_limits<float>::infinity());
        OutputTensors outputTensors{{0, Tensor(outputInfo, optimizedData.data())}};
        // Execute network
        run->EnqueueWorkload(networkIdentifier, inputTensors, outputTensors);
        // Unload it.
        run->UnloadNetwork(networkIdentifier);

        // In this second case the pad will have two outputs, one connected to the pooling layer, the second
        // connected to a second output layer. This will prevent the FoldPadLayerIntoPooling2dLayer optimization
        // from working. A previous test, FoldPadLayerIntoPooling2d_PadWithMultipleOutputsShouldNotBeOptimized,
        // has proved that doing this will avoid the optimization.
        IConnectableLayer* dummyOutputLayer = network->AddOutputLayer(1);
        padLayer->GetOutputSlot(0).Connect(dummyOutputLayer->GetInputSlot(0));

        // Optimize, load and execute it a second time.
        optimizedNetwork = Optimize(*network, {Compute::CpuRef}, run->GetDeviceSpec());
        CHECK(run->LoadNetwork(networkIdentifier, std::move(optimizedNetwork)) == Status::Success);
        std::vector<float> goldenData(32, 0.0f);
        std::vector<float> padOutputData(72, 0.0f);
        OutputTensors goldenTensors{{0, Tensor(outputInfo, goldenData.data())},
                                    {1, Tensor(paddedInfo, padOutputData.data())}};
        run->EnqueueWorkload(networkIdentifier, inputTensors, goldenTensors);

        // Now we can compare goldenData against optimizedData. They should be the same.
        CHECK(std::equal(goldenData.begin(), goldenData.end(), optimizedData.begin()));
    }
    catch (const std::exception& e)
    {
        std::cerr << e.what() << std::endl;
        ARMNN_ASSERT_MSG(false, e.what());
    }
}
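
// Note on the second run above: once the dummy output layer is connected, the
// loaded network has two outputs, so EnqueueWorkload must bind both - hence
// goldenTensors carries a second entry (72 floats = 6x6x2) that captures the
// Pad layer's output alongside the pooled result.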

TEST_CASE("FoldPadLayerIntoConv2dLayer_ExecuteInferenceWithAndWithoutOptimization")
{
    // The idea of this test is to run a simple pad+conv2d network twice. Once
    // with FoldPadLayerIntoConv2dLayer enabled and a second time with it
    // avoided. The output tensors of each should match.
    const unsigned int inputShape[]   = {1, 4, 4, 3}; // NHWCin
    const unsigned int paddedShape[]  = {1, 6, 6, 3};
    const unsigned int weightsShape[] = {4, 2, 2, 3}; // CoutHWCin
    const unsigned int outputShape[]  = {1, 5, 5, 4}; // NHWCout

    std::vector<float> inputData({2.0f, 2.0f, 6.0f, 6.0f,
                                  4.0f, 4.0f, 8.0f, 8.0f,
                                  10.0f, 12.0f, 14.0f, 16.0f,
                                  10.0f, 12.0f, 16.0f, 14.0f,

                                  18.0f, 20.0f, 24.0f, 22.0f,
                                  20.0f, 18.0f, 22.0f, 24.0f,
                                  26.0f, 28.0f, 0.0f, 0.0f,
                                  26.0f, 28.0f, 0.0f, 0.0f,

                                  2.0f, 2.0f, 6.0f, 6.0f,
                                  4.0f, 4.0f, 8.0f, 8.0f,
                                  10.0f, 12.0f, 14.0f, 16.0f,
                                  10.0f, 12.0f, 16.0f, 14.0f,
                                 });
    try
    {
        // Create a network of input, pad, convolution 2D, output.
        INetworkPtr network = INetwork::Create();

        IConnectableLayer* inputLayer = network->AddInputLayer(0);
        TensorInfo inputInfo(4, inputShape, DataType::Float32);
        inputLayer->GetOutputSlot(0).SetTensorInfo(inputInfo);

        PadDescriptor padDescriptor({{0, 0},
                                     {1, 1},
                                     {1, 1},
                                     {0, 0}});
        IConnectableLayer* padLayer = network->AddPadLayer(padDescriptor, "Pad");
        TensorInfo paddedInfo(4, paddedShape, DataType::Float32);
        padLayer->GetOutputSlot(0).SetTensorInfo(paddedInfo);

        Convolution2dDescriptor convDescriptor;
        convDescriptor.m_DataLayout  = DataLayout::NHWC;
        convDescriptor.m_StrideX     = 1;
        convDescriptor.m_StrideY     = 1;
        convDescriptor.m_BiasEnabled = true;

        std::vector<float> weightsData = {1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12,
                                          11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22,
                                          21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32,
                                          31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42};
        TensorInfo weightsInfo(4, weightsShape, DataType::Float32, 1.0f, 0, true);
        ConstTensor weights(weightsInfo, weightsData);
        std::vector<float> biasVector = {5, 6, 7, 8};
        TensorInfo biasInfo({4}, DataType::Float32, 1.0f, 0, true);
        ConstTensor bias(biasInfo, biasVector);

        IConnectableLayer* conv2dLayer = network->AddConvolution2dLayer(convDescriptor, "Conv2D");

        TensorInfo outputInfo(4, outputShape, DataType::Float32);
        conv2dLayer->GetOutputSlot(0).SetTensorInfo(outputInfo);

        IConnectableLayer* outputLayer = network->AddOutputLayer(0);

        // Connect layers
        inputLayer->GetOutputSlot(0).Connect(padLayer->GetInputSlot(0));
        padLayer->GetOutputSlot(0).Connect(conv2dLayer->GetInputSlot(0));
        conv2dLayer->GetOutputSlot(0).Connect(outputLayer->GetInputSlot(0));

        auto weightsLayer = network->AddConstantLayer(weights, "Weights");
        weightsLayer->GetOutputSlot(0).SetTensorInfo(weights.GetInfo());
        weightsLayer->GetOutputSlot(0).Connect(conv2dLayer->GetInputSlot(1));

        auto biasLayer = network->AddConstantLayer(bias, "Bias");
        biasLayer->GetOutputSlot(0).SetTensorInfo(bias.GetInfo());
        biasLayer->GetOutputSlot(0).Connect(conv2dLayer->GetInputSlot(2));

        // Create ArmNN runtime
        IRuntimePtr run = IRuntime::Create(IRuntime::CreationOptions()); // default options
        // Optimise the network
        IOptimizedNetworkPtr optimizedNetwork = Optimize(*network, {Compute::CpuRef}, run->GetDeviceSpec());
        // Load network into runtime
        NetworkId networkIdentifier;
        CHECK(run->LoadNetwork(networkIdentifier, std::move(optimizedNetwork)) == Status::Success);

        TensorInfo inputTensorInfo = run->GetInputTensorInfo(networkIdentifier, 0);
        inputTensorInfo.SetConstant(true);
        InputTensors inputTensors{{0, ConstTensor(inputTensorInfo, inputData.data())}};

        // Initialise the output data to values different from the golden data, in case the inference fails.
        std::vector<float> optimizedData(100, -std::numeric_limits<float>::infinity());
        OutputTensors outputTensors{{0, Tensor(outputInfo, optimizedData.data())}};
        // Execute network
        run->EnqueueWorkload(networkIdentifier, inputTensors, outputTensors);
        // Unload it.
        run->UnloadNetwork(networkIdentifier);

        // In this second case the pad will have two outputs, one connected to the conv layer, the second
        // connected to a second output layer. This will prevent the FoldPadLayerIntoConv2dLayer optimization
        // from working. The earlier test, FoldPadLayerIntoPooling2d_PadWithMultipleOutputsShouldNotBeOptimized,
        // has proved that doing this will avoid the optimization.
        IConnectableLayer* dummyOutputLayer = network->AddOutputLayer(1);
        padLayer->GetOutputSlot(0).Connect(dummyOutputLayer->GetInputSlot(0));

        // Optimize, load and execute it a second time.
        optimizedNetwork = Optimize(*network, {Compute::CpuRef}, run->GetDeviceSpec());
        CHECK(run->LoadNetwork(networkIdentifier, std::move(optimizedNetwork)) == Status::Success);
        std::vector<float> goldenData(100, 0.0f);
        std::vector<float> padOutputData(108, 0.0f);
        OutputTensors goldenTensors{{0, Tensor(outputInfo, goldenData.data())},
                                    {1, Tensor(paddedInfo, padOutputData.data())}};
        run->EnqueueWorkload(networkIdentifier, inputTensors, goldenTensors);

        // Now we can compare goldenData against optimizedData. They should be the same.
        CHECK(std::equal(goldenData.begin(), goldenData.end(), optimizedData.begin()));
    }
    catch (const std::exception& e)
    {
        std::cerr << e.what() << std::endl;
        ARMNN_ASSERT_MSG(false, e.what());
    }
}

TEST_CASE("FoldPadLayerIntoDepthwiseConv2dLayer_ExecuteInferenceWithAndWithoutOptimization")
{
    // The idea of this test is to run a simple pad+depthwiseConv2d network twice. Once
    // with FoldPadLayerIntoDepthwiseConv2dLayer enabled and a second time with it
    // avoided. The output tensors of each should match.
    const unsigned int inputShape[]   = {1, 4, 4, 3};  // NHWCin
    const unsigned int paddedShape[]  = {1, 6, 6, 3};
    const unsigned int weightsShape[] = {1, 2, 2, 12}; // 1HWCout
    const unsigned int outputShape[]  = {1, 5, 5, 12}; // NHWCout

    std::vector<float> inputData({2.0f, 2.0f, 6.0f, 6.0f,
                                  4.0f, 4.0f, 8.0f, 8.0f,
                                  10.0f, 12.0f, 14.0f, 16.0f,
                                  10.0f, 12.0f, 16.0f, 14.0f,

                                  18.0f, 20.0f, 24.0f, 22.0f,
                                  20.0f, 18.0f, 22.0f, 24.0f,
                                  26.0f, 28.0f, 0.0f, 0.0f,
                                  26.0f, 28.0f, 0.0f, 0.0f,

                                  2.0f, 2.0f, 6.0f, 6.0f,
                                  4.0f, 4.0f, 8.0f, 8.0f,
                                  10.0f, 12.0f, 14.0f, 16.0f,
                                  10.0f, 12.0f, 16.0f, 14.0f,
                                 });
    try
    {
        // Create a network of input, pad, depthwise convolution 2D, output.
        INetworkPtr network = INetwork::Create();

        IConnectableLayer* inputLayer = network->AddInputLayer(0);
        TensorInfo inputInfo(4, inputShape, DataType::Float32);
        inputLayer->GetOutputSlot(0).SetTensorInfo(inputInfo);

        PadDescriptor padDescriptor({{0, 0},
                                     {1, 1},
                                     {1, 1},
                                     {0, 0}});
        IConnectableLayer* padLayer = network->AddPadLayer(padDescriptor, "Pad");
        TensorInfo paddedInfo(4, paddedShape, DataType::Float32);
        padLayer->GetOutputSlot(0).SetTensorInfo(paddedInfo);

        DepthwiseConvolution2dDescriptor convDescriptor;
        convDescriptor.m_DataLayout  = DataLayout::NHWC;
        convDescriptor.m_StrideX     = 1;
        convDescriptor.m_StrideY     = 1;
        convDescriptor.m_BiasEnabled = true;

        std::vector<float> weightsData = {1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12,
                                          11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22,
                                          21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32,
                                          31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42};
        TensorInfo weightsInfo(4, weightsShape, DataType::Float32, 0.0f, 0, true);
        ConstTensor weights(weightsInfo, weightsData);
        std::vector<float> biasVector = {5, 6, 7, 8, 9, 10, 11, 12, 5, 6, 7, 8};
        TensorInfo biasInfo({12}, DataType::Float32, 0.0f, 0, true);
        ConstTensor bias(biasInfo, biasVector);

        IConnectableLayer* conv2dLayer = network->AddDepthwiseConvolution2dLayer(convDescriptor,
                                                                                 "DepthwiseConv2D");

        TensorInfo outputInfo(4, outputShape, DataType::Float32);
        conv2dLayer->GetOutputSlot(0).SetTensorInfo(outputInfo);

        IConnectableLayer* outputLayer = network->AddOutputLayer(0);

        // Connect layers
        inputLayer->GetOutputSlot(0).Connect(padLayer->GetInputSlot(0));
        padLayer->GetOutputSlot(0).Connect(conv2dLayer->GetInputSlot(0));
        conv2dLayer->GetOutputSlot(0).Connect(outputLayer->GetInputSlot(0));

        auto weightsLayer = network->AddConstantLayer(weights, "Weights");
        weightsLayer->GetOutputSlot(0).SetTensorInfo(weights.GetInfo());
        weightsLayer->GetOutputSlot(0).Connect(conv2dLayer->GetInputSlot(1));

        auto biasLayer = network->AddConstantLayer(bias, "Bias");
        biasLayer->GetOutputSlot(0).SetTensorInfo(bias.GetInfo());
        biasLayer->GetOutputSlot(0).Connect(conv2dLayer->GetInputSlot(2));

        // Create ArmNN runtime
        IRuntimePtr run = IRuntime::Create(IRuntime::CreationOptions()); // default options
        // Optimise the network
        IOptimizedNetworkPtr optimizedNetwork = Optimize(*network, {Compute::CpuRef}, run->GetDeviceSpec());
        // Load network into runtime
        NetworkId networkIdentifier;
        CHECK(run->LoadNetwork(networkIdentifier, std::move(optimizedNetwork)) == Status::Success);

        TensorInfo inputTensorInfo = run->GetInputTensorInfo(networkIdentifier, 0);
        inputTensorInfo.SetConstant(true);
        InputTensors inputTensors{{0, ConstTensor(inputTensorInfo, inputData.data())}};

        // Initialise the output data to values different from the golden data, in case the inference fails.
        std::vector<float> optimizedData(300, -std::numeric_limits<float>::infinity());
        OutputTensors outputTensors{{0, Tensor(outputInfo, optimizedData.data())}};
        // Execute network
        run->EnqueueWorkload(networkIdentifier, inputTensors, outputTensors);
        // Unload it.
        run->UnloadNetwork(networkIdentifier);

        // In this second case the pad will have two outputs, one connected to the conv layer, the second
        // connected to a second output layer. This will prevent the FoldPadLayerIntoDepthwiseConv2dLayer
        // optimization from working. The earlier test,
        // FoldPadLayerIntoPooling2d_PadWithMultipleOutputsShouldNotBeOptimized, has proved that doing this
        // will avoid the optimization.
        IConnectableLayer* dummyOutputLayer = network->AddOutputLayer(1);
        padLayer->GetOutputSlot(0).Connect(dummyOutputLayer->GetInputSlot(0));

        // Optimize, load and execute it a second time.
        optimizedNetwork = Optimize(*network, {Compute::CpuRef}, run->GetDeviceSpec());
        CHECK(run->LoadNetwork(networkIdentifier, std::move(optimizedNetwork)) == Status::Success);
        std::vector<float> goldenData(300, 0.0f);
        std::vector<float> padOutputData(108, 0.0f);
        OutputTensors goldenTensors{{0, Tensor(outputInfo, goldenData.data())},
                                    {1, Tensor(paddedInfo, padOutputData.data())}};
        run->EnqueueWorkload(networkIdentifier, inputTensors, goldenTensors);

        // Now we can compare goldenData against optimizedData. They should be the same.
        CHECK(std::equal(goldenData.begin(), goldenData.end(), optimizedData.begin()));
    }
    catch (const std::exception& e)
    {
        std::cerr << e.what() << std::endl;
        ARMNN_ASSERT_MSG(false, e.what());
    }
}
#endif

}