Diffstat (limited to 'src/armnnTfLiteParser/TfLiteParser.cpp')
-rw-r--r--  src/armnnTfLiteParser/TfLiteParser.cpp  1440
1 file changed, 1440 insertions, 0 deletions
diff --git a/src/armnnTfLiteParser/TfLiteParser.cpp b/src/armnnTfLiteParser/TfLiteParser.cpp
new file mode 100644
index 0000000000..d5c48a10e2
--- /dev/null
+++ b/src/armnnTfLiteParser/TfLiteParser.cpp
@@ -0,0 +1,1440 @@
+//
+// Copyright © 2017 Arm Ltd. All rights reserved.
+// See LICENSE file in the project root for full license information.
+//
+#include "TfLiteParser.hpp"
+
+#include <armnn/ArmNN.hpp>
+#include <armnn/Exceptions.hpp>
+#include <armnn/TypesUtils.hpp>
+#include <boost/filesystem.hpp>
+
+// armnnUtils:
+#include <Permute.hpp>
+#include <VerificationHelpers.hpp>
+
+// The generated code based on the TfLite schema:
+#include <schema_generated.h>
+
+#include <boost/core/ignore_unused.hpp>
+#include <boost/assert.hpp>
+#include <boost/format.hpp>
+#include <boost/log/trivial.hpp>
+
+#include <fstream>
+#include <algorithm>
+#include <limits>
+
+using namespace armnn;
+using armnn::CheckLocation;
+namespace armnnTfLiteParser
+{
+namespace
+{
+const PermutationVector NHWCToArmNN = { 0, 2, 3, 1 };
+const PermutationVector ArmNNToNHWC = { 0, 3, 1, 2 };
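+// Each permutation vector maps source dimension i to destination dimension
+// mapping[i]. As an illustrative example, NHWCToArmNN turns an NHWC shape of
+// {1, 224, 224, 3} into the ArmNN (NCHW) shape {1, 3, 224, 224}.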
+
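+// used when registering slots for the graph-level input and output layers,
+// which have no corresponding operator in the model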
+const uint32_t VIRTUAL_OPERATOR_ID = std::numeric_limits<uint32_t>::max();
+
+void CheckSubgraph(const TfLiteParser::ModelPtr & model,
+ size_t subgraphIndex,
+ const CheckLocation & location)
+{
+ if (model.get() == nullptr)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with invalid (null) model. "
+ "Possible reason is that the model is not yet loaded and Unpack(ed). "
+ "subgraph:%2% at %3%") %
+ location.m_Function %
+ subgraphIndex %
+ location.FileLine()));
+ }
+ else if (subgraphIndex >= model->subgraphs.size())
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with an invalid subgraph index. "
+ "subgraph:%2% at %3%") %
+ location.m_Function %
+ subgraphIndex %
+ location.FileLine()));
+ }
+}
+
+#define CHECK_SUBGRAPH(MODEL, SUBGRAPH_INDEX) \
+ CheckSubgraph(MODEL, SUBGRAPH_INDEX, CHECK_LOCATION())
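+
+// note: each CHECK_* macro captures the call site via CHECK_LOCATION() so that
+// the exceptions raised report the file and line where the check was invoked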
+
+void CheckModel(const TfLiteParser::ModelPtr & model,
+ size_t subgraphIndex,
+ size_t operatorIndex,
+ const CheckLocation & location)
+{
+ if (model.get() == nullptr)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with invalid (null) model. "
+ "Possible reason is that the model is not yet loaded and Unpack(ed). "
+ "subgraph:%2% operator:%3% at %4%") %
+ location.m_Function %
+ subgraphIndex %
+ operatorIndex %
+ location.FileLine()));
+ }
+ else if (subgraphIndex >= model->subgraphs.size())
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with an invalid subgraph index. "
+ "subgraph:%2% operator:%3% at %4%") %
+ location.m_Function %
+ subgraphIndex %
+ operatorIndex %
+ location.FileLine()));
+ }
+ else if (operatorIndex >= model->subgraphs[subgraphIndex]->operators.size() &&
+ operatorIndex != VIRTUAL_OPERATOR_ID)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with an invalid operator index. "
+ "subgraph:%2% operator:%3% at %4%") %
+ location.m_Function %
+ subgraphIndex %
+ operatorIndex %
+ location.FileLine()));
+ }
+}
+
+#define CHECK_MODEL(MODEL, SUBGRAPH_INDEX, OPERATOR_INDEX) \
+ CheckModel(MODEL, SUBGRAPH_INDEX, OPERATOR_INDEX, CHECK_LOCATION())
+
+void CheckTensor(const TfLiteParser::ModelPtr & model,
+ size_t subgraphIndex,
+ size_t tensorIndex,
+ const CheckLocation & location)
+{
+    // the model is not checked here because CHECK_MODEL is assumed to have
+    // run already and verified it; an assert is sufficient
+ BOOST_ASSERT_MSG(model.get() != nullptr, "Expecting a valid model in this function");
+
+    // the subgraph index should likewise already have been checked by
+    // CHECK_MODEL, so only an assert is added here
+ BOOST_ASSERT_MSG(subgraphIndex < model->subgraphs.size(), "Expecting a valid subgraph index");
+
+ // the tensor index is the only one to check here
+ if (tensorIndex >= model->subgraphs[subgraphIndex]->tensors.size())
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with an invalid tensor index. "
+ "subgraph:%2% tensor:%3% at %4%") %
+ location.m_Function %
+ subgraphIndex %
+ tensorIndex %
+ location.FileLine()));
+ }
+}
+
+#define CHECK_TENSOR(MODEL, SUBGRAPH_INDEX, TENSOR_INDEX) \
+ CheckTensor(MODEL, SUBGRAPH_INDEX, TENSOR_INDEX, CHECK_LOCATION())
+
+void CheckTensorPtr(TfLiteParser::TensorRawPtr rawPtr,
+ const CheckLocation & location)
+{
+ if (rawPtr == nullptr)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with a null tensor pointer. "
+ "at %2%") %
+ location.m_Function %
+ location.FileLine()));
+
+ }
+}
+
+#define CHECK_TENSOR_PTR(TENSOR_PTR) \
+ CheckTensorPtr(TENSOR_PTR, CHECK_LOCATION())
+
+void CheckBuffer(const TfLiteParser::ModelPtr & model,
+ size_t bufferIndex,
+ const CheckLocation & location)
+{
+ if (model.get() == nullptr)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with invalid (null) model. "
+ "Possible reason is that the model is not yet loaded and Unpack(ed). "
+ "buffer:%2% at %3%") %
+ location.m_Function %
+ bufferIndex %
+ location.FileLine()));
+ }
+ else if (bufferIndex >= model->buffers.size())
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with an invalid buffer index. "
+ "buffer index:%2% at %3%") %
+ location.m_Function %
+ bufferIndex %
+ location.FileLine()));
+ }
+ else if (model->buffers[bufferIndex].get() == nullptr)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("The buffer #%1% is null. %3%") %
+ bufferIndex %
+ location.AsString()));
+ }
+}
+
+#define CHECK_BUFFER(MODEL, BUFFER_INDEX) \
+ CheckBuffer(MODEL, BUFFER_INDEX, CHECK_LOCATION())
+
+void CheckBufferSize(TfLiteParser::BufferRawPtr bufferPtr,
+ const armnn::TensorInfo & tensorInfo,
+ uint32_t bufferId,
+ const CheckLocation & location)
+{
+ if (bufferPtr == nullptr)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("BufferPtr is null for buffer:%1%. %2%") %
+ bufferId %
+ location.AsString()));
+ }
+    else if (tensorInfo.GetNumElements() > bufferPtr->data.size() ||
+ tensorInfo.GetNumBytes() > bufferPtr->data.size())
+ {
+ std::stringstream ss;
+ ss << "Buffer #" << bufferId << " has " << bufferPtr->data.size() << " bytes. "
+ << "For tensor: " << tensorInfo.GetShape()
+ << " expecting: " << tensorInfo.GetNumBytes() << " bytes and "
+ << tensorInfo.GetNumElements() << " elements. " << location.AsString();
+ throw ParseException(ss.str());
+ }
+}
+
+#define CHECK_BUFFER_SIZE(BUFFER_PTR, TENSOR_INFO, BUFFER_ID) \
+ CheckBufferSize(BUFFER_PTR, TENSOR_INFO, BUFFER_ID, CHECK_LOCATION())
+
+bool IsActivationSupported(tflite::ActivationFunctionType activationType)
+{
+ switch(activationType)
+ {
+ case tflite::ActivationFunctionType_NONE:
+ case tflite::ActivationFunctionType_RELU:
+ case tflite::ActivationFunctionType_RELU6:
+ case tflite::ActivationFunctionType_TANH:
+ {
+ return true;
+ }
+ default:
+ {
+ return false;
+ }
+ }
+}
+
+#define CHECK_SUPPORTED_FUSED_ACTIVATION(OPTION, SUBGRAPH_INDEX, OPERATOR_INDEX) \
+ do { \
+ if (IsActivationSupported(OPTION->fused_activation_function) == false) \
+ { \
+ throw ParseException( \
+ boost::str( \
+ boost::format("TfLite parser doesn't suppport fused activation: " \
+ "%1%/%2% in %3% subgraph:%4% operator:%5% at %6%") % \
+ OPTION->fused_activation_function % \
+ tflite::EnumNameActivationFunctionType(\
+ OPTION->fused_activation_function) % \
+ __func__ % \
+ SUBGRAPH_INDEX % \
+ OPERATOR_INDEX % \
+ CHECK_LOCATION().FileLine())); \
+ } \
+ } while(false)
+
+
+std::vector<unsigned int> AsUnsignedVector(const std::vector<int32_t> & in)
+{
+ std::vector<unsigned int> result;
+ result.reserve(in.size());
+ for (auto & i : in)
+ {
+ result.push_back(CHECKED_NON_NEGATIVE(i));
+ }
+ return result;
+}
+
+void CalcPadding(uint32_t inputSize,
+ uint32_t filterSize,
+ uint32_t stride,
+ uint32_t& paddingFront,
+ uint32_t& paddingBack,
+ tflite::Padding padding)
+{
+ paddingFront = 0;
+ paddingBack = 0;
+ if (padding == tflite::Padding_SAME)
+ {
+ uint32_t outputSize = (inputSize + stride - 1) / stride;
+ uint32_t temp = (outputSize - 1) * stride + filterSize;
+ if (temp > inputSize)
+ {
+ paddingFront = (temp - inputSize) / 2;
+ paddingBack = (temp - inputSize) - paddingFront;
+ }
+ }
+}
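+
+// A quick worked example of the SAME-padding arithmetic above (illustrative
+// values, not from any particular model): inputSize=224, filterSize=3,
+// stride=2 gives outputSize=(224+2-1)/2=112 and temp=(112-1)*2+3=225, so
+// paddingFront=(225-224)/2=0 and paddingBack=1.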
+
+armnn::TensorInfo ToTensorInfo(TfLiteParser::TensorRawPtr tensorPtr)
+{
+ armnn::DataType type;
+ CHECK_TENSOR_PTR(tensorPtr);
+
+ switch (tensorPtr->type)
+ {
+ case tflite::TensorType_UINT8:
+ type = armnn::DataType::QuantisedAsymm8;
+ break;
+ case tflite::TensorType_FLOAT32:
+ type = armnn::DataType::Float32;
+ break;
+ case tflite::TensorType_INT32:
+ type = armnn::DataType::Signed32;
+ break;
+
+ default:
+ {
+ CheckLocation location = CHECK_LOCATION();
+ throw ParseException(
+ boost::str(
+ boost::format("Unsupported data type %1% = %2% for tensor: %3%. %4%") %
+ tensorPtr->type %
+ tflite::EnumNameTensorType(tensorPtr->type) %
+ tensorPtr->name %
+ location.AsString()));
+ }
+ }
+
+ float quantizationScale = 0.0f;
+ int32_t quantizationOffset = 0;
+
+ if (tensorPtr->quantization.get())
+ {
+ CHECK_VALID_SIZE(tensorPtr->quantization->scale.size(), 0, 1);
+ CHECK_VALID_SIZE(tensorPtr->quantization->zero_point.size(), 0, 1);
+
+ if (tensorPtr->quantization->scale.size() == 1)
+ {
+ quantizationScale = tensorPtr->quantization->scale[0];
+ }
+ if (tensorPtr->quantization->zero_point.size() == 1)
+ {
+            // NOTE: we lose precision here when converting from 64-bit to 32-bit,
+            // but this is all ArmNN supports at the moment
+ quantizationOffset = static_cast<int32_t>(tensorPtr->quantization->zero_point[0]);
+ }
+ }
+
+ auto const & dimensions = AsUnsignedVector(tensorPtr->shape);
+
+ // two statements (on purpose) for easier debugging:
+ armnn::TensorInfo result(static_cast<unsigned int>(tensorPtr->shape.size()),
+ dimensions.data(),
+ type,
+ quantizationScale,
+ quantizationOffset);
+ return result;
+}
+
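+// Note: armnn::ConstTensor does not take ownership of the memory it wraps, so
+// the backing allocation is returned alongside the tensor (as a unique_ptr)
+// and must be kept alive for as long as the tensor is used.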
+template<typename T>
+std::pair<armnn::ConstTensor, std::unique_ptr<T[]>>
+CreateConstTensorImpl(TfLiteParser::BufferRawPtr bufferPtr,
+ TfLiteParser::TensorRawPtr tensorPtr,
+ armnn::TensorInfo & tensorInfo,
+ bool convertFromTfToArmnnFormat)
+{
+ BOOST_ASSERT_MSG(tensorPtr != nullptr, "tensorPtr is null");
+ BOOST_ASSERT_MSG(bufferPtr != nullptr,
+ boost::str(
+ boost::format("Buffer for buffer:%1% is null") % tensorPtr->buffer).c_str());
+
+ std::unique_ptr<T[]> data(new T[tensorInfo.GetNumElements()]);
+
+ if (convertFromTfToArmnnFormat)
+ {
+ tensorInfo = armnnUtils::Permuted(tensorInfo, NHWCToArmNN);
+ armnnUtils::Permute(tensorInfo.GetShape(),
+ NHWCToArmNN,
+ reinterpret_cast<const T *>(bufferPtr->data.data()),
+ data.get());
+ }
+ else
+ {
+ ::memcpy(data.get(), bufferPtr->data.data(), tensorInfo.GetNumBytes());
+ }
+ return std::make_pair(ConstTensor(tensorInfo, data.get()), std::move(data));
+}
+
+IConnectableLayer* SwizzleIn(INetwork& network,
+ IConnectableLayer* layer,
+ unsigned int inputSlotIndex,
+ const TensorInfo & inputInfo)
+{
+ BOOST_ASSERT(layer != nullptr);
+ // Add swizzle layer
+ std::stringstream name;
+ name << "swizzle_for-" << layer->GetName() << ":in" << inputSlotIndex;
+ IConnectableLayer* const swizzleLayer = network.AddPermuteLayer(NHWCToArmNN, name.str().c_str());
+ // Set swizzled output shape
+ const TensorInfo swizzleOutInfo = armnnUtils::Permuted(inputInfo, NHWCToArmNN);
+ swizzleLayer->GetOutputSlot(0).SetTensorInfo(swizzleOutInfo);
+ // Connect the swizzle layer to the actual layer
+ swizzleLayer->GetOutputSlot(0).Connect(layer->GetInputSlot(inputSlotIndex));
+
+ return swizzleLayer;
+}
+
+IConnectableLayer* DeswizzleOut(INetwork& network,
+ IConnectableLayer* layer,
+ unsigned int outputSlotIndex,
+ const TensorInfo & outputInfo)
+{
+ BOOST_ASSERT(layer != nullptr);
+ // Add deswizzle layer
+ std::stringstream name;
+ name << "deswizzle_for-" << layer->GetName() << ":out" << outputSlotIndex;
+ IConnectableLayer* const deswizzleLayer = network.AddPermuteLayer(ArmNNToNHWC, name.str().c_str());
+ // Set deswizzled output shape
+ deswizzleLayer->GetOutputSlot(0).SetTensorInfo(outputInfo);
+ // Set original layer output shape
+ const TensorInfo deswizzleOutInfo = armnnUtils::Permuted(outputInfo, NHWCToArmNN);
+ layer->GetOutputSlot(outputSlotIndex).SetTensorInfo(deswizzleOutInfo);
+ // Connect the actual layer to the deswizzle layer
+ layer->GetOutputSlot(outputSlotIndex).Connect(deswizzleLayer->GetInputSlot(0));
+
+ return deswizzleLayer;
+}
+
+std::pair<IConnectableLayer*, IConnectableLayer*> SwizzleInDeswizzleOut(INetwork& network,
+ IConnectableLayer* layer,
+ unsigned int inputSlotIndex,
+ const TensorInfo & inputInfo,
+ unsigned int outputSlotIndex,
+ const TensorInfo & outputInfo)
+{
+ IConnectableLayer* const swizzleLayer = SwizzleIn(network, layer, inputSlotIndex, inputInfo);
+ IConnectableLayer* const deswizzleLayer = DeswizzleOut(network, layer, outputSlotIndex, outputInfo);
+ return std::make_pair(swizzleLayer, deswizzleLayer);
+}
+
+armnn::LayerBindingId GenerateLayerBindingId(size_t subgraphIndex, size_t tensorIndex)
+{
+    // generate the binding id by shifting the tensor id left by 8 bits
+    // and adding the subgraph id, which allows up to 256 subgraphs
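+    // e.g. (illustrative values) subgraph 0, tensor 5 -> (5 << 8) + 0 = 1280,
+    // while subgraph 1, tensor 5 -> 1281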
+ return static_cast<armnn::LayerBindingId>((tensorIndex<<8)+subgraphIndex);
+}
+
+} // <anonymous>
+
+TfLiteParser::TfLiteParser()
+: m_Network(nullptr, nullptr)
+, m_ParserFunctions(tflite::BuiltinOperator_MAX+1, &TfLiteParser::ParseUnsupportedOperator)
+{
+ // register supported operators
+ m_ParserFunctions[tflite::BuiltinOperator_AVERAGE_POOL_2D] = &TfLiteParser::ParseAveragePool2D;
+ m_ParserFunctions[tflite::BuiltinOperator_CONV_2D] = &TfLiteParser::ParseConv2D;
+ m_ParserFunctions[tflite::BuiltinOperator_DEPTHWISE_CONV_2D] = &TfLiteParser::ParseDepthwiseConv2D;
+ m_ParserFunctions[tflite::BuiltinOperator_SOFTMAX] = &TfLiteParser::ParseSoftmax;
+ m_ParserFunctions[tflite::BuiltinOperator_SQUEEZE] = &TfLiteParser::ParseSqueeze;
+}
+
+void TfLiteParser::ResetParser()
+{
+ m_Network = armnn::INetworkPtr(nullptr, nullptr);
+ m_Model = nullptr;
+ m_SubgraphConnections.clear();
+}
+
+INetworkPtr TfLiteParser::CreateNetworkFromBinaryFile(const char* graphFile)
+{
+ ResetParser();
+ m_Model = LoadModelFromFile(graphFile);
+ return CreateNetworkFromModel();
+}
+
+INetworkPtr TfLiteParser::CreateNetworkFromBinary(const std::vector<uint8_t> & binaryContent)
+{
+ ResetParser();
+ m_Model = LoadModelFromBinary(binaryContent.data(), binaryContent.size());
+ return CreateNetworkFromModel();
+}
+
+INetworkPtr TfLiteParser::CreateNetworkFromModel()
+{
+ m_Network = INetwork::Create();
+ BOOST_ASSERT(m_Model.get() != nullptr);
+
+ bool failedToCreate = false;
+ std::stringstream errors;
+
+ if (m_Model->subgraphs.size() != 1)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("Current TfLite parser only supports 1 subgraph. Current one has: %1% %2%") %
+ m_Model->subgraphs.size() %
+ CHECK_LOCATION().AsString()));
+ }
+
+ size_t subgraphIndex = 0;
+ for (SubGraphPtr const & subgraph : m_Model->subgraphs)
+ {
+ m_SubgraphConnections.emplace_back(subgraph->tensors.size());
+
+ size_t operatorIndex = 0;
+ for (OperatorPtr const & op : subgraph->operators)
+ {
+ try
+ {
+ if (op->custom_options.size() > 0)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("Custom options for op: %1% is not supported. "
+ "It has %2% bytes of custom options. %3%") %
+ op->opcode_index %
+ op->custom_options.size() %
+ CHECK_LOCATION().AsString()));
+ }
+
+ auto const & opCodePtr = m_Model->operator_codes[op->opcode_index];
+ auto builtinCode = opCodePtr->builtin_code;
+
+ if (builtinCode > tflite::BuiltinOperator_MAX)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("Operator code %1% is out of range 0-%2%. "
+ "subgraph:%3% operator idx:%4%. %5%") %
+ builtinCode %
+ tflite::BuiltinOperator_MAX %
+ subgraphIndex %
+ operatorIndex %
+ CHECK_LOCATION().AsString()));
+ }
+
+                // look up and call the parser function
+ auto & parserFunction = m_ParserFunctions[builtinCode];
+ (this->*parserFunction)(subgraphIndex, operatorIndex);
+ }
+ catch (const ParseException& e)
+ {
+ failedToCreate = true;
+ std::stringstream errorString;
+
+ errorString << "Failed to parse operator #" << operatorIndex
+ << " within subgraph #" << subgraphIndex
+ << " error: " << e.what();
+ BOOST_LOG_TRIVIAL(error) << errorString.str();
+
+ errors << errorString.str() << "\n";
+ }
+ ++operatorIndex;
+ }
+
+ SetupInputLayers(subgraphIndex);
+ SetupOutputLayers(subgraphIndex);
+
+ ++subgraphIndex;
+ }
+
+ if (failedToCreate)
+ {
+ // we can skip everything and let the outer exception handler deal with the error
+ throw ParseException(errors.str());
+ }
+
+ // establish the connections from the layer outputs to the inputs of the subsequent layers
+ for (size_t subgraphIndex = 0; subgraphIndex < m_SubgraphConnections.size(); ++subgraphIndex)
+ {
+ for (size_t tensorIndex = 0; tensorIndex < m_SubgraphConnections[subgraphIndex].size(); ++tensorIndex)
+ {
+ if (m_SubgraphConnections[subgraphIndex][tensorIndex].outputSlot != nullptr)
+ {
+ for (size_t inputSlotIdx = 0;
+ inputSlotIdx < m_SubgraphConnections[subgraphIndex][tensorIndex].inputSlots.size();
+ ++inputSlotIdx)
+ {
+ m_SubgraphConnections[subgraphIndex][tensorIndex].outputSlot->Connect(
+ *(m_SubgraphConnections[subgraphIndex][tensorIndex].inputSlots[inputSlotIdx]));
+ }
+ }
+ }
+ }
+
+ return std::move(m_Network);
+}
+
+void TfLiteParser::RegisterProducerOfTensor(size_t subgraphIndex,
+ size_t tensorIndex,
+ armnn::IOutputSlot* slot)
+{
+ CHECK_TENSOR(m_Model, subgraphIndex, tensorIndex);
+ BOOST_ASSERT(m_SubgraphConnections.size() > subgraphIndex);
+ BOOST_ASSERT(m_SubgraphConnections[subgraphIndex].size() > tensorIndex);
+
+ TensorSlots & tensorSlots = m_SubgraphConnections[subgraphIndex][tensorIndex];
+
+ // assuming there is only one producer for that tensor
+ if (tensorSlots.outputSlot != nullptr)
+ {
+ throw ParseException(boost::str(
+ boost::format("Another layer has already registered itself as the producer of "
+ "subgraph:%1% tensor:%2% %3%") %
+ subgraphIndex %
+ tensorIndex %
+ CHECK_LOCATION().AsString()));
+ }
+
+ tensorSlots.outputSlot = slot;
+}
+
+void TfLiteParser::RegisterConsumerOfTensor(size_t subgraphIndex,
+ size_t tensorIndex,
+ armnn::IInputSlot* slot)
+{
+ CHECK_TENSOR(m_Model, subgraphIndex, tensorIndex);
+ BOOST_ASSERT(m_SubgraphConnections.size() > subgraphIndex);
+ BOOST_ASSERT(m_SubgraphConnections[subgraphIndex].size() > tensorIndex);
+
+ TensorSlots & tensorSlots = m_SubgraphConnections[subgraphIndex][tensorIndex];
+ tensorSlots.inputSlots.push_back(slot);
+}
+
+void TfLiteParser::ParseUnsupportedOperator(size_t subgraphIndex, size_t operatorIndex)
+{
+ CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
+ const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
+ auto opcodeIndex = operatorPtr->opcode_index;
+ auto opcode = m_Model->operator_codes[opcodeIndex]->builtin_code;
+
+ throw ParseException(
+ boost::str(
+ boost::format("Operator not supported. "
+ "subgraph:%1% operator:%2% "
+ "opcode_index:%3% opcode:%4% / %5% %6%") %
+ subgraphIndex %
+ operatorIndex %
+ opcodeIndex %
+ opcode %
+ tflite::EnumNameBuiltinOperator(opcode) %
+ CHECK_LOCATION().AsString()));
+}
+
+void TfLiteParser::ParseAveragePool2D(size_t subgraphIndex, size_t operatorIndex)
+{
+ CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
+
+ const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
+ const auto * options = operatorPtr->builtin_options.AsPool2DOptions();
+
+ CHECK_SUPPORTED_FUSED_ACTIVATION(options, subgraphIndex, operatorIndex);
+
+ Pooling2dDescriptor desc;
+
+ desc.m_PoolType = PoolingAlgorithm::Average;
+ desc.m_StrideX = CHECKED_NON_NEGATIVE(options->stride_w);
+ desc.m_StrideY = CHECKED_NON_NEGATIVE(options->stride_h);
+ desc.m_PoolWidth = CHECKED_NON_NEGATIVE(options->filter_width);
+ desc.m_PoolHeight = CHECKED_NON_NEGATIVE(options->filter_height);
+ desc.m_PaddingMethod = PaddingMethod::Exclude;
+ desc.m_OutputShapeRounding = OutputShapeRounding::Floor;
+
+ auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(inputs.size(), 1);
+ armnn::TensorInfo inputTensorInfo = ToTensorInfo(inputs[0]);
+
+ // assuming input is NHWC
+ unsigned int inputHeight = inputTensorInfo.GetShape()[1];
+ unsigned int inputWidth = inputTensorInfo.GetShape()[2];
+
+ CalcPadding(inputHeight, desc.m_PoolHeight, desc.m_StrideY, desc.m_PadTop, desc.m_PadBottom, options->padding);
+ CalcPadding(inputWidth, desc.m_PoolWidth, desc.m_StrideX, desc.m_PadLeft, desc.m_PadRight, options->padding);
+
+ auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(outputs.size(), 1);
+ armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]);
+
+ auto layerName = boost::str(boost::format("AveragePool2D:%1%:%2%") % subgraphIndex % operatorIndex);
+ IConnectableLayer* layer = m_Network->AddPooling2dLayer(desc, layerName.c_str());
+
+ BOOST_ASSERT(layer != nullptr);
+
+ // add permute layers to swizzle the input and deswizzle the output
+ std::pair<IConnectableLayer*, IConnectableLayer*> permuteLayers =
+ SwizzleInDeswizzleOut(*m_Network, layer, 0, inputTensorInfo, 0, outputTensorInfo);
+
+ // register the input connection slots for the layer, connections are made after all layers have been created
+ // only the tensors for the inputs are relevant, exclude the const tensors
+ auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterInputSlots(subgraphIndex, operatorIndex, permuteLayers.first, {inputTensorIndexes[0]});
+
+ // we need to add the activation layer and fortunately we don't need to care about the data layout
+    // because the activation function is element-wise, so it is OK to have the activation after the trailing
+ // swizzle layer
+ layer = AddActivationLayer(permuteLayers.second, 0, options->fused_activation_function);
+ // register the output connection slots for the layer, connections are made after all layers have been created
+ auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
+}
+
+void TfLiteParser::ParseConv2D(size_t subgraphIndex, size_t operatorIndex)
+{
+ CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
+
+ const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
+ const auto * options = operatorPtr->builtin_options.AsConv2DOptions();
+
+ CHECK_SUPPORTED_FUSED_ACTIVATION(options, subgraphIndex, operatorIndex);
+
+ Convolution2dDescriptor desc;
+ desc.m_BiasEnabled = false;
+ desc.m_StrideX = CHECKED_NON_NEGATIVE(options->stride_w);
+ desc.m_StrideY = CHECKED_NON_NEGATIVE(options->stride_h);
+
+ auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(inputs.size(), 2, 3);
+
+ auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(outputs.size(), 1);
+
+ armnn::TensorInfo inputTensorInfo = ToTensorInfo(inputs[0]);
+ armnn::TensorInfo filterTensorInfo = ToTensorInfo(inputs[1]);
+
+ // assuming input is NHWC
+ unsigned int inputHeight = inputTensorInfo.GetShape()[1];
+ unsigned int inputWidth = inputTensorInfo.GetShape()[2];
+
+ // assuming the filter is OHWI : Output, H, W, Input
+ // which is essentially the same as NHWC
+ unsigned int filterHeight = filterTensorInfo.GetShape()[1];
+ unsigned int filterWidth = filterTensorInfo.GetShape()[2];
+
+ CalcPadding(inputHeight, filterHeight, desc.m_StrideY, desc.m_PadTop, desc.m_PadBottom, options->padding);
+ CalcPadding(inputWidth, filterWidth, desc.m_StrideX, desc.m_PadLeft, desc.m_PadRight, options->padding);
+
+ auto filterTensorAndData = CreateConstTensor(inputs[1], filterTensorInfo, true);
+ armnn::IConnectableLayer* layer;
+
+ auto layerName = boost::str(boost::format("Conv2D:%1%:%2%") % subgraphIndex % operatorIndex);
+
+ if (inputs.size() == 3)
+ {
+ desc.m_BiasEnabled = true;
+ armnn::TensorInfo biasTensorInfo = ToTensorInfo(inputs[2]);
+ auto biasTensorAndData = CreateConstTensor(inputs[2], biasTensorInfo, false);
+ layer = m_Network->AddConvolution2dLayer(desc,
+ filterTensorAndData.first,
+ biasTensorAndData.first,
+ layerName.c_str());
+ }
+ else
+ {
+ layer = m_Network->AddConvolution2dLayer(desc,
+ filterTensorAndData.first,
+ layerName.c_str());
+ }
+
+ BOOST_ASSERT(layer != nullptr);
+
+ // add permute layers to swizzle the input and deswizzle the output
+ armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]);
+ std::pair<IConnectableLayer*, IConnectableLayer*> permuteLayers =
+ SwizzleInDeswizzleOut(*m_Network, layer, 0, inputTensorInfo, 0, outputTensorInfo);
+
+ // register the input connection slots for the layer, connections are made after all layers have been created
+ // only the tensors for the inputs are relevant, exclude the const tensors
+ auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterInputSlots(subgraphIndex, operatorIndex, permuteLayers.first, {inputTensorIndexes[0]});
+
+ // we need to add the activation layer and fortunately we don't need to care about the data layout
+    // because the activation function is element-wise, so it is OK to have the activation after the trailing
+ // swizzle layer
+ layer = AddActivationLayer(permuteLayers.second, 0, options->fused_activation_function);
+ // register the output connection slots for the layer, connections are made after all layers have been created
+ auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
+}
+
+void TfLiteParser::ParseDepthwiseConv2D(size_t subgraphIndex, size_t operatorIndex)
+{
+ CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
+
+ const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
+ const auto * options = operatorPtr->builtin_options.AsDepthwiseConv2DOptions();
+
+ CHECK_SUPPORTED_FUSED_ACTIVATION(options, subgraphIndex, operatorIndex);
+
+ DepthwiseConvolution2dDescriptor desc;
+ desc.m_BiasEnabled = false;
+ desc.m_StrideX = CHECKED_NON_NEGATIVE(options->stride_w);
+ desc.m_StrideY = CHECKED_NON_NEGATIVE(options->stride_h);
+    // ACL only supports a depth (channel) multiplier of 1; it is not currently stored in the descriptor
+ CHECK_VALID_SIZE(CHECKED_NON_NEGATIVE(options->depth_multiplier), 1);
+
+ auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(inputs.size(), 2, 3);
+ auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(outputs.size(), 1);
+
+ armnn::TensorInfo inputTensorInfo = ToTensorInfo(inputs[0]);
+ armnn::TensorInfo filterTensorInfo = ToTensorInfo(inputs[1]);
+
+ // assuming input is NHWC
+ unsigned int inputHeight = inputTensorInfo.GetShape()[1];
+ unsigned int inputWidth = inputTensorInfo.GetShape()[2];
+ // assuming the filter is OHWI : Output, H, W, Input
+ unsigned int filterHeight = filterTensorInfo.GetShape()[1];
+ unsigned int filterWidth = filterTensorInfo.GetShape()[2];
+
+ CalcPadding(inputHeight, filterHeight, desc.m_StrideY, desc.m_PadTop, desc.m_PadBottom, options->padding);
+ CalcPadding(inputWidth, filterWidth, desc.m_StrideX, desc.m_PadLeft, desc.m_PadRight, options->padding);
+
+ auto filterTensorAndData = CreateConstTensor(inputs[1], filterTensorInfo, true);
+ armnn::IConnectableLayer* layer;
+ auto layerName = boost::str(boost::format("DepthwiseConv2D:%1%:%2%") % subgraphIndex % operatorIndex);
+
+ if (inputs.size() == 3)
+ {
+ desc.m_BiasEnabled = true;
+ TensorInfo biasTensorInfo = ToTensorInfo(inputs[2]);
+ auto biasTensorAndData = CreateConstTensor(inputs[2], biasTensorInfo, false);
+ layer = m_Network->AddDepthwiseConvolution2dLayer(desc,
+ filterTensorAndData.first,
+ biasTensorAndData.first,
+ layerName.c_str());
+ }
+ else
+ {
+ layer = m_Network->AddDepthwiseConvolution2dLayer(desc,
+ filterTensorAndData.first,
+ layerName.c_str());
+ }
+ BOOST_ASSERT(layer != nullptr);
+
+ // add permute layers to swizzle the input and deswizzle the output
+ armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]);
+ std::pair<IConnectableLayer*, IConnectableLayer*> permuteLayers =
+ SwizzleInDeswizzleOut(*m_Network, layer, 0, inputTensorInfo, 0, outputTensorInfo);
+
+ // register the input connection slots for the layer, connections are made after all layers have been created
+ // only the tensors for the inputs are relevant, exclude the const tensors
+ auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterInputSlots(subgraphIndex, operatorIndex, permuteLayers.first, {inputTensorIndexes[0]});
+
+ // we need to add the activation layer and fortunately we don't need to care about the data layout
+    // because the activation function is element-wise, so it is OK to have the activation after the trailing
+ // swizzle layer
+ layer = AddActivationLayer(permuteLayers.second, 0, options->fused_activation_function);
+ // register the output connection slots for the layer, connections are made after all layers have been created
+ auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
+}
+
+void TfLiteParser::ParseSoftmax(size_t subgraphIndex, size_t operatorIndex)
+{
+ CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
+ const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
+ const auto * options = operatorPtr->builtin_options.AsSoftmaxOptions();
+
+ SoftmaxDescriptor desc;
+ desc.m_Beta = options->beta;
+
+ auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(inputs.size(), 1);
+ auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(outputs.size(), 1);
+
+ auto layerName = boost::str(boost::format("Softmax:%1%:%2%") % subgraphIndex % operatorIndex);
+ IConnectableLayer* const layer = m_Network->AddSoftmaxLayer(desc, layerName.c_str());
+
+ armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]);
+ layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
+
+ // register the input connection slots for the layer, connections are made after all layers have been created
+ // only the tensors for the inputs are relevant, exclude the const tensors
+ auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
+
+ // register the output connection slots for the layer, connections are made after all layers have been created
+ auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
+}
+
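+// computes the output shape of a TfLite SQUEEZE. Example (illustrative
+// shapes): a {1, 2, 1, 3} input with an empty squeeze_dims list has every
+// size-1 dimension removed, yielding {2, 3}; with squeeze_dims = {0} only the
+// leading dimension is removed, giving {2, 1, 3}.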
+armnn::TensorInfo TfLiteParser::OutputShapeOfSqueeze(const std::vector<uint32_t> & squeezeDimsIn,
+ const armnn::TensorInfo & inputTensorInfo)
+{
+ CHECK_VALID_SIZE(squeezeDimsIn.size(), 0, 1, 2, 3, 4);
+ std::vector<uint32_t> squeezeDims = squeezeDimsIn;
+ static const uint32_t dimensionSequence[] = { 0, 1, 2, 3 };
+
+ if (inputTensorInfo.GetNumDimensions() > 4)
+ {
+ std::stringstream ss;
+ ss << "Input tensor has unexpected number of dimensions:" << inputTensorInfo.GetNumDimensions()
+ << " shape:" << inputTensorInfo.GetShape() << " "
+ << CHECK_LOCATION().AsString();
+ throw ParseException(ss.str());
+ }
+
+ if (squeezeDims.empty())
+ {
+ squeezeDims.assign(dimensionSequence,
+ dimensionSequence+inputTensorInfo.GetNumDimensions());
+ }
+
+ std::vector<uint32_t> outputDims;
+ for(unsigned int i = 0; i < inputTensorInfo.GetNumDimensions(); i++)
+ {
+ bool skipSqueeze = (std::find(squeezeDims.begin(), squeezeDims.end(), i) == squeezeDims.end());
+ auto currentDimension = inputTensorInfo.GetShape()[i];
+ if (skipSqueeze || currentDimension != 1)
+ {
+ outputDims.push_back(currentDimension);
+ }
+ }
+
+ if (outputDims.size() > 4)
+ {
+ std::stringstream ss;
+ ss << "Output tensor has unexpected number of dimensions:" << inputTensorInfo.GetNumDimensions()
+ << " shape:" << inputTensorInfo.GetShape() << " "
+ << CHECK_LOCATION().AsString();
+ throw ParseException(ss.str());
+ }
+
+ TensorShape outShape = TensorShape(static_cast<unsigned int>(outputDims.size()),
+ outputDims.data());
+
+ // we need to preserve the tensor type and the quantization data as well
+ TensorInfo outTensorInfo = inputTensorInfo;
+ outTensorInfo.SetShape(outShape);
+
+ return outTensorInfo;
+}
+
+void TfLiteParser::ParseSqueeze(size_t subgraphIndex, size_t operatorIndex)
+{
+ CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
+
+ auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(inputs.size(), 1);
+
+ auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(outputs.size(), 1);
+
+ const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
+ const auto * options = operatorPtr->builtin_options.AsSqueezeOptions();
+
+ armnn::TensorInfo inputTensorInfo = ToTensorInfo(inputs[0]);
+ armnn::TensorInfo outputTensorInfo =
+ TfLiteParser::OutputShapeOfSqueeze(AsUnsignedVector(options->squeeze_dims),
+ inputTensorInfo);
+
+ ReshapeDescriptor reshapeDesc;
+ reshapeDesc.m_TargetShape = outputTensorInfo.GetShape();
+
+ auto layerName = boost::str(boost::format("Squeeze:%1%:%2%") % subgraphIndex % operatorIndex);
+ IConnectableLayer* layer = m_Network->AddReshapeLayer(reshapeDesc, layerName.c_str());
+ layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
+
+ auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
+
+ auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
+}
+
+armnn::IConnectableLayer* TfLiteParser::AddActivationLayer(armnn::IConnectableLayer* prevLayer,
+ unsigned int outputSlot,
+ tflite::ActivationFunctionType activationType)
+{
+ ActivationDescriptor activationDesc;
+ std::string layerName = prevLayer->GetName();
+
+ switch(activationType)
+ {
+ case tflite::ActivationFunctionType_NONE:
+ {
+ // this is a no-op: return previous layer
+ return prevLayer;
+ }
+ case tflite::ActivationFunctionType_RELU:
+ {
+ activationDesc.m_Function = ActivationFunction::ReLu;
+ layerName += ":RELU";
+ break;
+ }
+ case tflite::ActivationFunctionType_RELU6:
+ {
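+            // BoundedReLu computes min(A, max(B, x)); A=6, B=0 gives the RELU6
+            // clamp to [0, 6]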
+ activationDesc.m_Function = ActivationFunction::BoundedReLu;
+ activationDesc.m_A = 6.0f;
+ activationDesc.m_B = 0.0f;
+ layerName += ":RELU6";
+ break;
+ }
+ case tflite::ActivationFunctionType_TANH:
+ {
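+            // ArmNN's TanH computes A * tanh(B * x); A=1, B=1 is plain tanh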
+ activationDesc.m_Function = ActivationFunction::TanH;
+ activationDesc.m_A = 1.0f;
+ activationDesc.m_B = 1.0f;
+ layerName += ":TANH";
+ break;
+ }
+
+        // these are listed here only as a reminder of the other activation
+        // types we could support
+ case tflite::ActivationFunctionType_RELU_N1_TO_1:
+ case tflite::ActivationFunctionType_SIGN_BIT:
+ default:
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("TfLite parser doesn't suppport fused activation: "
+ "%1%/%2% %3% ") %
+ activationType %
+ tflite::EnumNameActivationFunctionType(activationType) %
+ CHECK_LOCATION().AsString()));
+
+ }
+ }
+
+ IConnectableLayer* activationLayer =
+ m_Network->AddActivationLayer(activationDesc, layerName.c_str());
+
+ auto & prevOutputSlot = prevLayer->GetOutputSlot(outputSlot);
+ prevOutputSlot.Connect(activationLayer->GetInputSlot(0));
+ activationLayer->GetOutputSlot(0).SetTensorInfo(prevOutputSlot.GetTensorInfo());
+ return activationLayer;
+}
+
+TfLiteParser::ModelPtr TfLiteParser::LoadModelFromFile(const char * fileName)
+{
+ if (fileName == nullptr)
+ {
+ throw InvalidArgumentException(boost::str(boost::format("Invalid (null) file name %1%") %
+ CHECK_LOCATION().AsString()));
+ }
+ boost::system::error_code errorCode;
+ boost::filesystem::path pathToFile(fileName);
+ if (!boost::filesystem::exists(pathToFile, errorCode))
+ {
+ throw FileNotFoundException(boost::str(boost::format("Cannot find the file (%1%) errorCode: %2% %3%") %
+ fileName %
+ errorCode %
+ CHECK_LOCATION().AsString()));
+ }
+ std::ifstream file(fileName, std::ios::binary);
+ std::string fileContent((std::istreambuf_iterator<char>(file)), std::istreambuf_iterator<char>());
+ return LoadModelFromBinary(reinterpret_cast<const uint8_t *>(fileContent.c_str()),
+ fileContent.size());
+}
+
+TfLiteParser::ModelPtr TfLiteParser::LoadModelFromBinary(const uint8_t * binaryContent, size_t len)
+{
+ if (binaryContent == nullptr)
+ {
+ throw InvalidArgumentException(boost::str(boost::format("Invalid (null) binary content %1%") %
+ CHECK_LOCATION().AsString()));
+ }
+ flatbuffers::Verifier verifier(binaryContent, len);
+ if (verifier.VerifyBuffer<tflite::Model>() == false)
+ {
+ throw ParseException(
+ boost::str(boost::format("Buffer doesn't conform to the expected Tensorflow Lite "
+ "flatbuffers format. size:%1% %2%") %
+ len %
+ CHECK_LOCATION().AsString()));
+ }
+ return tflite::UnPackModel(binaryContent);
+}
+
+TfLiteParser::TensorRawPtrVector TfLiteParser::GetInputs(const ModelPtr & model,
+ size_t subgraphIndex,
+ size_t operatorIndex)
+{
+ CHECK_MODEL(model, subgraphIndex, operatorIndex);
+
+ const auto & subGraphPtr = model->subgraphs[subgraphIndex];
+ const auto & operatorPtr = subGraphPtr->operators[operatorIndex];
+
+ size_t inputCount = operatorPtr->inputs.size();
+ TensorRawPtrVector result(inputCount);
+ for (size_t i=0; i<inputCount; ++i)
+ {
+        uint32_t inputId = CHECKED_NON_NEGATIVE(operatorPtr->inputs[i]);
+        CHECK_TENSOR(model, subgraphIndex, inputId);
+        result[i] = subGraphPtr->tensors[inputId].get();
+ }
+ return result;
+}
+
+TfLiteParser::TensorRawPtrVector TfLiteParser::GetOutputs(const ModelPtr & model,
+ size_t subgraphIndex,
+ size_t operatorIndex)
+{
+ CHECK_MODEL(model, subgraphIndex, operatorIndex);
+
+ const auto & subGraphPtr = model->subgraphs[subgraphIndex];
+ const auto & operatorPtr = subGraphPtr->operators[operatorIndex];
+
+ size_t outputCount = operatorPtr->outputs.size();
+ TensorRawPtrVector result(outputCount);
+ for (size_t i=0; i<outputCount; ++i)
+ {
+ uint32_t outputId = CHECKED_NON_NEGATIVE(operatorPtr->outputs[i]);
+ CHECK_TENSOR(model, subgraphIndex, outputId);
+ result[i] = subGraphPtr->tensors[outputId].get();
+ }
+ return result;
+}
+
+TfLiteParser::TensorIdRawPtrVector TfLiteParser::GetSubgraphInputs(const ModelPtr & model,
+ size_t subgraphIndex)
+{
+ CHECK_SUBGRAPH(model, subgraphIndex);
+ const auto & subGraphPtr = model->subgraphs[subgraphIndex];
+
+ size_t inputCount = subGraphPtr->inputs.size();
+ TensorIdRawPtrVector result(inputCount);
+ for (size_t i=0; i<inputCount; ++i)
+ {
+ uint32_t inputId = CHECKED_NON_NEGATIVE(subGraphPtr->inputs[i]);
+ CHECK_TENSOR(model, subgraphIndex, inputId);
+ result[i] = std::make_pair(inputId, subGraphPtr->tensors[inputId].get());
+ }
+ return result;
+}
+
+TfLiteParser::TensorIdRawPtrVector TfLiteParser::GetSubgraphOutputs(const ModelPtr & model,
+ size_t subgraphIndex)
+{
+ CHECK_SUBGRAPH(model, subgraphIndex);
+ const auto & subGraphPtr = model->subgraphs[subgraphIndex];
+
+ size_t outputCount = subGraphPtr->outputs.size();
+ TensorIdRawPtrVector result(outputCount);
+ for (size_t i=0; i<outputCount; ++i)
+ {
+        uint32_t outputId = CHECKED_NON_NEGATIVE(subGraphPtr->outputs[i]);
+        CHECK_TENSOR(model, subgraphIndex, outputId);
+        result[i] = std::make_pair(outputId, subGraphPtr->tensors[outputId].get());
+ }
+ return result;
+}
+
+std::vector<int32_t>& TfLiteParser::GetInputTensorIds(const ModelPtr& model,
+ size_t subgraphIndex,
+ size_t operatorIndex)
+{
+ CHECK_MODEL(model, subgraphIndex, operatorIndex);
+ const auto & subGraphPtr = model->subgraphs[subgraphIndex];
+ const auto & operatorPtr = subGraphPtr->operators[operatorIndex];
+ return operatorPtr->inputs;
+}
+
+std::vector<int32_t>& TfLiteParser::GetOutputTensorIds(const ModelPtr& model,
+ size_t subgraphIndex,
+ size_t operatorIndex)
+{
+ CHECK_MODEL(model, subgraphIndex, operatorIndex);
+ const auto & subGraphPtr = model->subgraphs[subgraphIndex];
+ const auto & operatorPtr = subGraphPtr->operators[operatorIndex];
+ return operatorPtr->outputs;
+}
+
+void TfLiteParser::RegisterInputSlots(size_t subgraphIndex,
+ size_t operatorIndex,
+ IConnectableLayer* layer,
+ const std::vector<unsigned int>& tensorIndexes)
+{
+ CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
+ BOOST_ASSERT(layer != nullptr);
+ if (tensorIndexes.size() != layer->GetNumInputSlots())
+ {
+ throw ParseException(
+ boost::str(boost::format("The number of tensor inputs (%1%) does not match the number expected (%2%)"
+ " for subgraph:%3% operator index:%4% %5%") %
+ tensorIndexes.size() %
+ layer->GetNumInputSlots() %
+ subgraphIndex %
+ operatorIndex %
+ CHECK_LOCATION().AsString()));
+ }
+
+ for (unsigned int slotIndex = 0; slotIndex < layer->GetNumInputSlots(); ++slotIndex)
+ {
+ unsigned int tensorIndex = tensorIndexes[slotIndex];
+ armnn::IInputSlot* slot = &(layer->GetInputSlot(slotIndex));
+ RegisterConsumerOfTensor(subgraphIndex, tensorIndex, slot);
+ }
+}
+
+void TfLiteParser::RegisterOutputSlots(size_t subgraphIndex,
+ size_t operatorIndex,
+ IConnectableLayer* layer,
+ const std::vector<unsigned int>& tensorIndexes)
+{
+ CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
+ BOOST_ASSERT(layer != nullptr);
+ if (tensorIndexes.size() != layer->GetNumOutputSlots())
+ {
+ throw ParseException(
+ boost::str(boost::format("The number of tensor outputs (%1%) does not match the number expected (%2%)"
+ " for subgraph:%3% operator index:%4% %5%") %
+ tensorIndexes.size() %
+ layer->GetNumOutputSlots() %
+ subgraphIndex %
+ operatorIndex %
+ CHECK_LOCATION().AsString()));
+ }
+
+ for (unsigned int slotIndex = 0; slotIndex < layer->GetNumOutputSlots(); ++slotIndex)
+ {
+ unsigned int tensorIndex = tensorIndexes[slotIndex];
+ armnn::IOutputSlot* slot = &(layer->GetOutputSlot(slotIndex));
+ RegisterProducerOfTensor(subgraphIndex, tensorIndex, slot);
+ }
+}
+
+void TfLiteParser::SetupInputLayers(size_t subgraphIndex)
+{
+ CHECK_SUBGRAPH(m_Model, subgraphIndex);
+
+ auto inputs = GetSubgraphInputs(m_Model, subgraphIndex);
+ for (auto const & tensorIdAndPtr : inputs)
+ {
+ auto bindingId = GenerateLayerBindingId(subgraphIndex, tensorIdAndPtr.first);
+ IConnectableLayer* layer =
+ m_Network->AddInputLayer(bindingId, tensorIdAndPtr.second->name.c_str());
+
+ auto tensorInfo = ToTensorInfo(tensorIdAndPtr.second);
+ layer->GetOutputSlot(0).SetTensorInfo(tensorInfo);
+
+ RegisterOutputSlots(subgraphIndex,
+ VIRTUAL_OPERATOR_ID,
+ layer,
+ { static_cast<uint32_t>(tensorIdAndPtr.first) });
+ }
+}
+
+void TfLiteParser::SetupOutputLayers(size_t subgraphIndex)
+{
+ CHECK_SUBGRAPH(m_Model, subgraphIndex);
+
+ auto outputs = GetSubgraphOutputs(m_Model, subgraphIndex);
+ for (auto const & tensorIdAndPtr : outputs)
+ {
+ auto bindingId = GenerateLayerBindingId(subgraphIndex, tensorIdAndPtr.first);
+ IConnectableLayer* layer =
+ m_Network->AddOutputLayer(bindingId, tensorIdAndPtr.second->name.c_str());
+
+ RegisterInputSlots(subgraphIndex,
+ VIRTUAL_OPERATOR_ID,
+ layer,
+ { static_cast<uint32_t>(tensorIdAndPtr.first) });
+ }
+}
+
+// example usage: BufferRawPtr bufferPtr = GetBuffer(m_Model, inputs[0]->buffer);
+TfLiteParser::BufferRawPtr TfLiteParser::GetBuffer(const ModelPtr& model, size_t bufferIndex)
+{
+ CHECK_BUFFER(model, bufferIndex);
+ return model->buffers[bufferIndex].get();
+}
+
+std::pair<armnn::ConstTensor, TfLiteParser::SupportedDataStorage>
+TfLiteParser::CreateConstTensor(TensorRawPtr tensorPtr,
+ armnn::TensorInfo & tensorInfo,
+ bool convertFromTfToArmnnFormat)
+{
+ CHECK_TENSOR_PTR(tensorPtr);
+ auto bufferPtr = GetBuffer(m_Model, tensorPtr->buffer);
+ CHECK_BUFFER_SIZE(bufferPtr, tensorInfo, tensorPtr->buffer);
+
+ switch (tensorInfo.GetDataType())
+ {
+ case armnn::DataType::Float32:
+ {
+ auto constData = CreateConstTensorImpl<float>(bufferPtr,
+ tensorPtr,
+ tensorInfo,
+ convertFromTfToArmnnFormat);
+ SupportedDataStorage storage(std::move(constData.second));
+ return std::make_pair(constData.first, std::move(storage));
+ }
+ case armnn::DataType::QuantisedAsymm8:
+ {
+ auto constData = CreateConstTensorImpl<uint8_t>(bufferPtr,
+ tensorPtr,
+ tensorInfo,
+ convertFromTfToArmnnFormat);
+ SupportedDataStorage storage(std::move(constData.second));
+ return std::make_pair(constData.first, std::move(storage));
+ }
+ case armnn::DataType::Signed32:
+ {
+ auto constData = CreateConstTensorImpl<int32_t>(bufferPtr,
+ tensorPtr,
+ tensorInfo,
+ convertFromTfToArmnnFormat);
+ SupportedDataStorage storage(std::move(constData.second));
+ return std::make_pair(constData.first, std::move(storage));
+ }
+ default:
+ {
+ std::stringstream errString;
+ errString << "Unexpected datatype when creating const tensor: "
+ << armnn::GetDataTypeName(tensorInfo.GetDataType())
+ << " shape:" << tensorInfo.GetShape()
+ << CHECK_LOCATION().AsString();
+ throw ParseException(errString.str());
+ }
+ }
+}
+
+BindingPointInfo TfLiteParser::GetNetworkInputBindingInfo(size_t subgraphId,
+ const std::string& name) const
+{
+ CHECK_SUBGRAPH(m_Model, subgraphId);
+ auto inputs = GetSubgraphInputs(m_Model, subgraphId);
+ for (auto const & input : inputs)
+ {
+ if (input.second->name == name)
+ {
+ auto bindingId = GenerateLayerBindingId(subgraphId, input.first);
+ return std::make_pair(bindingId, ToTensorInfo(input.second));
+ }
+ }
+
+ std::stringstream bindings;
+ for (auto const & input : inputs)
+ {
+ bindings << "'" << input.second->name << "' ";
+ }
+
+ throw ParseException(
+ boost::str(
+ boost::format("No input binding found for subgraph:%1% and name:%2%. "
+ "Possible inputs are: [%3%] %4%") %
+ subgraphId %
+ name %
+ bindings.str() %
+ CHECK_LOCATION().AsString()));
+}
+
+BindingPointInfo TfLiteParser::GetNetworkOutputBindingInfo(size_t subgraphId,
+ const std::string& name) const
+{
+ CHECK_SUBGRAPH(m_Model, subgraphId);
+ auto outputs = GetSubgraphOutputs(m_Model, subgraphId);
+ for (auto const & output : outputs)
+ {
+ if (output.second->name == name)
+ {
+ auto bindingId = GenerateLayerBindingId(subgraphId, output.first);
+ return std::make_pair(bindingId, ToTensorInfo(output.second));
+ }
+ }
+
+ std::stringstream bindings;
+ for (auto const & output : outputs)
+ {
+ bindings << "'" << output.second->name << "' ";
+ }
+
+ throw ParseException(
+ boost::str(
+ boost::format("No output binding found for subgraph:%1% and name:%2%. "
+ "Possible outputs are: [%3%] %4%") %
+ subgraphId %
+ name %
+ bindings.str() %
+ CHECK_LOCATION().AsString()));
+}
+
+size_t TfLiteParser::GetSubgraphCount() const
+{
+ return m_Model->subgraphs.size();
+}
+
+std::vector<std::string> TfLiteParser::GetSubgraphInputTensorNames(size_t subgraphId) const
+{
+ CHECK_SUBGRAPH(m_Model, subgraphId);
+ auto inputs = GetSubgraphInputs(m_Model, subgraphId);
+ std::vector<std::string> result;
+ result.reserve(inputs.size());
+ for (auto const & input : inputs)
+ {
+ result.push_back(input.second->name);
+ }
+ return result;
+}
+
+std::vector<std::string> TfLiteParser::GetSubgraphOutputTensorNames(size_t subgraphId) const
+{
+ CHECK_SUBGRAPH(m_Model, subgraphId);
+ auto outputs = GetSubgraphOutputs(m_Model, subgraphId);
+ std::vector<std::string> result;
+ result.reserve(outputs.size());
+ for (auto const & output : outputs)
+ {
+ result.push_back(output.second->name);
+ }
+ return result;
+}
+
+ITfLiteParser* ITfLiteParser::CreateRaw()
+{
+ return new TfLiteParser();
+}
+
+ITfLiteParserPtr ITfLiteParser::Create()
+{
+ return ITfLiteParserPtr(CreateRaw(), &ITfLiteParser::Destroy);
+}
+
+void ITfLiteParser::Destroy(ITfLiteParser* parser)
+{
+ delete parser;
+}
+
+TfLiteParser::SupportedDataStorage::SupportedDataStorage(std::unique_ptr<float[]> && data)
+: m_FloatData(std::move(data))
+, m_Uint8Data(nullptr)
+, m_Int32Data(nullptr)
+{
+}
+
+TfLiteParser::SupportedDataStorage::SupportedDataStorage(std::unique_ptr<uint8_t[]> && data)
+: m_FloatData(nullptr)
+, m_Uint8Data(std::move(data))
+, m_Int32Data(nullptr)
+{
+}
+
+TfLiteParser::SupportedDataStorage::SupportedDataStorage(std::unique_ptr<int32_t[]> && data)
+: m_FloatData(nullptr)
+, m_Uint8Data(nullptr)
+, m_Int32Data(std::move(data))
+{
+}
+
+} // armnnTfLiteParser