Diffstat (limited to 'src/armnnTfLiteParser/TfLiteParser.cpp')
-rw-r--r--  src/armnnTfLiteParser/TfLiteParser.cpp  1440
1 file changed, 1440 insertions, 0 deletions
diff --git a/src/armnnTfLiteParser/TfLiteParser.cpp b/src/armnnTfLiteParser/TfLiteParser.cpp
new file mode 100644
index 0000000000..d5c48a10e2
--- /dev/null
+++ b/src/armnnTfLiteParser/TfLiteParser.cpp
@@ -0,0 +1,1440 @@
+//
+// Copyright © 2017 Arm Ltd. All rights reserved.
+// See LICENSE file in the project root for full license information.
+//
+#include "TfLiteParser.hpp"
+
+#include <armnn/ArmNN.hpp>
+#include <armnn/Exceptions.hpp>
+#include <armnn/TypesUtils.hpp>
+#include <boost/filesystem.hpp>
+
+// armnnUtils:
+#include <Permute.hpp>
+#include <VerificationHelpers.hpp>
+
+// The generated code based on the TfLite schema:
+#include <schema_generated.h>
+
+#include <boost/core/ignore_unused.hpp>
+#include <boost/assert.hpp>
+#include <boost/format.hpp>
+#include <boost/log/trivial.hpp>
+
+#include <fstream>
+#include <algorithm>
+#include <limits>
+
+using namespace armnn;
+using armnn::CheckLocation;
+namespace armnnTfLiteParser
+{
+namespace
+{
+const PermutationVector NHWCToArmNN = { 0, 2, 3, 1 };
+const PermutationVector ArmNNToNHWC = { 0, 3, 1, 2 };
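+// Each permutation vector maps source dimension i to destination dimension
+// mapping[i]. As an illustrative example, NHWCToArmNN turns an NHWC shape of
+// {1, 224, 224, 3} into the ArmNN (NCHW) shape {1, 3, 224, 224}.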
+
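+// used when registering slots for the graph-level input and output layers,
+// which have no corresponding operator in the model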
+const uint32_t VIRTUAL_OPERATOR_ID = std::numeric_limits<uint32_t>::max();
+
+void CheckSubgraph(const TfLiteParser::ModelPtr & model,
+ size_t subgraphIndex,
+ const CheckLocation & location)
+{
+ if (model.get() == nullptr)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with invalid (null) model. "
+ "Possible reason is that the model is not yet loaded and Unpack(ed). "
+ "subgraph:%2% at %3%") %
+ location.m_Function %
+ subgraphIndex %
+ location.FileLine()));
+ }
+ else if (subgraphIndex >= model->subgraphs.size())
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with an invalid subgraph index. "
+ "subgraph:%2% at %3%") %
+ location.m_Function %
+ subgraphIndex %
+ location.FileLine()));
+ }
+}
+
+#define CHECK_SUBGRAPH(MODEL, SUBGRAPH_INDEX) \
+ CheckSubgraph(MODEL, SUBGRAPH_INDEX, CHECK_LOCATION())
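+
+// note: each CHECK_* macro captures the call site via CHECK_LOCATION() so that
+// the exceptions raised report the file and line where the check was invoked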
+
+void CheckModel(const TfLiteParser::ModelPtr & model,
+ size_t subgraphIndex,
+ size_t operatorIndex,
+ const CheckLocation & location)
+{
+ if (model.get() == nullptr)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with invalid (null) model. "
+ "Possible reason is that the model is not yet loaded and Unpack(ed). "
+ "subgraph:%2% operator:%3% at %4%") %
+ location.m_Function %
+ subgraphIndex %
+ operatorIndex %
+ location.FileLine()));
+ }
+ else if (subgraphIndex >= model->subgraphs.size())
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with an invalid subgraph index. "
+ "subgraph:%2% operator:%3% at %4%") %
+ location.m_Function %
+ subgraphIndex %
+ operatorIndex %
+ location.FileLine()));
+ }
+ else if (operatorIndex >= model->subgraphs[subgraphIndex]->operators.size() &&
+ operatorIndex != VIRTUAL_OPERATOR_ID)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with an invalid operator index. "
+ "subgraph:%2% operator:%3% at %4%") %
+ location.m_Function %
+ subgraphIndex %
+ operatorIndex %
+ location.FileLine()));
+ }
+}
+
+#define CHECK_MODEL(MODEL, SUBGRAPH_INDEX, OPERATOR_INDEX) \
+ CheckModel(MODEL, SUBGRAPH_INDEX, OPERATOR_INDEX, CHECK_LOCATION())
+
+void CheckTensor(const TfLiteParser::ModelPtr & model,
+ size_t subgraphIndex,
+ size_t tensorIndex,
+ const CheckLocation & location)
+{
+    // the model is not checked here because CHECK_MODEL is assumed to have
+    // run already and verified it; an assert is sufficient
+ BOOST_ASSERT_MSG(model.get() != nullptr, "Expecting a valid model in this function");
+
+    // the subgraph index should likewise already have been checked by
+    // CHECK_MODEL, so only an assert is added here
+ BOOST_ASSERT_MSG(subgraphIndex < model->subgraphs.size(), "Expecting a valid subgraph index");
+
+ // the tensor index is the only one to check here
+ if (tensorIndex >= model->subgraphs[subgraphIndex]->tensors.size())
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with an invalid tensor index. "
+ "subgraph:%2% tensor:%3% at %4%") %
+ location.m_Function %
+ subgraphIndex %
+ tensorIndex %
+ location.FileLine()));
+ }
+}
+
+#define CHECK_TENSOR(MODEL, SUBGRAPH_INDEX, TENSOR_INDEX) \
+ CheckTensor(MODEL, SUBGRAPH_INDEX, TENSOR_INDEX, CHECK_LOCATION())
+
+void CheckTensorPtr(TfLiteParser::TensorRawPtr rawPtr,
+ const CheckLocation & location)
+{
+ if (rawPtr == nullptr)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with a null tensor pointer. "
+ "at %2%") %
+ location.m_Function %
+ location.FileLine()));
+
+ }
+}
+
+#define CHECK_TENSOR_PTR(TENSOR_PTR) \
+ CheckTensorPtr(TENSOR_PTR, CHECK_LOCATION())
+
+void CheckBuffer(const TfLiteParser::ModelPtr & model,
+ size_t bufferIndex,
+ const CheckLocation & location)
+{
+ if (model.get() == nullptr)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with invalid (null) model. "
+ "Possible reason is that the model is not yet loaded and Unpack(ed). "
+ "buffer:%2% at %3%") %
+ location.m_Function %
+ bufferIndex %
+ location.FileLine()));
+ }
+ else if (bufferIndex >= model->buffers.size())
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("%1% was called with an invalid buffer index. "
+ "buffer index:%2% at %3%") %
+ location.m_Function %
+ bufferIndex %
+ location.FileLine()));
+ }
+ else if (model->buffers[bufferIndex].get() == nullptr)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("The buffer #%1% is null. %3%") %
+ bufferIndex %
+ location.AsString()));
+ }
+}
+
+#define CHECK_BUFFER(MODEL, BUFFER_INDEX) \
+ CheckBuffer(MODEL, BUFFER_INDEX, CHECK_LOCATION())
+
+void CheckBufferSize(TfLiteParser::BufferRawPtr bufferPtr,
+ const armnn::TensorInfo & tensorInfo,
+ uint32_t bufferId,
+ const CheckLocation & location)
+{
+ if (bufferPtr == nullptr)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("BufferPtr is null for buffer:%1%. %2%") %
+ bufferId %
+ location.AsString()));
+ }
+    else if (tensorInfo.GetNumElements() > bufferPtr->data.size() ||
+ tensorInfo.GetNumBytes() > bufferPtr->data.size())
+ {
+ std::stringstream ss;
+ ss << "Buffer #" << bufferId << " has " << bufferPtr->data.size() << " bytes. "
+ << "For tensor: " << tensorInfo.GetShape()
+ << " expecting: " << tensorInfo.GetNumBytes() << " bytes and "
+ << tensorInfo.GetNumElements() << " elements. " << location.AsString();
+ throw ParseException(ss.str());
+ }
+}
+
+#define CHECK_BUFFER_SIZE(BUFFER_PTR, TENSOR_INFO, BUFFER_ID) \
+ CheckBufferSize(BUFFER_PTR, TENSOR_INFO, BUFFER_ID, CHECK_LOCATION())
+
+bool IsActivationSupported(tflite::ActivationFunctionType activationType)
+{
+ switch(activationType)
+ {
+ case tflite::ActivationFunctionType_NONE:
+ case tflite::ActivationFunctionType_RELU:
+ case tflite::ActivationFunctionType_RELU6:
+ case tflite::ActivationFunctionType_TANH:
+ {
+ return true;
+ }
+ default:
+ {
+ return false;
+ }
+ }
+}
+
+#define CHECK_SUPPORTED_FUSED_ACTIVATION(OPTION, SUBGRAPH_INDEX, OPERATOR_INDEX) \
+ do { \
+ if (IsActivationSupported(OPTION->fused_activation_function) == false) \
+ { \
+ throw ParseException( \
+ boost::str( \
+ boost::format("TfLite parser doesn't suppport fused activation: " \
+ "%1%/%2% in %3% subgraph:%4% operator:%5% at %6%") % \
+ OPTION->fused_activation_function % \
+ tflite::EnumNameActivationFunctionType(\
+ OPTION->fused_activation_function) % \
+ __func__ % \
+ SUBGRAPH_INDEX % \
+ OPERATOR_INDEX % \
+ CHECK_LOCATION().FileLine())); \
+ } \
+ } while(false)
+
+
+std::vector<unsigned int> AsUnsignedVector(const std::vector<int32_t> & in)
+{
+ std::vector<unsigned int> result;
+ result.reserve(in.size());
+ for (auto & i : in)
+ {
+ result.push_back(CHECKED_NON_NEGATIVE(i));
+ }
+ return result;
+}
+
+void CalcPadding(uint32_t inputSize,
+ uint32_t filterSize,
+ uint32_t stride,
+ uint32_t& paddingFront,
+ uint32_t& paddingBack,
+ tflite::Padding padding)
+{
+ paddingFront = 0;
+ paddingBack = 0;
+ if (padding == tflite::Padding_SAME)
+ {
+ uint32_t outputSize = (inputSize + stride - 1) / stride;
+ uint32_t temp = (outputSize - 1) * stride + filterSize;
+ if (temp > inputSize)
+ {
+ paddingFront = (temp - inputSize) / 2;
+ paddingBack = (temp - inputSize) - paddingFront;
+ }
+ }
+}
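+
+// A quick worked example of the SAME-padding arithmetic above (illustrative
+// values, not from any particular model): inputSize=224, filterSize=3,
+// stride=2 gives outputSize=(224+2-1)/2=112 and temp=(112-1)*2+3=225, so
+// paddingFront=(225-224)/2=0 and paddingBack=1.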
+
+armnn::TensorInfo ToTensorInfo(TfLiteParser::TensorRawPtr tensorPtr)
+{
+ armnn::DataType type;
+ CHECK_TENSOR_PTR(tensorPtr);
+
+ switch (tensorPtr->type)
+ {
+ case tflite::TensorType_UINT8:
+ type = armnn::DataType::QuantisedAsymm8;
+ break;
+ case tflite::TensorType_FLOAT32:
+ type = armnn::DataType::Float32;
+ break;
+ case tflite::TensorType_INT32:
+ type = armnn::DataType::Signed32;
+ break;
+
+ default:
+ {
+ CheckLocation location = CHECK_LOCATION();
+ throw ParseException(
+ boost::str(
+ boost::format("Unsupported data type %1% = %2% for tensor: %3%. %4%") %
+ tensorPtr->type %
+ tflite::EnumNameTensorType(tensorPtr->type) %
+ tensorPtr->name %
+ location.AsString()));
+ }
+ }
+
+ float quantizationScale = 0.0f;
+ int32_t quantizationOffset = 0;
+
+ if (tensorPtr->quantization.get())
+ {
+ CHECK_VALID_SIZE(tensorPtr->quantization->scale.size(), 0, 1);
+ CHECK_VALID_SIZE(tensorPtr->quantization->zero_point.size(), 0, 1);
+
+ if (tensorPtr->quantization->scale.size() == 1)
+ {
+ quantizationScale = tensorPtr->quantization->scale[0];
+ }
+ if (tensorPtr->quantization->zero_point.size() == 1)
+ {
+            // NOTE: we lose precision here when converting from 64-bit to 32-bit,
+            // but this is all ArmNN supports at the moment
+ quantizationOffset = static_cast<int32_t>(tensorPtr->quantization->zero_point[0]);
+ }
+ }
+
+ auto const & dimensions = AsUnsignedVector(tensorPtr->shape);
+
+ // two statements (on purpose) for easier debugging:
+ armnn::TensorInfo result(static_cast<unsigned int>(tensorPtr->shape.size()),
+ dimensions.data(),
+ type,
+ quantizationScale,
+ quantizationOffset);
+ return result;
+}
+
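+// Note: armnn::ConstTensor does not take ownership of the memory it wraps, so
+// the backing allocation is returned alongside the tensor (as a unique_ptr)
+// and must be kept alive for as long as the tensor is used.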
+template<typename T>
+std::pair<armnn::ConstTensor, std::unique_ptr<T[]>>
+CreateConstTensorImpl(TfLiteParser::BufferRawPtr bufferPtr,
+ TfLiteParser::TensorRawPtr tensorPtr,
+ armnn::TensorInfo & tensorInfo,
+ bool convertFromTfToArmnnFormat)
+{
+ BOOST_ASSERT_MSG(tensorPtr != nullptr, "tensorPtr is null");
+ BOOST_ASSERT_MSG(bufferPtr != nullptr,
+ boost::str(
+ boost::format("Buffer for buffer:%1% is null") % tensorPtr->buffer).c_str());
+
+ std::unique_ptr<T[]> data(new T[tensorInfo.GetNumElements()]);
+
+ if (convertFromTfToArmnnFormat)
+ {
+ tensorInfo = armnnUtils::Permuted(tensorInfo, NHWCToArmNN);
+ armnnUtils::Permute(tensorInfo.GetShape(),
+ NHWCToArmNN,
+ reinterpret_cast<const T *>(bufferPtr->data.data()),
+ data.get());
+ }
+ else
+ {
+ ::memcpy(data.get(), bufferPtr->data.data(), tensorInfo.GetNumBytes());
+ }
+ return std::make_pair(ConstTensor(tensorInfo, data.get()), std::move(data));
+}
+
+IConnectableLayer* SwizzleIn(INetwork& network,
+ IConnectableLayer* layer,
+ unsigned int inputSlotIndex,
+ const TensorInfo & inputInfo)
+{
+ BOOST_ASSERT(layer != nullptr);
+ // Add swizzle layer
+ std::stringstream name;
+ name << "swizzle_for-" << layer->GetName() << ":in" << inputSlotIndex;
+ IConnectableLayer* const swizzleLayer = network.AddPermuteLayer(NHWCToArmNN, name.str().c_str());
+ // Set swizzled output shape
+ const TensorInfo swizzleOutInfo = armnnUtils::Permuted(inputInfo, NHWCToArmNN);
+ swizzleLayer->GetOutputSlot(0).SetTensorInfo(swizzleOutInfo);
+ // Connect the swizzle layer to the actual layer
+ swizzleLayer->GetOutputSlot(0).Connect(layer->GetInputSlot(inputSlotIndex));
+
+ return swizzleLayer;
+}
+
+IConnectableLayer* DeswizzleOut(INetwork& network,
+ IConnectableLayer* layer,
+ unsigned int outputSlotIndex,
+ const TensorInfo & outputInfo)
+{
+ BOOST_ASSERT(layer != nullptr);
+ // Add deswizzle layer
+ std::stringstream name;
+ name << "deswizzle_for-" << layer->GetName() << ":out" << outputSlotIndex;
+ IConnectableLayer* const deswizzleLayer = network.AddPermuteLayer(ArmNNToNHWC, name.str().c_str());
+ // Set deswizzled output shape
+ deswizzleLayer->GetOutputSlot(0).SetTensorInfo(outputInfo);
+ // Set original layer output shape
+ const TensorInfo deswizzleOutInfo = armnnUtils::Permuted(outputInfo, NHWCToArmNN);
+ layer->GetOutputSlot(outputSlotIndex).SetTensorInfo(deswizzleOutInfo);
+ // Connect the actual layer to the deswizzle layer
+ layer->GetOutputSlot(outputSlotIndex).Connect(deswizzleLayer->GetInputSlot(0));
+
+ return deswizzleLayer;
+}
+
+std::pair<IConnectableLayer*, IConnectableLayer*> SwizzleInDeswizzleOut(INetwork& network,
+ IConnectableLayer* layer,
+ unsigned int inputSlotIndex,
+ const TensorInfo & inputInfo,
+ unsigned int outputSlotIndex,
+ const TensorInfo & outputInfo)
+{
+ IConnectableLayer* const swizzleLayer = SwizzleIn(network, layer, inputSlotIndex, inputInfo);
+ IConnectableLayer* const deswizzleLayer = DeswizzleOut(network, layer, outputSlotIndex, outputInfo);
+ return std::make_pair(swizzleLayer, deswizzleLayer);
+}
+
+armnn::LayerBindingId GenerateLayerBindingId(size_t subgraphIndex, size_t tensorIndex)
+{
+    // generate the binding id by shifting the tensor id left by 8 bits
+    // and adding the subgraph id, which allows up to 256 subgraphs
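+    // e.g. (illustrative values) subgraph 0, tensor 5 -> (5 << 8) + 0 = 1280,
+    // while subgraph 1, tensor 5 -> 1281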
+ return static_cast<armnn::LayerBindingId>((tensorIndex<<8)+subgraphIndex);
+}
+
+} // <anonymous>
+
+TfLiteParser::TfLiteParser()
+: m_Network(nullptr, nullptr)
+, m_ParserFunctions(tflite::BuiltinOperator_MAX+1, &TfLiteParser::ParseUnsupportedOperator)
+{
+ // register supported operators
+ m_ParserFunctions[tflite::BuiltinOperator_AVERAGE_POOL_2D] = &TfLiteParser::ParseAveragePool2D;
+ m_ParserFunctions[tflite::BuiltinOperator_CONV_2D] = &TfLiteParser::ParseConv2D;
+ m_ParserFunctions[tflite::BuiltinOperator_DEPTHWISE_CONV_2D] = &TfLiteParser::ParseDepthwiseConv2D;
+ m_ParserFunctions[tflite::BuiltinOperator_SOFTMAX] = &TfLiteParser::ParseSoftmax;
+ m_ParserFunctions[tflite::BuiltinOperator_SQUEEZE] = &TfLiteParser::ParseSqueeze;
+}
+
+void TfLiteParser::ResetParser()
+{
+ m_Network = armnn::INetworkPtr(nullptr, nullptr);
+ m_Model = nullptr;
+ m_SubgraphConnections.clear();
+}
+
+INetworkPtr TfLiteParser::CreateNetworkFromBinaryFile(const char* graphFile)
+{
+ ResetParser();
+ m_Model = LoadModelFromFile(graphFile);
+ return CreateNetworkFromModel();
+}
+
+INetworkPtr TfLiteParser::CreateNetworkFromBinary(const std::vector<uint8_t> & binaryContent)
+{
+ ResetParser();
+ m_Model = LoadModelFromBinary(binaryContent.data(), binaryContent.size());
+ return CreateNetworkFromModel();
+}
+
+INetworkPtr TfLiteParser::CreateNetworkFromModel()
+{
+ m_Network = INetwork::Create();
+ BOOST_ASSERT(m_Model.get() != nullptr);
+
+ bool failedToCreate = false;
+ std::stringstream errors;
+
+ if (m_Model->subgraphs.size() != 1)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("Current TfLite parser only supports 1 subgraph. Current one has: %1% %2%") %
+ m_Model->subgraphs.size() %
+ CHECK_LOCATION().AsString()));
+ }
+
+ size_t subgraphIndex = 0;
+ for (SubGraphPtr const & subgraph : m_Model->subgraphs)
+ {
+ m_SubgraphConnections.emplace_back(subgraph->tensors.size());
+
+ size_t operatorIndex = 0;
+ for (OperatorPtr const & op : subgraph->operators)
+ {
+ try
+ {
+ if (op->custom_options.size() > 0)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("Custom options for op: %1% is not supported. "
+ "It has %2% bytes of custom options. %3%") %
+ op->opcode_index %
+ op->custom_options.size() %
+ CHECK_LOCATION().AsString()));
+ }
+
+ auto const & opCodePtr = m_Model->operator_codes[op->opcode_index];
+ auto builtinCode = opCodePtr->builtin_code;
+
+ if (builtinCode > tflite::BuiltinOperator_MAX)
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("Operator code %1% is out of range 0-%2%. "
+ "subgraph:%3% operator idx:%4%. %5%") %
+ builtinCode %
+ tflite::BuiltinOperator_MAX %
+ subgraphIndex %
+ operatorIndex %
+ CHECK_LOCATION().AsString()));
+ }
+
+                // look up and call the parser function
+ auto & parserFunction = m_ParserFunctions[builtinCode];
+ (this->*parserFunction)(subgraphIndex, operatorIndex);
+ }
+ catch (const ParseException& e)
+ {
+ failedToCreate = true;
+ std::stringstream errorString;
+
+ errorString << "Failed to parse operator #" << operatorIndex
+ << " within subgraph #" << subgraphIndex
+ << " error: " << e.what();
+ BOOST_LOG_TRIVIAL(error) << errorString.str();
+
+ errors << errorString.str() << "\n";
+ }
+ ++operatorIndex;
+ }
+
+ SetupInputLayers(subgraphIndex);
+ SetupOutputLayers(subgraphIndex);
+
+ ++subgraphIndex;
+ }
+
+ if (failedToCreate)
+ {
+ // we can skip everything and let the outer exception handler deal with the error
+ throw ParseException(errors.str());
+ }
+
+ // establish the connections from the layer outputs to the inputs of the subsequent layers
+ for (size_t subgraphIndex = 0; subgraphIndex < m_SubgraphConnections.size(); ++subgraphIndex)
+ {
+ for (size_t tensorIndex = 0; tensorIndex < m_SubgraphConnections[subgraphIndex].size(); ++tensorIndex)
+ {
+ if (m_SubgraphConnections[subgraphIndex][tensorIndex].outputSlot != nullptr)
+ {
+ for (size_t inputSlotIdx = 0;
+ inputSlotIdx < m_SubgraphConnections[subgraphIndex][tensorIndex].inputSlots.size();
+ ++inputSlotIdx)
+ {
+ m_SubgraphConnections[subgraphIndex][tensorIndex].outputSlot->Connect(
+ *(m_SubgraphConnections[subgraphIndex][tensorIndex].inputSlots[inputSlotIdx]));
+ }
+ }
+ }
+ }
+
+ return std::move(m_Network);
+}
+
+void TfLiteParser::RegisterProducerOfTensor(size_t subgraphIndex,
+ size_t tensorIndex,
+ armnn::IOutputSlot* slot)
+{
+ CHECK_TENSOR(m_Model, subgraphIndex, tensorIndex);
+ BOOST_ASSERT(m_SubgraphConnections.size() > subgraphIndex);
+ BOOST_ASSERT(m_SubgraphConnections[subgraphIndex].size() > tensorIndex);
+
+ TensorSlots & tensorSlots = m_SubgraphConnections[subgraphIndex][tensorIndex];
+
+ // assuming there is only one producer for that tensor
+ if (tensorSlots.outputSlot != nullptr)
+ {
+ throw ParseException(boost::str(
+ boost::format("Another layer has already registered itself as the producer of "
+ "subgraph:%1% tensor:%2% %3%") %
+ subgraphIndex %
+ tensorIndex %
+ CHECK_LOCATION().AsString()));
+ }
+
+ tensorSlots.outputSlot = slot;
+}
+
+void TfLiteParser::RegisterConsumerOfTensor(size_t subgraphIndex,
+ size_t tensorIndex,
+ armnn::IInputSlot* slot)
+{
+ CHECK_TENSOR(m_Model, subgraphIndex, tensorIndex);
+ BOOST_ASSERT(m_SubgraphConnections.size() > subgraphIndex);
+ BOOST_ASSERT(m_SubgraphConnections[subgraphIndex].size() > tensorIndex);
+
+ TensorSlots & tensorSlots = m_SubgraphConnections[subgraphIndex][tensorIndex];
+ tensorSlots.inputSlots.push_back(slot);
+}
+
+void TfLiteParser::ParseUnsupportedOperator(size_t subgraphIndex, size_t operatorIndex)
+{
+ CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
+ const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
+ auto opcodeIndex = operatorPtr->opcode_index;
+ auto opcode = m_Model->operator_codes[opcodeIndex]->builtin_code;
+
+ throw ParseException(
+ boost::str(
+ boost::format("Operator not supported. "
+ "subgraph:%1% operator:%2% "
+ "opcode_index:%3% opcode:%4% / %5% %6%") %
+ subgraphIndex %
+ operatorIndex %
+ opcodeIndex %
+ opcode %
+ tflite::EnumNameBuiltinOperator(opcode) %
+ CHECK_LOCATION().AsString()));
+}
+
+void TfLiteParser::ParseAveragePool2D(size_t subgraphIndex, size_t operatorIndex)
+{
+ CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
+
+ const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
+ const auto * options = operatorPtr->builtin_options.AsPool2DOptions();
+
+ CHECK_SUPPORTED_FUSED_ACTIVATION(options, subgraphIndex, operatorIndex);
+
+ Pooling2dDescriptor desc;
+
+ desc.m_PoolType = PoolingAlgorithm::Average;
+ desc.m_StrideX = CHECKED_NON_NEGATIVE(options->stride_w);
+ desc.m_StrideY = CHECKED_NON_NEGATIVE(options->stride_h);
+ desc.m_PoolWidth = CHECKED_NON_NEGATIVE(options->filter_width);
+ desc.m_PoolHeight = CHECKED_NON_NEGATIVE(options->filter_height);
+ desc.m_PaddingMethod = PaddingMethod::Exclude;
+ desc.m_OutputShapeRounding = OutputShapeRounding::Floor;
+
+ auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(inputs.size(), 1);
+ armnn::TensorInfo inputTensorInfo = ToTensorInfo(inputs[0]);
+
+ // assuming input is NHWC
+ unsigned int inputHeight = inputTensorInfo.GetShape()[1];
+ unsigned int inputWidth = inputTensorInfo.GetShape()[2];
+
+ CalcPadding(inputHeight, desc.m_PoolHeight, desc.m_StrideY, desc.m_PadTop, desc.m_PadBottom, options->padding);
+ CalcPadding(inputWidth, desc.m_PoolWidth, desc.m_StrideX, desc.m_PadLeft, desc.m_PadRight, options->padding);
+
+ auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(outputs.size(), 1);
+ armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]);
+
+ auto layerName = boost::str(boost::format("AveragePool2D:%1%:%2%") % subgraphIndex % operatorIndex);
+ IConnectableLayer* layer = m_Network->AddPooling2dLayer(desc, layerName.c_str());
+
+ BOOST_ASSERT(layer != nullptr);
+
+ // add permute layers to swizzle the input and deswizzle the output
+ std::pair<IConnectableLayer*, IConnectableLayer*> permuteLayers =
+ SwizzleInDeswizzleOut(*m_Network, layer, 0, inputTensorInfo, 0, outputTensorInfo);
+
+ // register the input connection slots for the layer, connections are made after all layers have been created
+ // only the tensors for the inputs are relevant, exclude the const tensors
+ auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterInputSlots(subgraphIndex, operatorIndex, permuteLayers.first, {inputTensorIndexes[0]});
+
+ // we need to add the activation layer and fortunately we don't need to care about the data layout
+    // because the activation function is element-wise, so it is OK to have the activation after the trailing
+ // swizzle layer
+ layer = AddActivationLayer(permuteLayers.second, 0, options->fused_activation_function);
+ // register the output connection slots for the layer, connections are made after all layers have been created
+ auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
+}
+
+void TfLiteParser::ParseConv2D(size_t subgraphIndex, size_t operatorIndex)
+{
+ CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
+
+ const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
+ const auto * options = operatorPtr->builtin_options.AsConv2DOptions();
+
+ CHECK_SUPPORTED_FUSED_ACTIVATION(options, subgraphIndex, operatorIndex);
+
+ Convolution2dDescriptor desc;
+ desc.m_BiasEnabled = false;
+ desc.m_StrideX = CHECKED_NON_NEGATIVE(options->stride_w);
+ desc.m_StrideY = CHECKED_NON_NEGATIVE(options->stride_h);
+
+ auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(inputs.size(), 2, 3);
+
+ auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(outputs.size(), 1);
+
+ armnn::TensorInfo inputTensorInfo = ToTensorInfo(inputs[0]);
+ armnn::TensorInfo filterTensorInfo = ToTensorInfo(inputs[1]);
+
+ // assuming input is NHWC
+ unsigned int inputHeight = inputTensorInfo.GetShape()[1];
+ unsigned int inputWidth = inputTensorInfo.GetShape()[2];
+
+ // assuming the filter is OHWI : Output, H, W, Input
+ // which is essentially the same as NHWC
+ unsigned int filterHeight = filterTensorInfo.GetShape()[1];
+ unsigned int filterWidth = filterTensorInfo.GetShape()[2];
+
+ CalcPadding(inputHeight, filterHeight, desc.m_StrideY, desc.m_PadTop, desc.m_PadBottom, options->padding);
+ CalcPadding(inputWidth, filterWidth, desc.m_StrideX, desc.m_PadLeft, desc.m_PadRight, options->padding);
+
+ auto filterTensorAndData = CreateConstTensor(inputs[1], filterTensorInfo, true);
+ armnn::IConnectableLayer* layer;
+
+ auto layerName = boost::str(boost::format("Conv2D:%1%:%2%") % subgraphIndex % operatorIndex);
+
+ if (inputs.size() == 3)
+ {
+ desc.m_BiasEnabled = true;
+ armnn::TensorInfo biasTensorInfo = ToTensorInfo(inputs[2]);
+ auto biasTensorAndData = CreateConstTensor(inputs[2], biasTensorInfo, false);
+ layer = m_Network->AddConvolution2dLayer(desc,
+ filterTensorAndData.first,
+ biasTensorAndData.first,
+ layerName.c_str());
+ }
+ else
+ {
+ layer = m_Network->AddConvolution2dLayer(desc,
+ filterTensorAndData.first,
+ layerName.c_str());
+ }
+
+ BOOST_ASSERT(layer != nullptr);
+
+ // add permute layers to swizzle the input and deswizzle the output
+ armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]);
+ std::pair<IConnectableLayer*, IConnectableLayer*> permuteLayers =
+ SwizzleInDeswizzleOut(*m_Network, layer, 0, inputTensorInfo, 0, outputTensorInfo);
+
+ // register the input connection slots for the layer, connections are made after all layers have been created
+ // only the tensors for the inputs are relevant, exclude the const tensors
+ auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterInputSlots(subgraphIndex, operatorIndex, permuteLayers.first, {inputTensorIndexes[0]});
+
+ // we need to add the activation layer and fortunately we don't need to care about the data layout
+    // because the activation function is element-wise, so it is OK to have the activation after the trailing
+ // swizzle layer
+ layer = AddActivationLayer(permuteLayers.second, 0, options->fused_activation_function);
+ // register the output connection slots for the layer, connections are made after all layers have been created
+ auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
+}
+
+void TfLiteParser::ParseDepthwiseConv2D(size_t subgraphIndex, size_t operatorIndex)
+{
+ CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
+
+ const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
+ const auto * options = operatorPtr->builtin_options.AsDepthwiseConv2DOptions();
+
+ CHECK_SUPPORTED_FUSED_ACTIVATION(options, subgraphIndex, operatorIndex);
+
+ DepthwiseConvolution2dDescriptor desc;
+ desc.m_BiasEnabled = false;
+ desc.m_StrideX = CHECKED_NON_NEGATIVE(options->stride_w);
+ desc.m_StrideY = CHECKED_NON_NEGATIVE(options->stride_h);
+    // ACL only supports a depth (channel) multiplier of 1; it is not currently stored in the descriptor
+ CHECK_VALID_SIZE(CHECKED_NON_NEGATIVE(options->depth_multiplier), 1);
+
+ auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(inputs.size(), 2, 3);
+ auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(outputs.size(), 1);
+
+ armnn::TensorInfo inputTensorInfo = ToTensorInfo(inputs[0]);
+ armnn::TensorInfo filterTensorInfo = ToTensorInfo(inputs[1]);
+
+ // assuming input is NHWC
+ unsigned int inputHeight = inputTensorInfo.GetShape()[1];
+ unsigned int inputWidth = inputTensorInfo.GetShape()[2];
+ // assuming the filter is OHWI : Output, H, W, Input
+ unsigned int filterHeight = filterTensorInfo.GetShape()[1];
+ unsigned int filterWidth = filterTensorInfo.GetShape()[2];
+
+ CalcPadding(inputHeight, filterHeight, desc.m_StrideY, desc.m_PadTop, desc.m_PadBottom, options->padding);
+ CalcPadding(inputWidth, filterWidth, desc.m_StrideX, desc.m_PadLeft, desc.m_PadRight, options->padding);
+
+ auto filterTensorAndData = CreateConstTensor(inputs[1], filterTensorInfo, true);
+ armnn::IConnectableLayer* layer;
+ auto layerName = boost::str(boost::format("DepthwiseConv2D:%1%:%2%") % subgraphIndex % operatorIndex);
+
+ if (inputs.size() == 3)
+ {
+ desc.m_BiasEnabled = true;
+ TensorInfo biasTensorInfo = ToTensorInfo(inputs[2]);
+ auto biasTensorAndData = CreateConstTensor(inputs[2], biasTensorInfo, false);
+ layer = m_Network->AddDepthwiseConvolution2dLayer(desc,
+ filterTensorAndData.first,
+ biasTensorAndData.first,
+ layerName.c_str());
+ }
+ else
+ {
+ layer = m_Network->AddDepthwiseConvolution2dLayer(desc,
+ filterTensorAndData.first,
+ layerName.c_str());
+ }
+ BOOST_ASSERT(layer != nullptr);
+
+ // add permute layers to swizzle the input and deswizzle the output
+ armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]);
+ std::pair<IConnectableLayer*, IConnectableLayer*> permuteLayers =
+ SwizzleInDeswizzleOut(*m_Network, layer, 0, inputTensorInfo, 0, outputTensorInfo);
+
+ // register the input connection slots for the layer, connections are made after all layers have been created
+ // only the tensors for the inputs are relevant, exclude the const tensors
+ auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterInputSlots(subgraphIndex, operatorIndex, permuteLayers.first, {inputTensorIndexes[0]});
+
+ // we need to add the activation layer and fortunately we don't need to care about the data layout
+    // because the activation function is element-wise, so it is OK to have the activation after the trailing
+ // swizzle layer
+ layer = AddActivationLayer(permuteLayers.second, 0, options->fused_activation_function);
+ // register the output connection slots for the layer, connections are made after all layers have been created
+ auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
+}
+
+void TfLiteParser::ParseSoftmax(size_t subgraphIndex, size_t operatorIndex)
+{
+ CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
+ const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
+ const auto * options = operatorPtr->builtin_options.AsSoftmaxOptions();
+
+ SoftmaxDescriptor desc;
+ desc.m_Beta = options->beta;
+
+ auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(inputs.size(), 1);
+ auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(outputs.size(), 1);
+
+ auto layerName = boost::str(boost::format("Softmax:%1%:%2%") % subgraphIndex % operatorIndex);
+ IConnectableLayer* const layer = m_Network->AddSoftmaxLayer(desc, layerName.c_str());
+
+ armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]);
+ layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
+
+ // register the input connection slots for the layer, connections are made after all layers have been created
+ // only the tensors for the inputs are relevant, exclude the const tensors
+ auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
+
+ // register the output connection slots for the layer, connections are made after all layers have been created
+ auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
+}
+
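+// computes the output shape of a TfLite SQUEEZE. Example (illustrative
+// shapes): a {1, 2, 1, 3} input with an empty squeeze_dims list has every
+// size-1 dimension removed, yielding {2, 3}; with squeeze_dims = {0} only the
+// leading dimension is removed, giving {2, 1, 3}.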
+armnn::TensorInfo TfLiteParser::OutputShapeOfSqueeze(const std::vector<uint32_t> & squeezeDimsIn,
+ const armnn::TensorInfo & inputTensorInfo)
+{
+ CHECK_VALID_SIZE(squeezeDimsIn.size(), 0, 1, 2, 3, 4);
+ std::vector<uint32_t> squeezeDims = squeezeDimsIn;
+ static const uint32_t dimensionSequence[] = { 0, 1, 2, 3 };
+
+ if (inputTensorInfo.GetNumDimensions() > 4)
+ {
+ std::stringstream ss;
+ ss << "Input tensor has unexpected number of dimensions:" << inputTensorInfo.GetNumDimensions()
+ << " shape:" << inputTensorInfo.GetShape() << " "
+ << CHECK_LOCATION().AsString();
+ throw ParseException(ss.str());
+ }
+
+ if (squeezeDims.empty())
+ {
+ squeezeDims.assign(dimensionSequence,
+ dimensionSequence+inputTensorInfo.GetNumDimensions());
+ }
+
+ std::vector<uint32_t> outputDims;
+ for(unsigned int i = 0; i < inputTensorInfo.GetNumDimensions(); i++)
+ {
+ bool skipSqueeze = (std::find(squeezeDims.begin(), squeezeDims.end(), i) == squeezeDims.end());
+ auto currentDimension = inputTensorInfo.GetShape()[i];
+ if (skipSqueeze || currentDimension != 1)
+ {
+ outputDims.push_back(currentDimension);
+ }
+ }
+
+ if (outputDims.size() > 4)
+ {
+ std::stringstream ss;
+ ss << "Output tensor has unexpected number of dimensions:" << inputTensorInfo.GetNumDimensions()
+ << " shape:" << inputTensorInfo.GetShape() << " "
+ << CHECK_LOCATION().AsString();
+ throw ParseException(ss.str());
+ }
+
+ TensorShape outShape = TensorShape(static_cast<unsigned int>(outputDims.size()),
+ outputDims.data());
+
+ // we need to preserve the tensor type and the quantization data as well
+ TensorInfo outTensorInfo = inputTensorInfo;
+ outTensorInfo.SetShape(outShape);
+
+ return outTensorInfo;
+}
+
+void TfLiteParser::ParseSqueeze(size_t subgraphIndex, size_t operatorIndex)
+{
+ CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
+
+ auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(inputs.size(), 1);
+
+ auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
+ CHECK_VALID_SIZE(outputs.size(), 1);
+
+ const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
+ const auto * options = operatorPtr->builtin_options.AsSqueezeOptions();
+
+ armnn::TensorInfo inputTensorInfo = ToTensorInfo(inputs[0]);
+ armnn::TensorInfo outputTensorInfo =
+ TfLiteParser::OutputShapeOfSqueeze(AsUnsignedVector(options->squeeze_dims),
+ inputTensorInfo);
+
+ ReshapeDescriptor reshapeDesc;
+ reshapeDesc.m_TargetShape = outputTensorInfo.GetShape();
+
+ auto layerName = boost::str(boost::format("Squeeze:%1%:%2%") % subgraphIndex % operatorIndex);
+ IConnectableLayer* layer = m_Network->AddReshapeLayer(reshapeDesc, layerName.c_str());
+ layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
+
+ auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
+
+ auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
+ RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
+}
+
+armnn::IConnectableLayer* TfLiteParser::AddActivationLayer(armnn::IConnectableLayer* prevLayer,
+ unsigned int outputSlot,
+ tflite::ActivationFunctionType activationType)
+{
+ ActivationDescriptor activationDesc;
+ std::string layerName = prevLayer->GetName();
+
+ switch(activationType)
+ {
+ case tflite::ActivationFunctionType_NONE:
+ {
+ // this is a no-op: return previous layer
+ return prevLayer;
+ }
+ case tflite::ActivationFunctionType_RELU:
+ {
+ activationDesc.m_Function = ActivationFunction::ReLu;
+ layerName += ":RELU";
+ break;
+ }
+ case tflite::ActivationFunctionType_RELU6:
+ {
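+            // BoundedReLu computes min(A, max(B, x)); A=6, B=0 gives the RELU6
+            // clamp to [0, 6]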
+ activationDesc.m_Function = ActivationFunction::BoundedReLu;
+ activationDesc.m_A = 6.0f;
+ activationDesc.m_B = 0.0f;
+ layerName += ":RELU6";
+ break;
+ }
+ case tflite::ActivationFunctionType_TANH:
+ {
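+            // ArmNN's TanH computes A * tanh(B * x); A=1, B=1 is plain tanh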
+ activationDesc.m_Function = ActivationFunction::TanH;
+ activationDesc.m_A = 1.0f;
+ activationDesc.m_B = 1.0f;
+ layerName += ":TANH";
+ break;
+ }
+
+        // these are listed here only as a reminder of the other activation
+        // types we could support
+ case tflite::ActivationFunctionType_RELU_N1_TO_1:
+ case tflite::ActivationFunctionType_SIGN_BIT:
+ default:
+ {
+ throw ParseException(
+ boost::str(
+ boost::format("TfLite parser doesn't suppport fused activation: "
+ "%1%/%2% %3% ") %
+ activationType %
+ tflite::EnumNameActivationFunctionType(activationType) %
+ CHECK_LOCATION().AsString()));
+
+ }
+ }
+
+ IConnectableLayer* activationLayer =
+ m_Network->AddActivationLayer(activationDesc, layerName.c_str());
+
+ auto & prevOutputSlot = prevLayer->GetOutputSlot(outputSlot);
+ prevOutputSlot.Connect(activationLayer->GetInputSlot(0));
+ activationLayer->GetOutputSlot(0).SetTensorInfo(prevOutputSlot.GetTensorInfo());
+ return activationLayer;
+}
+
+TfLiteParser::ModelPtr TfLiteParser::LoadModelFromFile(const char * fileName)
+{
+ if (fileName == nullptr)
+ {
+ throw InvalidArgumentException(boost::str(boost::format("Invalid (null) file name %1%") %
+ CHECK_LOCATION().AsString()));
+ }
+ boost::system::error_code errorCode;
+ boost::filesystem::path pathToFile(fileName);
+ if (!boost::filesystem::exists(pathToFile, errorCode))
+ {
+ throw FileNotFoundException(boost::str(boost::format("Cannot find the file (%1%) errorCode: %2% %3%") %
+ fileName %
+ errorCode %
+ CHECK_LOCATION().AsString()));
+ }
+ std::ifstream file(fileName, std::ios::binary);
+ std::string fileContent((std::istreambuf_iterator<char>(file)), std::istreambuf_iterator<char>());
+ return LoadModelFromBinary(reinterpret_cast<const uint8_t *>(fileContent.c_str()),
+ fileContent.size());
+}
+
+TfLiteParser::ModelPtr TfLiteParser::LoadModelFromBinary(const uint8_t * binaryContent, size_t len)
+{
+ if (binaryContent == nullptr)
+ {
+ throw InvalidArgumentException(boost::str(boost::format("Invalid (null) binary content %1%") %
+ CHECK_LOCATION().AsString()));
+ }
+ flatbuffers::Verifier verifier(binaryContent, len);
+ if (verifier.VerifyBuffer<tflite::Model>() == false)
+ {
+ throw ParseException(
+ boost::str(boost::format("Buffer doesn't conform to the expected Tensorflow Lite "
+ "flatbuffers format. size:%1% %2%") %
+ len %
+ CHECK_LOCATION().AsString()));
+ }
+ return tflite::UnPackModel(binaryContent);
+}
+
+TfLiteParser::TensorRawPtrVector TfLiteParser::GetInputs(const ModelPtr & model,
+ size_t subgraphIndex,
+ size_t operatorIndex)
+{
+ CHECK_MODEL(model, subgraphIndex, operatorIndex);
+
+ const auto & subGraphPtr = model->subgraphs[subgraphIndex];
+ const auto & operatorPtr = subGraphPtr->operators[operatorIndex];
+
+ size_t inputCount = operatorPtr->inputs.size();
+ TensorRawPtrVector result(inputCount);
+ for (size_t i=0; i<inputCount; ++i)
+ {
+        uint32_t inputId = CHECKED_NON_NEGATIVE(operatorPtr->inputs[i]);
+        CHECK_TENSOR(model, subgraphIndex, inputId);
+        result[i] = subGraphPtr->tensors[inputId].get();
+ }
+ return result;
+}
+
+TfLiteParser::TensorRawPtrVector TfLiteParser::GetOutputs(const ModelPtr & model,
+ size_t subgraphIndex,
+ size_t operatorIndex)
+{
+ CHECK_MODEL(model, subgraphIndex, operatorIndex);
+
+ const auto & subGraphPtr = model->subgraphs[subgraphIndex];
+ const auto & operatorPtr = subGraphPtr->operators[operatorIndex];
+
+ size_t outputCount = operatorPtr->outputs.size();
+ TensorRawPtrVector result(outputCount);
+ for (size_t i=0; i<outputCount; ++i)
+ {
+ uint32_t outputId = CHECKED_NON_NEGATIVE(operatorPtr->outputs[i]);
+ CHECK_TENSOR(model, subgraphIndex, outputId);
+ result[i] = subGraphPtr->tensors[outputId].get();
+ }
+ return result;
+}
+
+TfLiteParser::TensorIdRawPtrVector TfLiteParser::GetSubgraphInputs(const ModelPtr & model,
+ size_t subgraphIndex)
+{
+ CHECK_SUBGRAPH(model, subgraphIndex);
+ const auto & subGraphPtr = model->subgraphs[subgraphIndex];
+
+ size_t inputCount = subGraphPtr->inputs.size();
+ TensorIdRawPtrVector result(inputCount);
+ for (size_t i=0; i<inputCount; ++i)
+ {
+ uint32_t inputId = CHECKED_NON_NEGATIVE(subGraphPtr->inputs[i]);
+ CHECK_TENSOR(model, subgraphIndex, inputId);
+ result[i] = std::make_pair(inputId, subGraphPtr->tensors[inputId].get());
+ }
+ return result;
+}
+
+TfLiteParser::TensorIdRawPtrVector TfLiteParser::GetSubgraphOutputs(const ModelPtr & model,
+ size_t subgraphIndex)
+{
+ CHECK_SUBGRAPH(model, subgraphIndex);
+ const auto & subGraphPtr = model->subgraphs[subgraphIndex];
+
+ size_t outputCount = subGraphPtr->outputs.size();
+ TensorIdRawPtrVector result(outputCount);
+ for (size_t i=0; i<outputCount; ++i)
+ {
+        uint32_t outputId = CHECKED_NON_NEGATIVE(subGraphPtr->outputs[i]);
+        CHECK_TENSOR(model, subgraphIndex, outputId);
+        result[i] = std::make_pair(outputId, subGraphPtr->tensors[outputId].get());
+ }
+ return result;
+}
+
+std::vector<int32_t>& TfLiteParser::GetInputTensorIds(const ModelPtr& model,
+ size_t subgraphIndex,
+ size_t operatorIndex)
+{
+ CHECK_MODEL(model, subgraphIndex, operatorIndex);
+ const auto & subGraphPtr = model->subgraphs[subgraphIndex];
+ const auto & operatorPtr = subGraphPtr->operators[operatorIndex];
+ return operatorPtr->inputs;
+}
+
+std::vector<int32_t>& TfLiteParser::GetOutputTensorIds(const ModelPtr& model,
+ size_t subgraphIndex,
+ size_t operatorIndex)
+{
+ CHECK_MODEL(model, subgraphIndex, operatorIndex);
+ const auto & subGraphPtr = model->subgraphs[subgraphIndex];
+ const auto & operatorPtr = subGraphPtr->operators[operatorIndex];
+ return operatorPtr->outputs;
+}
+
+void TfLiteParser::RegisterInputSlots(size_t subgraphIndex,
+ size_t operatorIndex,
+ IConnectableLayer* layer,
+ const std::vector<unsigned int>& tensorIndexes)
+{
+ CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
+ BOOST_ASSERT(layer != nullptr);
+ if (tensorIndexes.size() != layer->GetNumInputSlots())
+ {
+ throw ParseException(
+ boost::str(boost::format("The number of tensor inputs (%1%) does not match the number expected (%2%)"
+ " for subgraph:%3% operator index:%4% %5%") %
+ tensorIndexes.size() %
+ layer->GetNumInputSlots() %
+ subgraphIndex %
+ operatorIndex %
+ CHECK_LOCATION().AsString()));
+ }
+
+ for (unsigned int slotIndex = 0; slotIndex < layer->GetNumInputSlots(); ++slotIndex)
+ {
+ unsigned int tensorIndex = tensorIndexes[slotIndex];
+ armnn::IInputSlot* slot = &(layer->GetInputSlot(slotIndex));
+ RegisterConsumerOfTensor(subgraphIndex, tensorIndex, slot);
+ }
+}
+
+void TfLiteParser::RegisterOutputSlots(size_t subgraphIndex,
+ size_t operatorIndex,
+ IConnectableLayer* layer,
+ const std::vector<unsigned int>& tensorIndexes)
+{
+ CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
+ BOOST_ASSERT(layer != nullptr);
+ if (tensorIndexes.size() != layer->GetNumOutputSlots())
+ {
+ throw ParseException(
+ boost::str(boost::format("The number of tensor outputs (%1%) does not match the number expected (%2%)"
+ " for subgraph:%3% operator index:%4% %5%") %
+ tensorIndexes.size() %
+ layer->GetNumOutputSlots() %
+ subgraphIndex %
+ operatorIndex %
+ CHECK_LOCATION().AsString()));
+ }
+
+ for (unsigned int slotIndex = 0; slotIndex < layer->GetNumOutputSlots(); ++slotIndex)
+ {
+ unsigned int tensorIndex = tensorIndexes[slotIndex];
+ armnn::IOutputSlot* slot = &(layer->GetOutputSlot(slotIndex));
+ RegisterProducerOfTensor(subgraphIndex, tensorIndex, slot);
+ }
+}
+
+void TfLiteParser::SetupInputLayers(size_t subgraphIndex)
+{
+ CHECK_SUBGRAPH(m_Model, subgraphIndex);
+
+ auto inputs = GetSubgraphInputs(m_Model, subgraphIndex);
+ for (auto const & tensorIdAndPtr : inputs)
+ {
+ auto bindingId = GenerateLayerBindingId(subgraphIndex, tensorIdAndPtr.first);
+ IConnectableLayer* layer =
+ m_Network->AddInputLayer(bindingId, tensorIdAndPtr.second->name.c_str());
+
+ auto tensorInfo = ToTensorInfo(tensorIdAndPtr.second);
+ layer->GetOutputSlot(0).SetTensorInfo(tensorInfo);
+
+ RegisterOutputSlots(subgraphIndex,
+ VIRTUAL_OPERATOR_ID,
+ layer,
+ { static_cast<uint32_t>(tensorIdAndPtr.first) });
+ }
+}
+
+void TfLiteParser::SetupOutputLayers(size_t subgraphIndex)
+{
+ CHECK_SUBGRAPH(m_Model, subgraphIndex);
+
+ auto outputs = GetSubgraphOutputs(m_Model, subgraphIndex);
+ for (auto const & tensorIdAndPtr : outputs)
+ {
+ auto bindingId = GenerateLayerBindingId(subgraphIndex, tensorIdAndPtr.first);
+ IConnectableLayer* layer =
+ m_Network->AddOutputLayer(bindingId, tensorIdAndPtr.second->name.c_str());
+
+ RegisterInputSlots(subgraphIndex,
+ VIRTUAL_OPERATOR_ID,
+ layer,
+ { static_cast<uint32_t>(tensorIdAndPtr.first) });
+ }
+}
+
+// example usage: BufferRawPtr bufferPtr = GetBuffer(m_Model, inputs[0]->buffer);
+TfLiteParser::BufferRawPtr TfLiteParser::GetBuffer(const ModelPtr& model, size_t bufferIndex)
+{
+ CHECK_BUFFER(model, bufferIndex);
+ return model->buffers[bufferIndex].get();
+}
+
+std::pair<armnn::ConstTensor, TfLiteParser::SupportedDataStorage>
+TfLiteParser::CreateConstTensor(TensorRawPtr tensorPtr,
+ armnn::TensorInfo & tensorInfo,
+ bool convertFromTfToArmnnFormat)
+{
+ CHECK_TENSOR_PTR(tensorPtr);
+ auto bufferPtr = GetBuffer(m_Model, tensorPtr->buffer);
+ CHECK_BUFFER_SIZE(bufferPtr, tensorInfo, tensorPtr->buffer);
+
+ switch (tensorInfo.GetDataType())
+ {
+ case armnn::DataType::Float32:
+ {
+ auto constData = CreateConstTensorImpl<float>(bufferPtr,
+ tensorPtr,
+ tensorInfo,
+ convertFromTfToArmnnFormat);
+ SupportedDataStorage storage(std::move(constData.second));
+ return std::make_pair(constData.first, std::move(storage));
+ }
+ case armnn::DataType::QuantisedAsymm8:
+ {
+ auto constData = CreateConstTensorImpl<uint8_t>(bufferPtr,
+ tensorPtr,
+ tensorInfo,
+ convertFromTfToArmnnFormat);
+ SupportedDataStorage storage(std::move(constData.second));
+ return std::make_pair(constData.first, std::move(storage));
+ }
+ case armnn::DataType::Signed32:
+ {
+ auto constData = CreateConstTensorImpl<int32_t>(bufferPtr,
+ tensorPtr,
+ tensorInfo,
+ convertFromTfToArmnnFormat);
+ SupportedDataStorage storage(std::move(constData.second));
+ return std::make_pair(constData.first, std::move(storage));
+ }
+ default:
+ {
+ std::stringstream errString;
+ errString << "Unexpected datatype when creating const tensor: "
+ << armnn::GetDataTypeName(tensorInfo.GetDataType())
+ << " shape:" << tensorInfo.GetShape()
+ << CHECK_LOCATION().AsString();
+ throw ParseException(errString.str());
+ }
+ }
+}
+
+BindingPointInfo TfLiteParser::GetNetworkInputBindingInfo(size_t subgraphId,
+ const std::string& name) const
+{
+ CHECK_SUBGRAPH(m_Model, subgraphId);
+ auto inputs = GetSubgraphInputs(m_Model, subgraphId);
+ for (auto const & input : inputs)
+ {
+ if (input.second->name == name)
+ {
+ auto bindingId = GenerateLayerBindingId(subgraphId, input.first);
+ return std::make_pair(bindingId, ToTensorInfo(input.second));
+ }
+ }
+
+ std::stringstream bindings;
+ for (auto const & input : inputs)
+ {
+ bindings << "'" << input.second->name << "' ";
+ }
+
+ throw ParseException(
+ boost::str(
+ boost::format("No input binding found for subgraph:%1% and name:%2%. "
+ "Possible inputs are: [%3%] %4%") %
+ subgraphId %
+ name %
+ bindings.str() %
+ CHECK_LOCATION().AsString()));
+}
+
+BindingPointInfo TfLiteParser::GetNetworkOutputBindingInfo(size_t subgraphId,
+ const std::string& name) const
+{
+ CHECK_SUBGRAPH(m_Model, subgraphId);
+ auto outputs = GetSubgraphOutputs(m_Model, subgraphId);
+ for (auto const & output : outputs)
+ {
+ if (output.second->name == name)
+ {
+ auto bindingId = GenerateLayerBindingId(subgraphId, output.first);
+ return std::make_pair(bindingId, ToTensorInfo(output.second));
+ }
+ }
+
+ std::stringstream bindings;
+ for (auto const & output : outputs)
+ {
+ bindings << "'" << output.second->name << "' ";
+ }
+
+ throw ParseException(
+ boost::str(
+ boost::format("No output binding found for subgraph:%1% and name:%2%. "
+ "Possible outputs are: [%3%] %4%") %
+ subgraphId %
+ name %
+ bindings.str() %
+ CHECK_LOCATION().AsString()));
+}
+
+size_t TfLiteParser::GetSubgraphCount() const
+{
+ return m_Model->subgraphs.size();
+}
+
+std::vector<std::string> TfLiteParser::GetSubgraphInputTensorNames(size_t subgraphId) const
+{
+ CHECK_SUBGRAPH(m_Model, subgraphId);
+ auto inputs = GetSubgraphInputs(m_Model, subgraphId);
+ std::vector<std::string> result;
+ result.reserve(inputs.size());
+ for (auto const & input : inputs)
+ {
+ result.push_back(input.second->name);
+ }
+ return result;
+}
+
+std::vector<std::string> TfLiteParser::GetSubgraphOutputTensorNames(size_t subgraphId) const
+{
+ CHECK_SUBGRAPH(m_Model, subgraphId);
+ auto outputs = GetSubgraphOutputs(m_Model, subgraphId);
+ std::vector<std::string> result;
+ result.reserve(outputs.size());
+ for (auto const & output : outputs)
+ {
+ result.push_back(output.second->name);
+ }
+ return result;
+}
+
+ITfLiteParser* ITfLiteParser::CreateRaw()
+{
+ return new TfLiteParser();
+}
+
+ITfLiteParserPtr ITfLiteParser::Create()
+{
+ return ITfLiteParserPtr(CreateRaw(), &ITfLiteParser::Destroy);
+}
+
+void ITfLiteParser::Destroy(ITfLiteParser* parser)
+{
+ delete parser;
+}
+
+TfLiteParser::SupportedDataStorage::SupportedDataStorage(std::unique_ptr<float[]> && data)
+: m_FloatData(std::move(data))
+, m_Uint8Data(nullptr)
+, m_Int32Data(nullptr)
+{
+}
+
+TfLiteParser::SupportedDataStorage::SupportedDataStorage(std::unique_ptr<uint8_t[]> && data)
+: m_FloatData(nullptr)
+, m_Uint8Data(std::move(data))
+, m_Int32Data(nullptr)
+{
+}
+
+TfLiteParser::SupportedDataStorage::SupportedDataStorage(std::unique_ptr<int32_t[]> && data)
+: m_FloatData(nullptr)
+, m_Uint8Data(nullptr)
+, m_Int32Data(std::move(data))
+{
+}
+
+} // armnnTfLiteParser