diff options
author | telsoa01 <telmo.soares@arm.com> | 2018-08-31 09:22:23 +0100 |
---|---|---|
committer | telsoa01 <telmo.soares@arm.com> | 2018-08-31 09:22:23 +0100 |
commit | c577f2c6a3b4ddb6ba87a882723c53a248afbeba (patch) | |
tree | bd7d4c148df27f8be6649d313efb24f536b7cf34 /src/armnnTfLiteParser/TfLiteParser.cpp | |
parent | 4c7098bfeab1ffe1cdc77f6c15548d3e73274746 (diff) | |
download | armnn-c577f2c6a3b4ddb6ba87a882723c53a248afbeba.tar.gz |
Release 18.08
Diffstat (limited to 'src/armnnTfLiteParser/TfLiteParser.cpp')
-rw-r--r-- | src/armnnTfLiteParser/TfLiteParser.cpp | 1440 |
1 files changed, 1440 insertions, 0 deletions
diff --git a/src/armnnTfLiteParser/TfLiteParser.cpp b/src/armnnTfLiteParser/TfLiteParser.cpp new file mode 100644 index 0000000000..d5c48a10e2 --- /dev/null +++ b/src/armnnTfLiteParser/TfLiteParser.cpp @@ -0,0 +1,1440 @@ +// +// Copyright © 2017 Arm Ltd. All rights reserved. +// See LICENSE file in the project root for full license information. +// +#include "TfLiteParser.hpp" + +#include <armnn/ArmNN.hpp> +#include <armnn/Exceptions.hpp> +#include <armnn/TypesUtils.hpp> +#include <boost/filesystem.hpp> + +// armnnUtils: +#include <Permute.hpp> +#include <VerificationHelpers.hpp> + +// The generated code based on the Tf Lite schema: +#include <schema_generated.h> + +#include <boost/core/ignore_unused.hpp> +#include <boost/assert.hpp> +#include <boost/format.hpp> +#include <boost/log/trivial.hpp> + +#include <fstream> +#include <algorithm> +#include <limits> + +using namespace armnn; +using armnn::CheckLocation; +namespace armnnTfLiteParser +{ +namespace +{ +const PermutationVector NHWCToArmNN = { 0, 2, 3, 1 }; +const PermutationVector ArmNNToNHWC = { 0, 3, 1, 2 }; + +const uint32_t VIRTUAL_OPERATOR_ID = std::numeric_limits<uint32_t>::max(); + +void CheckSubgraph(const TfLiteParser::ModelPtr & model, + size_t subgraphIndex, + const CheckLocation & location) +{ + if (model.get() == nullptr) + { + throw ParseException( + boost::str( + boost::format("%1% was called with invalid (null) model. " + "Possible reason is that the model is not yet loaded and Unpack(ed). " + "subgraph:%2% at %3%") % + location.m_Function % + subgraphIndex % + location.FileLine())); + } + else if (subgraphIndex >= model->subgraphs.size()) + { + throw ParseException( + boost::str( + boost::format("%1% was called with an invalid subgraph index. " + "subgraph:%2% at %3%") % + location.m_Function % + subgraphIndex % + location.FileLine())); + } +} + +#define CHECK_SUBGRAPH(MODEL, SUBGRAPH_INDEX) \ + CheckSubgraph(MODEL, SUBGRAPH_INDEX, CHECK_LOCATION()) + +void CheckModel(const TfLiteParser::ModelPtr & model, + size_t subgraphIndex, + size_t operatorIndex, + const CheckLocation & location) +{ + if (model.get() == nullptr) + { + throw ParseException( + boost::str( + boost::format("%1% was called with invalid (null) model. " + "Possible reason is that the model is not yet loaded and Unpack(ed). " + "subgraph:%2% operator:%3% at %4%") % + location.m_Function % + subgraphIndex % + operatorIndex % + location.FileLine())); + } + else if (subgraphIndex >= model->subgraphs.size()) + { + throw ParseException( + boost::str( + boost::format("%1% was called with an invalid subgraph index. " + "subgraph:%2% operator:%3% at %4%") % + location.m_Function % + subgraphIndex % + operatorIndex % + location.FileLine())); + } + else if (operatorIndex >= model->subgraphs[subgraphIndex]->operators.size() && + operatorIndex != VIRTUAL_OPERATOR_ID) + { + throw ParseException( + boost::str( + boost::format("%1% was called with an invalid operator index. " + "subgraph:%2% operator:%3% at %4%") % + location.m_Function % + subgraphIndex % + operatorIndex % + location.FileLine())); + } +} + +#define CHECK_MODEL(MODEL, SUBGRAPH_INDEX, OPERATOR_INDEX) \ + CheckModel(MODEL, SUBGRAPH_INDEX, OPERATOR_INDEX, CHECK_LOCATION()) + +void CheckTensor(const TfLiteParser::ModelPtr & model, + size_t subgraphIndex, + size_t tensorIndex, + const CheckLocation & location) +{ + // not checking model, because I assume CHECK_MODEL already run + // and checked that. An assert would do. + BOOST_ASSERT_MSG(model.get() != nullptr, "Expecting a valid model in this function"); + + // also subgraph index should be checked by CHECK_MODEL so + // I only add an assert here + BOOST_ASSERT_MSG(subgraphIndex < model->subgraphs.size(), "Expecting a valid subgraph index"); + + // the tensor index is the only one to check here + if (tensorIndex >= model->subgraphs[subgraphIndex]->tensors.size()) + { + throw ParseException( + boost::str( + boost::format("%1% was called with an invalid tensor index. " + "subgraph:%2% tensor:%3% at %4%") % + location.m_Function % + subgraphIndex % + tensorIndex % + location.FileLine())); + } +} + +#define CHECK_TENSOR(MODEL, SUBGRAPH_INDEX, TENSOR_INDEX) \ + CheckTensor(MODEL, SUBGRAPH_INDEX, TENSOR_INDEX, CHECK_LOCATION()) + +void CheckTensorPtr(TfLiteParser::TensorRawPtr rawPtr, + const CheckLocation & location) +{ + if (rawPtr == nullptr) + { + throw ParseException( + boost::str( + boost::format("%1% was called with a null tensor pointer. " + "at %2%") % + location.m_Function % + location.FileLine())); + + } +} + +#define CHECK_TENSOR_PTR(TENSOR_PTR) \ + CheckTensorPtr(TENSOR_PTR, CHECK_LOCATION()) + +void CheckBuffer(const TfLiteParser::ModelPtr & model, + size_t bufferIndex, + const CheckLocation & location) +{ + if (model.get() == nullptr) + { + throw ParseException( + boost::str( + boost::format("%1% was called with invalid (null) model. " + "Possible reason is that the model is not yet loaded and Unpack(ed). " + "buffer:%2% at %3%") % + location.m_Function % + bufferIndex % + location.FileLine())); + } + else if (bufferIndex >= model->buffers.size()) + { + throw ParseException( + boost::str( + boost::format("%1% was called with an invalid buffer index. " + "buffer index:%2% at %3%") % + location.m_Function % + bufferIndex % + location.FileLine())); + } + else if (model->buffers[bufferIndex].get() == nullptr) + { + throw ParseException( + boost::str( + boost::format("The buffer #%1% is null. %3%") % + bufferIndex % + location.AsString())); + } +} + +#define CHECK_BUFFER(MODEL, BUFFER_INDEX) \ + CheckBuffer(MODEL, BUFFER_INDEX, CHECK_LOCATION()) + +void CheckBufferSize(TfLiteParser::BufferRawPtr bufferPtr, + const armnn::TensorInfo & tensorInfo, + uint32_t bufferId, + const CheckLocation & location) +{ + if (bufferPtr == nullptr) + { + throw ParseException( + boost::str( + boost::format("BufferPtr is null for buffer:%1%. %2%") % + bufferId % + location.AsString())); + } + else if(tensorInfo.GetNumElements() > bufferPtr->data.size() || + tensorInfo.GetNumBytes() > bufferPtr->data.size()) + { + std::stringstream ss; + ss << "Buffer #" << bufferId << " has " << bufferPtr->data.size() << " bytes. " + << "For tensor: " << tensorInfo.GetShape() + << " expecting: " << tensorInfo.GetNumBytes() << " bytes and " + << tensorInfo.GetNumElements() << " elements. " << location.AsString(); + throw ParseException(ss.str()); + } +} + +#define CHECK_BUFFER_SIZE(BUFFER_PTR, TENSOR_INFO, BUFFER_ID) \ + CheckBufferSize(BUFFER_PTR, TENSOR_INFO, BUFFER_ID, CHECK_LOCATION()) + +bool IsActivationSupported(tflite::ActivationFunctionType activationType) +{ + switch(activationType) + { + case tflite::ActivationFunctionType_NONE: + case tflite::ActivationFunctionType_RELU: + case tflite::ActivationFunctionType_RELU6: + case tflite::ActivationFunctionType_TANH: + { + return true; + } + default: + { + return false; + } + } +} + +#define CHECK_SUPPORTED_FUSED_ACTIVATION(OPTION, SUBGRAPH_INDEX, OPERATOR_INDEX) \ + do { \ + if (IsActivationSupported(OPTION->fused_activation_function) == false) \ + { \ + throw ParseException( \ + boost::str( \ + boost::format("TfLite parser doesn't suppport fused activation: " \ + "%1%/%2% in %3% subgraph:%4% operator:%5% at %6%") % \ + OPTION->fused_activation_function % \ + tflite::EnumNameActivationFunctionType(\ + OPTION->fused_activation_function) % \ + __func__ % \ + SUBGRAPH_INDEX % \ + OPERATOR_INDEX % \ + CHECK_LOCATION().FileLine())); \ + } \ + } while(false) + + +std::vector<unsigned int> AsUnsignedVector(const std::vector<int32_t> & in) +{ + std::vector<unsigned int> result; + result.reserve(in.size()); + for (auto & i : in) + { + result.push_back(CHECKED_NON_NEGATIVE(i)); + } + return result; +} + +void CalcPadding(uint32_t inputSize, + uint32_t filterSize, + uint32_t stride, + uint32_t& paddingFront, + uint32_t& paddingBack, + tflite::Padding padding) +{ + paddingFront = 0; + paddingBack = 0; + if (padding == tflite::Padding_SAME) + { + uint32_t outputSize = (inputSize + stride - 1) / stride; + uint32_t temp = (outputSize - 1) * stride + filterSize; + if (temp > inputSize) + { + paddingFront = (temp - inputSize) / 2; + paddingBack = (temp - inputSize) - paddingFront; + } + } +} + +armnn::TensorInfo ToTensorInfo(TfLiteParser::TensorRawPtr tensorPtr) +{ + armnn::DataType type; + CHECK_TENSOR_PTR(tensorPtr); + + switch (tensorPtr->type) + { + case tflite::TensorType_UINT8: + type = armnn::DataType::QuantisedAsymm8; + break; + case tflite::TensorType_FLOAT32: + type = armnn::DataType::Float32; + break; + case tflite::TensorType_INT32: + type = armnn::DataType::Signed32; + break; + + default: + { + CheckLocation location = CHECK_LOCATION(); + throw ParseException( + boost::str( + boost::format("Unsupported data type %1% = %2% for tensor: %3%. %4%") % + tensorPtr->type % + tflite::EnumNameTensorType(tensorPtr->type) % + tensorPtr->name % + location.AsString())); + } + } + + float quantizationScale = 0.0f; + int32_t quantizationOffset = 0; + + if (tensorPtr->quantization.get()) + { + CHECK_VALID_SIZE(tensorPtr->quantization->scale.size(), 0, 1); + CHECK_VALID_SIZE(tensorPtr->quantization->zero_point.size(), 0, 1); + + if (tensorPtr->quantization->scale.size() == 1) + { + quantizationScale = tensorPtr->quantization->scale[0]; + } + if (tensorPtr->quantization->zero_point.size() == 1) + { + // NOTE: we lose precision here when converting from 64 bit to 32 + // but this is what we support at the monent in ArmNN + quantizationOffset = static_cast<int32_t>(tensorPtr->quantization->zero_point[0]); + } + } + + auto const & dimensions = AsUnsignedVector(tensorPtr->shape); + + // two statements (on purpose) for easier debugging: + armnn::TensorInfo result(static_cast<unsigned int>(tensorPtr->shape.size()), + dimensions.data(), + type, + quantizationScale, + quantizationOffset); + return result; +} + +template<typename T> +std::pair<armnn::ConstTensor, std::unique_ptr<T[]>> +CreateConstTensorImpl(TfLiteParser::BufferRawPtr bufferPtr, + TfLiteParser::TensorRawPtr tensorPtr, + armnn::TensorInfo & tensorInfo, + bool convertFromTfToArmnnFormat) +{ + BOOST_ASSERT_MSG(tensorPtr != nullptr, "tensorPtr is null"); + BOOST_ASSERT_MSG(bufferPtr != nullptr, + boost::str( + boost::format("Buffer for buffer:%1% is null") % tensorPtr->buffer).c_str()); + + std::unique_ptr<T[]> data(new T[tensorInfo.GetNumElements()]); + + if (convertFromTfToArmnnFormat) + { + tensorInfo = armnnUtils::Permuted(tensorInfo, NHWCToArmNN); + armnnUtils::Permute(tensorInfo.GetShape(), + NHWCToArmNN, + reinterpret_cast<const T *>(bufferPtr->data.data()), + data.get()); + } + else + { + ::memcpy(data.get(), bufferPtr->data.data(), tensorInfo.GetNumBytes()); + } + return std::make_pair(ConstTensor(tensorInfo, data.get()), std::move(data)); +} + +IConnectableLayer* SwizzleIn(INetwork& network, + IConnectableLayer* layer, + unsigned int inputSlotIndex, + const TensorInfo & inputInfo) +{ + BOOST_ASSERT(layer != nullptr); + // Add swizzle layer + std::stringstream name; + name << "swizzle_for-" << layer->GetName() << ":in" << inputSlotIndex; + IConnectableLayer* const swizzleLayer = network.AddPermuteLayer(NHWCToArmNN, name.str().c_str()); + // Set swizzled output shape + const TensorInfo swizzleOutInfo = armnnUtils::Permuted(inputInfo, NHWCToArmNN); + swizzleLayer->GetOutputSlot(0).SetTensorInfo(swizzleOutInfo); + // Connect the swizzle layer to the actual layer + swizzleLayer->GetOutputSlot(0).Connect(layer->GetInputSlot(inputSlotIndex)); + + return swizzleLayer; +} + +IConnectableLayer* DeswizzleOut(INetwork& network, + IConnectableLayer* layer, + unsigned int outputSlotIndex, + const TensorInfo & outputInfo) +{ + BOOST_ASSERT(layer != nullptr); + // Add deswizzle layer + std::stringstream name; + name << "deswizzle_for-" << layer->GetName() << ":out" << outputSlotIndex; + IConnectableLayer* const deswizzleLayer = network.AddPermuteLayer(ArmNNToNHWC, name.str().c_str()); + // Set deswizzled output shape + deswizzleLayer->GetOutputSlot(0).SetTensorInfo(outputInfo); + // Set original layer output shape + const TensorInfo deswizzleOutInfo = armnnUtils::Permuted(outputInfo, NHWCToArmNN); + layer->GetOutputSlot(outputSlotIndex).SetTensorInfo(deswizzleOutInfo); + // Connect the actual layer to the deswizzle layer + layer->GetOutputSlot(outputSlotIndex).Connect(deswizzleLayer->GetInputSlot(0)); + + return deswizzleLayer; +} + +std::pair<IConnectableLayer*, IConnectableLayer*> SwizzleInDeswizzleOut(INetwork& network, + IConnectableLayer* layer, + unsigned int inputSlotIndex, + const TensorInfo & inputInfo, + unsigned int outputSlotIndex, + const TensorInfo & outputInfo) +{ + IConnectableLayer* const swizzleLayer = SwizzleIn(network, layer, inputSlotIndex, inputInfo); + IConnectableLayer* const deswizzleLayer = DeswizzleOut(network, layer, outputSlotIndex, outputInfo); + return std::make_pair(swizzleLayer, deswizzleLayer); +} + +armnn::LayerBindingId GenerateLayerBindingId(size_t subgraphIndex, size_t tensorIndex) +{ + // generate the binding id by shifting the tensor id by 8 bit + // and add the subgraph id, which allows 256 subgraphs + return static_cast<armnn::LayerBindingId>((tensorIndex<<8)+subgraphIndex); +} + +} // <anonymous> + +TfLiteParser::TfLiteParser() +: m_Network(nullptr, nullptr) +, m_ParserFunctions(tflite::BuiltinOperator_MAX+1, &TfLiteParser::ParseUnsupportedOperator) +{ + // register supported operators + m_ParserFunctions[tflite::BuiltinOperator_AVERAGE_POOL_2D] = &TfLiteParser::ParseAveragePool2D; + m_ParserFunctions[tflite::BuiltinOperator_CONV_2D] = &TfLiteParser::ParseConv2D; + m_ParserFunctions[tflite::BuiltinOperator_DEPTHWISE_CONV_2D] = &TfLiteParser::ParseDepthwiseConv2D; + m_ParserFunctions[tflite::BuiltinOperator_SOFTMAX] = &TfLiteParser::ParseSoftmax; + m_ParserFunctions[tflite::BuiltinOperator_SQUEEZE] = &TfLiteParser::ParseSqueeze; +} + +void TfLiteParser::ResetParser() +{ + m_Network = armnn::INetworkPtr(nullptr, nullptr); + m_Model = nullptr; + m_SubgraphConnections.clear(); +} + +INetworkPtr TfLiteParser::CreateNetworkFromBinaryFile(const char* graphFile) +{ + ResetParser(); + m_Model = LoadModelFromFile(graphFile); + return CreateNetworkFromModel(); +} + +INetworkPtr TfLiteParser::CreateNetworkFromBinary(const std::vector<uint8_t> & binaryContent) +{ + ResetParser(); + m_Model = LoadModelFromBinary(binaryContent.data(), binaryContent.size()); + return CreateNetworkFromModel(); +} + +INetworkPtr TfLiteParser::CreateNetworkFromModel() +{ + m_Network = INetwork::Create(); + BOOST_ASSERT(m_Model.get() != nullptr); + + bool failedToCreate = false; + std::stringstream errors; + + if (m_Model->subgraphs.size() != 1) + { + throw ParseException( + boost::str( + boost::format("Current TfLite parser only supports 1 subgraph. Current one has: %1% %2%") % + m_Model->subgraphs.size() % + CHECK_LOCATION().AsString())); + } + + size_t subgraphIndex = 0; + for (SubGraphPtr const & subgraph : m_Model->subgraphs) + { + m_SubgraphConnections.emplace_back(subgraph->tensors.size()); + + size_t operatorIndex = 0; + for (OperatorPtr const & op : subgraph->operators) + { + try + { + if (op->custom_options.size() > 0) + { + throw ParseException( + boost::str( + boost::format("Custom options for op: %1% is not supported. " + "It has %2% bytes of custom options. %3%") % + op->opcode_index % + op->custom_options.size() % + CHECK_LOCATION().AsString())); + } + + auto const & opCodePtr = m_Model->operator_codes[op->opcode_index]; + auto builtinCode = opCodePtr->builtin_code; + + if (builtinCode > tflite::BuiltinOperator_MAX) + { + throw ParseException( + boost::str( + boost::format("Operator code %1% is out of range 0-%2%. " + "subgraph:%3% operator idx:%4%. %5%") % + builtinCode % + tflite::BuiltinOperator_MAX % + subgraphIndex % + operatorIndex % + CHECK_LOCATION().AsString())); + } + + // lookup and call the parser function + auto & parserFunction = m_ParserFunctions[builtinCode]; + (this->*parserFunction)(subgraphIndex, operatorIndex); + } + catch (const ParseException& e) + { + failedToCreate = true; + std::stringstream errorString; + + errorString << "Failed to parse operator #" << operatorIndex + << " within subgraph #" << subgraphIndex + << " error: " << e.what(); + BOOST_LOG_TRIVIAL(error) << errorString.str(); + + errors << errorString.str() << "\n"; + } + ++operatorIndex; + } + + SetupInputLayers(subgraphIndex); + SetupOutputLayers(subgraphIndex); + + ++subgraphIndex; + } + + if (failedToCreate) + { + // we can skip everything and let the outer exception handler deal with the error + throw ParseException(errors.str()); + } + + // establish the connections from the layer outputs to the inputs of the subsequent layers + for (size_t subgraphIndex = 0; subgraphIndex < m_SubgraphConnections.size(); ++subgraphIndex) + { + for (size_t tensorIndex = 0; tensorIndex < m_SubgraphConnections[subgraphIndex].size(); ++tensorIndex) + { + if (m_SubgraphConnections[subgraphIndex][tensorIndex].outputSlot != nullptr) + { + for (size_t inputSlotIdx = 0; + inputSlotIdx < m_SubgraphConnections[subgraphIndex][tensorIndex].inputSlots.size(); + ++inputSlotIdx) + { + m_SubgraphConnections[subgraphIndex][tensorIndex].outputSlot->Connect( + *(m_SubgraphConnections[subgraphIndex][tensorIndex].inputSlots[inputSlotIdx])); + } + } + } + } + + return std::move(m_Network); +} + +void TfLiteParser::RegisterProducerOfTensor(size_t subgraphIndex, + size_t tensorIndex, + armnn::IOutputSlot* slot) +{ + CHECK_TENSOR(m_Model, subgraphIndex, tensorIndex); + BOOST_ASSERT(m_SubgraphConnections.size() > subgraphIndex); + BOOST_ASSERT(m_SubgraphConnections[subgraphIndex].size() > tensorIndex); + + TensorSlots & tensorSlots = m_SubgraphConnections[subgraphIndex][tensorIndex]; + + // assuming there is only one producer for that tensor + if (tensorSlots.outputSlot != nullptr) + { + throw ParseException(boost::str( + boost::format("Another layer has already registered itself as the producer of " + "subgraph:%1% tensor:%2% %3%") % + subgraphIndex % + tensorIndex % + CHECK_LOCATION().AsString())); + } + + tensorSlots.outputSlot = slot; +} + +void TfLiteParser::RegisterConsumerOfTensor(size_t subgraphIndex, + size_t tensorIndex, + armnn::IInputSlot* slot) +{ + CHECK_TENSOR(m_Model, subgraphIndex, tensorIndex); + BOOST_ASSERT(m_SubgraphConnections.size() > subgraphIndex); + BOOST_ASSERT(m_SubgraphConnections[subgraphIndex].size() > tensorIndex); + + TensorSlots & tensorSlots = m_SubgraphConnections[subgraphIndex][tensorIndex]; + tensorSlots.inputSlots.push_back(slot); +} + +void TfLiteParser::ParseUnsupportedOperator(size_t subgraphIndex, size_t operatorIndex) +{ + CHECK_MODEL(m_Model, subgraphIndex, operatorIndex); + const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex]; + // + auto opcodeIndex = operatorPtr->opcode_index; + auto opcode = m_Model->operator_codes[opcodeIndex]->builtin_code; + + throw ParseException( + boost::str( + boost::format("Operator not supported. " + "subgraph:%1% operator:%2% " + "opcode_index:%3% opcode:%4% / %5% %6%") % + subgraphIndex % + operatorIndex % + opcodeIndex % + opcode % + tflite::EnumNameBuiltinOperator(opcode) % + CHECK_LOCATION().AsString())); +} + +void TfLiteParser::ParseAveragePool2D(size_t subgraphIndex, size_t operatorIndex) +{ + CHECK_MODEL(m_Model, subgraphIndex, operatorIndex); + + const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex]; + const auto * options = operatorPtr->builtin_options.AsPool2DOptions(); + + CHECK_SUPPORTED_FUSED_ACTIVATION(options, subgraphIndex, operatorIndex); + + Pooling2dDescriptor desc; + + desc.m_PoolType = PoolingAlgorithm::Average; + desc.m_StrideX = CHECKED_NON_NEGATIVE(options->stride_w); + desc.m_StrideY = CHECKED_NON_NEGATIVE(options->stride_h); + desc.m_PoolWidth = CHECKED_NON_NEGATIVE(options->filter_width); + desc.m_PoolHeight = CHECKED_NON_NEGATIVE(options->filter_height); + desc.m_PaddingMethod = PaddingMethod::Exclude; + desc.m_OutputShapeRounding = OutputShapeRounding::Floor; + + auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex); + CHECK_VALID_SIZE(inputs.size(), 1); + armnn::TensorInfo inputTensorInfo = ToTensorInfo(inputs[0]); + + // assuming input is NHWC + unsigned int inputHeight = inputTensorInfo.GetShape()[1]; + unsigned int inputWidth = inputTensorInfo.GetShape()[2]; + + CalcPadding(inputHeight, desc.m_PoolHeight, desc.m_StrideY, desc.m_PadTop, desc.m_PadBottom, options->padding); + CalcPadding(inputWidth, desc.m_PoolWidth, desc.m_StrideX, desc.m_PadLeft, desc.m_PadRight, options->padding); + + auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex); + CHECK_VALID_SIZE(outputs.size(), 1); + armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]); + + auto layerName = boost::str(boost::format("AveragePool2D:%1%:%2%") % subgraphIndex % operatorIndex); + IConnectableLayer* layer = m_Network->AddPooling2dLayer(desc, layerName.c_str()); + + BOOST_ASSERT(layer != nullptr); + + // add permute layers to swizzle the input and deswizzle the output + std::pair<IConnectableLayer*, IConnectableLayer*> permuteLayers = + SwizzleInDeswizzleOut(*m_Network, layer, 0, inputTensorInfo, 0, outputTensorInfo); + + // register the input connection slots for the layer, connections are made after all layers have been created + // only the tensors for the inputs are relevant, exclude the const tensors + auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex)); + RegisterInputSlots(subgraphIndex, operatorIndex, permuteLayers.first, {inputTensorIndexes[0]}); + + // we need to add the activation layer and fortunately we don't need to care about the data layout + // beause the activation function is element-wise, so it is OK to have the activation after the trailing + // swizzle layer + layer = AddActivationLayer(permuteLayers.second, 0, options->fused_activation_function); + // register the output connection slots for the layer, connections are made after all layers have been created + auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex)); + RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]}); +} + +void TfLiteParser::ParseConv2D(size_t subgraphIndex, size_t operatorIndex) +{ + CHECK_MODEL(m_Model, subgraphIndex, operatorIndex); + + const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex]; + const auto * options = operatorPtr->builtin_options.AsConv2DOptions(); + + CHECK_SUPPORTED_FUSED_ACTIVATION(options, subgraphIndex, operatorIndex); + + Convolution2dDescriptor desc; + desc.m_BiasEnabled = false; + desc.m_StrideX = CHECKED_NON_NEGATIVE(options->stride_w); + desc.m_StrideY = CHECKED_NON_NEGATIVE(options->stride_h); + + auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex); + CHECK_VALID_SIZE(inputs.size(), 2, 3); + + auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex); + CHECK_VALID_SIZE(outputs.size(), 1); + + armnn::TensorInfo inputTensorInfo = ToTensorInfo(inputs[0]); + armnn::TensorInfo filterTensorInfo = ToTensorInfo(inputs[1]); + + // assuming input is NHWC + unsigned int inputHeight = inputTensorInfo.GetShape()[1]; + unsigned int inputWidth = inputTensorInfo.GetShape()[2]; + + // assuming the filter is OHWI : Output, H, W, Input + // which is essentially the same as NHWC + unsigned int filterHeight = filterTensorInfo.GetShape()[1]; + unsigned int filterWidth = filterTensorInfo.GetShape()[2]; + + CalcPadding(inputHeight, filterHeight, desc.m_StrideY, desc.m_PadTop, desc.m_PadBottom, options->padding); + CalcPadding(inputWidth, filterWidth, desc.m_StrideX, desc.m_PadLeft, desc.m_PadRight, options->padding); + + auto filterTensorAndData = CreateConstTensor(inputs[1], filterTensorInfo, true); + armnn::IConnectableLayer* layer; + + auto layerName = boost::str(boost::format("Conv2D:%1%:%2%") % subgraphIndex % operatorIndex); + + if (inputs.size() == 3) + { + desc.m_BiasEnabled = true; + armnn::TensorInfo biasTensorInfo = ToTensorInfo(inputs[2]); + auto biasTensorAndData = CreateConstTensor(inputs[2], biasTensorInfo, false); + layer = m_Network->AddConvolution2dLayer(desc, + filterTensorAndData.first, + biasTensorAndData.first, + layerName.c_str()); + } + else + { + layer = m_Network->AddConvolution2dLayer(desc, + filterTensorAndData.first, + layerName.c_str()); + } + + BOOST_ASSERT(layer != nullptr); + + // add permute layers to swizzle the input and deswizzle the output + armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]); + std::pair<IConnectableLayer*, IConnectableLayer*> permuteLayers = + SwizzleInDeswizzleOut(*m_Network, layer, 0, inputTensorInfo, 0, outputTensorInfo); + + // register the input connection slots for the layer, connections are made after all layers have been created + // only the tensors for the inputs are relevant, exclude the const tensors + auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex)); + RegisterInputSlots(subgraphIndex, operatorIndex, permuteLayers.first, {inputTensorIndexes[0]}); + + // we need to add the activation layer and fortunately we don't need to care about the data layout + // beause the activation function is element-wise, so it is OK to have the activation after the trailing + // swizzle layer + layer = AddActivationLayer(permuteLayers.second, 0, options->fused_activation_function); + // register the output connection slots for the layer, connections are made after all layers have been created + auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex)); + RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]}); +} + +void TfLiteParser::ParseDepthwiseConv2D(size_t subgraphIndex, size_t operatorIndex) +{ + CHECK_MODEL(m_Model, subgraphIndex, operatorIndex); + + const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex]; + const auto * options = operatorPtr->builtin_options.AsDepthwiseConv2DOptions(); + + CHECK_SUPPORTED_FUSED_ACTIVATION(options, subgraphIndex, operatorIndex); + + DepthwiseConvolution2dDescriptor desc; + desc.m_BiasEnabled = false; + desc.m_StrideX = CHECKED_NON_NEGATIVE(options->stride_w); + desc.m_StrideY = CHECKED_NON_NEGATIVE(options->stride_h); + // ACL only supports a depth (channel) multiplier of 1, it is not currently stored in the descriptor + CHECK_VALID_SIZE(CHECKED_NON_NEGATIVE(options->depth_multiplier), 1); + + auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex); + CHECK_VALID_SIZE(inputs.size(), 2, 3); + auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex); + CHECK_VALID_SIZE(outputs.size(), 1); + + armnn::TensorInfo inputTensorInfo = ToTensorInfo(inputs[0]); + armnn::TensorInfo filterTensorInfo = ToTensorInfo(inputs[1]); + + // assuming input is NHWC + unsigned int inputHeight = inputTensorInfo.GetShape()[1]; + unsigned int inputWidth = inputTensorInfo.GetShape()[2]; + // assuming the filter is OHWI : Output, H, W, Input + unsigned int filterHeight = filterTensorInfo.GetShape()[1]; + unsigned int filterWidth = filterTensorInfo.GetShape()[2]; + + CalcPadding(inputHeight, filterHeight, desc.m_StrideY, desc.m_PadTop, desc.m_PadBottom, options->padding); + CalcPadding(inputWidth, filterWidth, desc.m_StrideX, desc.m_PadLeft, desc.m_PadRight, options->padding); + + auto filterTensorAndData = CreateConstTensor(inputs[1], filterTensorInfo, true); + armnn::IConnectableLayer* layer; + auto layerName = boost::str(boost::format("DepthwiseConv2D:%1%:%2%") % subgraphIndex % operatorIndex); + + if (inputs.size() == 3) + { + desc.m_BiasEnabled = true; + TensorInfo biasTensorInfo = ToTensorInfo(inputs[2]); + auto biasTensorAndData = CreateConstTensor(inputs[2], biasTensorInfo, false); + layer = m_Network->AddDepthwiseConvolution2dLayer(desc, + filterTensorAndData.first, + biasTensorAndData.first, + layerName.c_str()); + } + else + { + layer = m_Network->AddDepthwiseConvolution2dLayer(desc, + filterTensorAndData.first, + layerName.c_str()); + } + BOOST_ASSERT(layer != nullptr); + + // add permute layers to swizzle the input and deswizzle the output + armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]); + std::pair<IConnectableLayer*, IConnectableLayer*> permuteLayers = + SwizzleInDeswizzleOut(*m_Network, layer, 0, inputTensorInfo, 0, outputTensorInfo); + + // register the input connection slots for the layer, connections are made after all layers have been created + // only the tensors for the inputs are relevant, exclude the const tensors + auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex)); + RegisterInputSlots(subgraphIndex, operatorIndex, permuteLayers.first, {inputTensorIndexes[0]}); + + // we need to add the activation layer and fortunately we don't need to care about the data layout + // beause the activation function is element-wise, so it is OK to have the activation after the trailing + // swizzle layer + layer = AddActivationLayer(permuteLayers.second, 0, options->fused_activation_function); + // register the output connection slots for the layer, connections are made after all layers have been created + auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex)); + RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]}); +} + +void TfLiteParser::ParseSoftmax(size_t subgraphIndex, size_t operatorIndex) +{ + CHECK_MODEL(m_Model, subgraphIndex, operatorIndex); + const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex]; + const auto * options = operatorPtr->builtin_options.AsSoftmaxOptions(); + + SoftmaxDescriptor desc; + desc.m_Beta = options->beta; + + auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex); + CHECK_VALID_SIZE(inputs.size(), 1); + auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex); + CHECK_VALID_SIZE(outputs.size(), 1); + + auto layerName = boost::str(boost::format("Softmax:%1%:%2%") % subgraphIndex % operatorIndex); + IConnectableLayer* const layer = m_Network->AddSoftmaxLayer(desc, layerName.c_str()); + + armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]); + layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo); + + // register the input connection slots for the layer, connections are made after all layers have been created + // only the tensors for the inputs are relevant, exclude the const tensors + auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex)); + RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]}); + + // register the output connection slots for the layer, connections are made after all layers have been created + auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex)); + RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]}); +} + +armnn::TensorInfo TfLiteParser::OutputShapeOfSqueeze(const std::vector<uint32_t> & squeezeDimsIn, + const armnn::TensorInfo & inputTensorInfo) +{ + CHECK_VALID_SIZE(squeezeDimsIn.size(), 0, 1, 2, 3, 4); + std::vector<uint32_t> squeezeDims = squeezeDimsIn; + static const uint32_t dimensionSequence[] = { 0, 1, 2, 3 }; + + if (inputTensorInfo.GetNumDimensions() > 4) + { + std::stringstream ss; + ss << "Input tensor has unexpected number of dimensions:" << inputTensorInfo.GetNumDimensions() + << " shape:" << inputTensorInfo.GetShape() << " " + << CHECK_LOCATION().AsString(); + throw ParseException(ss.str()); + } + + if (squeezeDims.empty()) + { + squeezeDims.assign(dimensionSequence, + dimensionSequence+inputTensorInfo.GetNumDimensions()); + } + + std::vector<uint32_t> outputDims; + for(unsigned int i = 0; i < inputTensorInfo.GetNumDimensions(); i++) + { + bool skipSqueeze = (std::find(squeezeDims.begin(), squeezeDims.end(), i) == squeezeDims.end()); + auto currentDimension = inputTensorInfo.GetShape()[i]; + if (skipSqueeze || currentDimension != 1) + { + outputDims.push_back(currentDimension); + } + } + + if (outputDims.size() > 4) + { + std::stringstream ss; + ss << "Output tensor has unexpected number of dimensions:" << inputTensorInfo.GetNumDimensions() + << " shape:" << inputTensorInfo.GetShape() << " " + << CHECK_LOCATION().AsString(); + throw ParseException(ss.str()); + } + + TensorShape outShape = TensorShape(static_cast<unsigned int>(outputDims.size()), + outputDims.data()); + + // we need to preserve the tensor type and the quantization data as well + TensorInfo outTensorInfo = inputTensorInfo; + outTensorInfo.SetShape(outShape); + + return outTensorInfo; +} + +void TfLiteParser::ParseSqueeze(size_t subgraphIndex, size_t operatorIndex) +{ + CHECK_MODEL(m_Model, subgraphIndex, operatorIndex); + + auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex); + CHECK_VALID_SIZE(inputs.size(), 1); + + auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex); + CHECK_VALID_SIZE(outputs.size(), 1); + + const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex]; + const auto * options = operatorPtr->builtin_options.AsSqueezeOptions(); + + armnn::TensorInfo inputTensorInfo = ToTensorInfo(inputs[0]); + armnn::TensorInfo outputTensorInfo = + TfLiteParser::OutputShapeOfSqueeze(AsUnsignedVector(options->squeeze_dims), + inputTensorInfo); + + ReshapeDescriptor reshapeDesc; + reshapeDesc.m_TargetShape = outputTensorInfo.GetShape(); + + auto layerName = boost::str(boost::format("Squeeze:%1%:%2%") % subgraphIndex % operatorIndex); + IConnectableLayer* layer = m_Network->AddReshapeLayer(reshapeDesc, layerName.c_str()); + layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo); + + auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex)); + RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]}); + + auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex)); + RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]}); +} + +armnn::IConnectableLayer* TfLiteParser::AddActivationLayer(armnn::IConnectableLayer* prevLayer, + unsigned int outputSlot, + tflite::ActivationFunctionType activationType) +{ + ActivationDescriptor activationDesc; + std::string layerName = prevLayer->GetName(); + + switch(activationType) + { + case tflite::ActivationFunctionType_NONE: + { + // this is a no-op: return previous layer + return prevLayer; + } + case tflite::ActivationFunctionType_RELU: + { + activationDesc.m_Function = ActivationFunction::ReLu; + layerName += ":RELU"; + break; + } + case tflite::ActivationFunctionType_RELU6: + { + activationDesc.m_Function = ActivationFunction::BoundedReLu; + activationDesc.m_A = 6.0f; + activationDesc.m_B = 0.0f; + layerName += ":RELU6"; + break; + } + case tflite::ActivationFunctionType_TANH: + { + activationDesc.m_Function = ActivationFunction::TanH; + activationDesc.m_A = 1.0f; + activationDesc.m_B = 1.0f; + layerName += ":TANH"; + break; + } + + // I only put these here as a reminder what others we could support + case tflite::ActivationFunctionType_RELU_N1_TO_1: + case tflite::ActivationFunctionType_SIGN_BIT: + default: + { + throw ParseException( + boost::str( + boost::format("TfLite parser doesn't suppport fused activation: " + "%1%/%2% %3% ") % + activationType % + tflite::EnumNameActivationFunctionType(activationType) % + CHECK_LOCATION().AsString())); + + } + } + + IConnectableLayer* activationLayer = + m_Network->AddActivationLayer(activationDesc, layerName.c_str()); + + auto & prevOutputSlot = prevLayer->GetOutputSlot(outputSlot); + prevOutputSlot.Connect(activationLayer->GetInputSlot(0)); + activationLayer->GetOutputSlot(0).SetTensorInfo(prevOutputSlot.GetTensorInfo()); + return activationLayer; +} + +TfLiteParser::ModelPtr TfLiteParser::LoadModelFromFile(const char * fileName) +{ + if (fileName == nullptr) + { + throw InvalidArgumentException(boost::str(boost::format("Invalid (null) file name %1%") % + CHECK_LOCATION().AsString())); + } + boost::system::error_code errorCode; + boost::filesystem::path pathToFile(fileName); + if (!boost::filesystem::exists(pathToFile, errorCode)) + { + throw FileNotFoundException(boost::str(boost::format("Cannot find the file (%1%) errorCode: %2% %3%") % + fileName % + errorCode % + CHECK_LOCATION().AsString())); + } + std::ifstream file(fileName, std::ios::binary); + std::string fileContent((std::istreambuf_iterator<char>(file)), std::istreambuf_iterator<char>()); + return LoadModelFromBinary(reinterpret_cast<const uint8_t *>(fileContent.c_str()), + fileContent.size()); +} + +TfLiteParser::ModelPtr TfLiteParser::LoadModelFromBinary(const uint8_t * binaryContent, size_t len) +{ + if (binaryContent == nullptr) + { + throw InvalidArgumentException(boost::str(boost::format("Invalid (null) binary content %1%") % + CHECK_LOCATION().AsString())); + } + flatbuffers::Verifier verifier(binaryContent, len); + if (verifier.VerifyBuffer<tflite::Model>() == false) + { + throw ParseException( + boost::str(boost::format("Buffer doesn't conform to the expected Tensorflow Lite " + "flatbuffers format. size:%1% %2%") % + len % + CHECK_LOCATION().AsString())); + } + return tflite::UnPackModel(binaryContent); +} + +TfLiteParser::TensorRawPtrVector TfLiteParser::GetInputs(const ModelPtr & model, + size_t subgraphIndex, + size_t operatorIndex) +{ + CHECK_MODEL(model, subgraphIndex, operatorIndex); + + const auto & subGraphPtr = model->subgraphs[subgraphIndex]; + const auto & operatorPtr = subGraphPtr->operators[operatorIndex]; + + size_t inputCount = operatorPtr->inputs.size(); + TensorRawPtrVector result(inputCount); + for (size_t i=0; i<inputCount; ++i) + { + uint32_t inputId = CHECKED_NON_NEGATIVE(operatorPtr->inputs[i]); + result[i] = subGraphPtr->tensors[inputId].get(); + } + return result; +} + +TfLiteParser::TensorRawPtrVector TfLiteParser::GetOutputs(const ModelPtr & model, + size_t subgraphIndex, + size_t operatorIndex) +{ + CHECK_MODEL(model, subgraphIndex, operatorIndex); + + const auto & subGraphPtr = model->subgraphs[subgraphIndex]; + const auto & operatorPtr = subGraphPtr->operators[operatorIndex]; + + size_t outputCount = operatorPtr->outputs.size(); + TensorRawPtrVector result(outputCount); + for (size_t i=0; i<outputCount; ++i) + { + uint32_t outputId = CHECKED_NON_NEGATIVE(operatorPtr->outputs[i]); + CHECK_TENSOR(model, subgraphIndex, outputId); + result[i] = subGraphPtr->tensors[outputId].get(); + } + return result; +} + +TfLiteParser::TensorIdRawPtrVector TfLiteParser::GetSubgraphInputs(const ModelPtr & model, + size_t subgraphIndex) +{ + CHECK_SUBGRAPH(model, subgraphIndex); + const auto & subGraphPtr = model->subgraphs[subgraphIndex]; + + size_t inputCount = subGraphPtr->inputs.size(); + TensorIdRawPtrVector result(inputCount); + for (size_t i=0; i<inputCount; ++i) + { + uint32_t inputId = CHECKED_NON_NEGATIVE(subGraphPtr->inputs[i]); + CHECK_TENSOR(model, subgraphIndex, inputId); + result[i] = std::make_pair(inputId, subGraphPtr->tensors[inputId].get()); + } + return result; +} + +TfLiteParser::TensorIdRawPtrVector TfLiteParser::GetSubgraphOutputs(const ModelPtr & model, + size_t subgraphIndex) +{ + CHECK_SUBGRAPH(model, subgraphIndex); + const auto & subGraphPtr = model->subgraphs[subgraphIndex]; + + size_t outputCount = subGraphPtr->outputs.size(); + TensorIdRawPtrVector result(outputCount); + for (size_t i=0; i<outputCount; ++i) + { + uint32_t outputId = CHECKED_NON_NEGATIVE(subGraphPtr->outputs[i]); + result[i] = std::make_pair(outputId, subGraphPtr->tensors[outputId].get()); + } + return result; +} + +std::vector<int32_t>& TfLiteParser::GetInputTensorIds(const ModelPtr& model, + size_t subgraphIndex, + size_t operatorIndex) +{ + CHECK_MODEL(model, subgraphIndex, operatorIndex); + const auto & subGraphPtr = model->subgraphs[subgraphIndex]; + const auto & operatorPtr = subGraphPtr->operators[operatorIndex]; + return operatorPtr->inputs; +} + +std::vector<int32_t>& TfLiteParser::GetOutputTensorIds(const ModelPtr& model, + size_t subgraphIndex, + size_t operatorIndex) +{ + CHECK_MODEL(model, subgraphIndex, operatorIndex); + const auto & subGraphPtr = model->subgraphs[subgraphIndex]; + const auto & operatorPtr = subGraphPtr->operators[operatorIndex]; + return operatorPtr->outputs; +} + +void TfLiteParser::RegisterInputSlots(size_t subgraphIndex, + size_t operatorIndex, + IConnectableLayer* layer, + const std::vector<unsigned int>& tensorIndexes) +{ + CHECK_MODEL(m_Model, subgraphIndex, operatorIndex); + BOOST_ASSERT(layer != nullptr); + if (tensorIndexes.size() != layer->GetNumInputSlots()) + { + throw ParseException( + boost::str(boost::format("The number of tensor inputs (%1%) does not match the number expected (%2%)" + " for subgraph:%3% operator index:%4% %5%") % + tensorIndexes.size() % + layer->GetNumInputSlots() % + subgraphIndex % + operatorIndex % + CHECK_LOCATION().AsString())); + } + + for (unsigned int slotIndex = 0; slotIndex < layer->GetNumInputSlots(); ++slotIndex) + { + unsigned int tensorIndex = tensorIndexes[slotIndex]; + armnn::IInputSlot* slot = &(layer->GetInputSlot(slotIndex)); + RegisterConsumerOfTensor(subgraphIndex, tensorIndex, slot); + } +} + +void TfLiteParser::RegisterOutputSlots(size_t subgraphIndex, + size_t operatorIndex, + IConnectableLayer* layer, + const std::vector<unsigned int>& tensorIndexes) +{ + CHECK_MODEL(m_Model, subgraphIndex, operatorIndex); + BOOST_ASSERT(layer != nullptr); + if (tensorIndexes.size() != layer->GetNumOutputSlots()) + { + throw ParseException( + boost::str(boost::format("The number of tensor outputs (%1%) does not match the number expected (%2%)" + " for subgraph:%3% operator index:%4% %5%") % + tensorIndexes.size() % + layer->GetNumOutputSlots() % + subgraphIndex % + operatorIndex % + CHECK_LOCATION().AsString())); + } + + for (unsigned int slotIndex = 0; slotIndex < layer->GetNumOutputSlots(); ++slotIndex) + { + unsigned int tensorIndex = tensorIndexes[slotIndex]; + armnn::IOutputSlot* slot = &(layer->GetOutputSlot(slotIndex)); + RegisterProducerOfTensor(subgraphIndex, tensorIndex, slot); + } +} + +void TfLiteParser::SetupInputLayers(size_t subgraphIndex) +{ + CHECK_SUBGRAPH(m_Model, subgraphIndex); + + auto inputs = GetSubgraphInputs(m_Model, subgraphIndex); + for (auto const & tensorIdAndPtr : inputs) + { + auto bindingId = GenerateLayerBindingId(subgraphIndex, tensorIdAndPtr.first); + IConnectableLayer* layer = + m_Network->AddInputLayer(bindingId, tensorIdAndPtr.second->name.c_str()); + + auto tensorInfo = ToTensorInfo(tensorIdAndPtr.second); + layer->GetOutputSlot(0).SetTensorInfo(tensorInfo); + + RegisterOutputSlots(subgraphIndex, + VIRTUAL_OPERATOR_ID, + layer, + { static_cast<uint32_t>(tensorIdAndPtr.first) }); + } +} + +void TfLiteParser::SetupOutputLayers(size_t subgraphIndex) +{ + CHECK_SUBGRAPH(m_Model, subgraphIndex); + + auto outputs = GetSubgraphOutputs(m_Model, subgraphIndex); + for (auto const & tensorIdAndPtr : outputs) + { + auto bindingId = GenerateLayerBindingId(subgraphIndex, tensorIdAndPtr.first); + IConnectableLayer* layer = + m_Network->AddOutputLayer(bindingId, tensorIdAndPtr.second->name.c_str()); + + RegisterInputSlots(subgraphIndex, + VIRTUAL_OPERATOR_ID, + layer, + { static_cast<uint32_t>(tensorIdAndPtr.first) }); + } +} + +// example usage: BufferRawPtr bufferPtr = GetBuffer(m_Model, inputs[0]->buffer); +TfLiteParser::BufferRawPtr TfLiteParser::GetBuffer(const ModelPtr& model, size_t bufferIndex) +{ + CHECK_BUFFER(model, bufferIndex); + return model->buffers[bufferIndex].get(); +} + +std::pair<armnn::ConstTensor, TfLiteParser::SupportedDataStorage> +TfLiteParser::CreateConstTensor(TensorRawPtr tensorPtr, + armnn::TensorInfo & tensorInfo, + bool convertFromTfToArmnnFormat) +{ + CHECK_TENSOR_PTR(tensorPtr); + auto bufferPtr = GetBuffer(m_Model, tensorPtr->buffer); + CHECK_BUFFER_SIZE(bufferPtr, tensorInfo, tensorPtr->buffer); + + switch (tensorInfo.GetDataType()) + { + case armnn::DataType::Float32: + { + auto constData = CreateConstTensorImpl<float>(bufferPtr, + tensorPtr, + tensorInfo, + convertFromTfToArmnnFormat); + SupportedDataStorage storage(std::move(constData.second)); + return std::make_pair(constData.first, std::move(storage)); + } + case armnn::DataType::QuantisedAsymm8: + { + auto constData = CreateConstTensorImpl<uint8_t>(bufferPtr, + tensorPtr, + tensorInfo, + convertFromTfToArmnnFormat); + SupportedDataStorage storage(std::move(constData.second)); + return std::make_pair(constData.first, std::move(storage)); + } + case armnn::DataType::Signed32: + { + auto constData = CreateConstTensorImpl<int32_t>(bufferPtr, + tensorPtr, + tensorInfo, + convertFromTfToArmnnFormat); + SupportedDataStorage storage(std::move(constData.second)); + return std::make_pair(constData.first, std::move(storage)); + } + default: + { + std::stringstream errString; + errString << "Unexpected datatype when creating const tensor: " + << armnn::GetDataTypeName(tensorInfo.GetDataType()) + << " shape:" << tensorInfo.GetShape() + << CHECK_LOCATION().AsString(); + throw ParseException(errString.str()); + } + } +} + +BindingPointInfo TfLiteParser::GetNetworkInputBindingInfo(size_t subgraphId, + const std::string& name) const +{ + CHECK_SUBGRAPH(m_Model, subgraphId); + auto inputs = GetSubgraphInputs(m_Model, subgraphId); + for (auto const & input : inputs) + { + if (input.second->name == name) + { + auto bindingId = GenerateLayerBindingId(subgraphId, input.first); + return std::make_pair(bindingId, ToTensorInfo(input.second)); + } + } + + std::stringstream bindings; + for (auto const & input : inputs) + { + bindings << "'" << input.second->name << "' "; + } + + throw ParseException( + boost::str( + boost::format("No input binding found for subgraph:%1% and name:%2%. " + "Possible inputs are: [%3%] %4%") % + subgraphId % + name % + bindings.str() % + CHECK_LOCATION().AsString())); +} + +BindingPointInfo TfLiteParser::GetNetworkOutputBindingInfo(size_t subgraphId, + const std::string& name) const +{ + CHECK_SUBGRAPH(m_Model, subgraphId); + auto outputs = GetSubgraphOutputs(m_Model, subgraphId); + for (auto const & output : outputs) + { + if (output.second->name == name) + { + auto bindingId = GenerateLayerBindingId(subgraphId, output.first); + return std::make_pair(bindingId, ToTensorInfo(output.second)); + } + } + + std::stringstream bindings; + for (auto const & output : outputs) + { + bindings << "'" << output.second->name << "' "; + } + + throw ParseException( + boost::str( + boost::format("No output binding found for subgraph:%1% and name:%2%. " + "Possible outputs are: [%3%] %4%") % + subgraphId % + name % + bindings.str() % + CHECK_LOCATION().AsString())); +} + +size_t TfLiteParser::GetSubgraphCount() const +{ + return m_Model->subgraphs.size(); +} + +std::vector<std::string> TfLiteParser::GetSubgraphInputTensorNames(size_t subgraphId) const +{ + CHECK_SUBGRAPH(m_Model, subgraphId); + auto inputs = GetSubgraphInputs(m_Model, subgraphId); + std::vector<std::string> result; + result.reserve(inputs.size()); + for (auto const & input : inputs) + { + result.push_back(input.second->name); + } + return result; +} + +std::vector<std::string> TfLiteParser::GetSubgraphOutputTensorNames(size_t subgraphId) const +{ + CHECK_SUBGRAPH(m_Model, subgraphId); + auto outputs = GetSubgraphOutputs(m_Model, subgraphId); + std::vector<std::string> result; + result.reserve(outputs.size()); + for (auto const & output : outputs) + { + result.push_back(output.second->name); + } + return result; +} + +ITfLiteParser* ITfLiteParser::CreateRaw() +{ + return new TfLiteParser(); +} + +ITfLiteParserPtr ITfLiteParser::Create() +{ + return ITfLiteParserPtr(CreateRaw(), &ITfLiteParser::Destroy); +} + +void ITfLiteParser::Destroy(ITfLiteParser* parser) +{ + delete parser; +} + +TfLiteParser::SupportedDataStorage::SupportedDataStorage(std::unique_ptr<float[]> && data) +: m_FloatData(std::move(data)) +, m_Uint8Data(nullptr) +, m_Int32Data(nullptr) +{ +} + +TfLiteParser::SupportedDataStorage::SupportedDataStorage(std::unique_ptr<uint8_t[]> && data) +: m_FloatData(nullptr) +, m_Uint8Data(std::move(data)) +, m_Int32Data(nullptr) +{ +} + +TfLiteParser::SupportedDataStorage::SupportedDataStorage(std::unique_ptr<int32_t[]> && data) +: m_FloatData(nullptr) +, m_Uint8Data(nullptr) +, m_Int32Data(std::move(data)) +{ +} + +} // armnnTfLiteParser |