ArmNN
 20.05
Deserializer.hpp
Go to the documentation of this file.
1 //
2 // Copyright © 2017 Arm Ltd. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 
6 #pragma once
7 
8 #include "armnn/INetwork.hpp"
10 #include <ArmnnSchema_generated.h>
11 
12 #include <unordered_map>
13 
14 namespace armnnDeserializer
15 {
17 {
18 public:
19  // Shorthands for deserializer types
20  using ConstTensorRawPtr = const armnnSerializer::ConstTensor *;
21  using GraphPtr = const armnnSerializer::SerializedGraph *;
22  using TensorRawPtr = const armnnSerializer::TensorInfo *;
23  using PoolingDescriptor = const armnnSerializer::Pooling2dDescriptor *;
24  using NormalizationDescriptorPtr = const armnnSerializer::NormalizationDescriptor *;
25  using LstmDescriptorPtr = const armnnSerializer::LstmDescriptor *;
26  using LstmInputParamsPtr = const armnnSerializer::LstmInputParams *;
27  using QLstmDescriptorPtr = const armnnSerializer::QLstmDescriptor *;
28  using QunatizedLstmInputParamsPtr = const armnnSerializer::QuantizedLstmInputParams *;
29  using TensorRawPtrVector = std::vector<TensorRawPtr>;
30  using LayerRawPtr = const armnnSerializer::LayerBase *;
31  using LayerBaseRawPtr = const armnnSerializer::LayerBase *;
32  using LayerBaseRawPtrVector = std::vector<LayerBaseRawPtr>;
33 
34 public:
35 
36  /// Create an input network from binary file contents
37  armnn::INetworkPtr CreateNetworkFromBinary(const std::vector<uint8_t>& binaryContent) override;
38 
39  /// Create an input network from a binary input stream
40  armnn::INetworkPtr CreateNetworkFromBinary(std::istream& binaryContent) override;
41 
42  /// Retrieve binding info (layer id and tensor info) for the network input identified by the given layer name
43  BindingPointInfo GetNetworkInputBindingInfo(unsigned int layerId, const std::string& name) const override;
44 
45  /// Retrieve binding info (layer id and tensor info) for the network output identified by the given layer name
46  BindingPointInfo GetNetworkOutputBindingInfo(unsigned int layerId, const std::string& name) const override;
47 
48  Deserializer();
50 
51 public:
52  // testable helpers
53  static GraphPtr LoadGraphFromBinary(const uint8_t* binaryContent, size_t len);
54  static TensorRawPtrVector GetInputs(const GraphPtr& graph, unsigned int layerIndex);
55  static TensorRawPtrVector GetOutputs(const GraphPtr& graph, unsigned int layerIndex);
56  static LayerBaseRawPtr GetBaseLayer(const GraphPtr& graphPtr, unsigned int layerIndex);
57  static int32_t GetBindingLayerInfo(const GraphPtr& graphPtr, unsigned int layerIndex);
58  static std::string GetLayerName(const GraphPtr& graph, unsigned int index);
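59  static armnn::Pooling2dDescriptor GetPoolingDescriptor(PoolingDescriptor pooling2dDescriptor,
60  unsigned int layerIndex);
61  static armnn::NormalizationDescriptor GetNormalizationDescriptor(
62  NormalizationDescriptorPtr normalizationDescriptor, unsigned int layerIndex);
63  static armnn::LstmDescriptor GetLstmDescriptor(LstmDescriptorPtr lstmDescriptor);
64  static armnn::LstmInputParams GetLstmInputParams(LstmDescriptorPtr lstmDescriptor,
65  LstmInputParamsPtr lstmInputParams);
66  static armnn::QLstmDescriptor GetQLstmDescriptor(QLstmDescriptorPtr qLstmDescriptorPtr);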
67  static armnn::TensorInfo OutputShapeOfReshape(const armnn::TensorInfo & inputTensorInfo,
68  const std::vector<uint32_t> & targetDimsIn);
69 
70 private:
71  // No copying allowed until it is wanted and properly implemented
72  Deserializer(const Deserializer&) = delete;
73  Deserializer& operator=(const Deserializer&) = delete;
74 
75  /// Create the network from an already loaded flatbuffers graph
76  armnn::INetworkPtr CreateNetworkFromGraph(GraphPtr graph);
77 
78  // signature for the parser functions
79  using LayerParsingFunction = void(Deserializer::*)(GraphPtr graph, unsigned int layerIndex);
80 
81  void ParseUnsupportedLayer(GraphPtr graph, unsigned int layerIndex);
82  void ParseAbs(GraphPtr graph, unsigned int layerIndex);
83  void ParseActivation(GraphPtr graph, unsigned int layerIndex);
84  void ParseAdd(GraphPtr graph, unsigned int layerIndex);
85  void ParseArgMinMax(GraphPtr graph, unsigned int layerIndex);
86  void ParseBatchToSpaceNd(GraphPtr graph, unsigned int layerIndex);
87  void ParseBatchNormalization(GraphPtr graph, unsigned int layerIndex);
88  void ParseComparison(GraphPtr graph, unsigned int layerIndex);
89  void ParseConcat(GraphPtr graph, unsigned int layerIndex);
90  void ParseConstant(GraphPtr graph, unsigned int layerIndex);
91  void ParseConvolution2d(GraphPtr graph, unsigned int layerIndex);
92  void ParseDepthToSpace(GraphPtr graph, unsigned int layerIndex);
93  void ParseDepthwiseConvolution2d(GraphPtr graph, unsigned int layerIndex);
94  void ParseDequantize(GraphPtr graph, unsigned int layerIndex);
95  void ParseDetectionPostProcess(GraphPtr graph, unsigned int layerIndex);
96  void ParseDivision(GraphPtr graph, unsigned int layerIndex);
97  void ParseElementwiseUnary(GraphPtr graph, unsigned int layerIndex);
98  void ParseEqual(GraphPtr graph, unsigned int layerIndex);
99  void ParseFloor(GraphPtr graph, unsigned int layerIndex);
100  void ParseFullyConnected(GraphPtr graph, unsigned int layerIndex);
101  void ParseGather(GraphPtr graph, unsigned int layerIndex);
102  void ParseGreater(GraphPtr graph, unsigned int layerIndex);
103  void ParseInstanceNormalization(GraphPtr graph, unsigned int layerIndex);
104  void ParseL2Normalization(GraphPtr graph, unsigned int layerIndex);
105  void ParseLogSoftmax(GraphPtr graph, unsigned int layerIndex);
106  void ParseMaximum(GraphPtr graph, unsigned int layerIndex);
107  void ParseMean(GraphPtr graph, unsigned int layerIndex);
108  void ParseMinimum(GraphPtr graph, unsigned int layerIndex);
109  void ParseMerge(GraphPtr graph, unsigned int layerIndex);
110  void ParseMultiplication(GraphPtr graph, unsigned int layerIndex);
111  void ParseNormalization(GraphPtr graph, unsigned int layerIndex);
112  void ParseLstm(GraphPtr graph, unsigned int layerIndex);
113  void ParseQuantizedLstm(GraphPtr graph, unsigned int layerIndex);
114  void ParsePad(GraphPtr graph, unsigned int layerIndex);
115  void ParsePermute(GraphPtr graph, unsigned int layerIndex);
116  void ParsePooling2d(GraphPtr graph, unsigned int layerIndex);
117  void ParsePrelu(GraphPtr graph, unsigned int layerIndex);
118  void ParseQLstm(GraphPtr graph, unsigned int layerIndex);
119  void ParseQuantize(GraphPtr graph, unsigned int layerIndex);
120  void ParseReshape(GraphPtr graph, unsigned int layerIndex);
121  void ParseResize(GraphPtr graph, unsigned int layerIndex);
122  void ParseResizeBilinear(GraphPtr graph, unsigned int layerIndex);
123  void ParseRsqrt(GraphPtr graph, unsigned int layerIndex);
124  void ParseSlice(GraphPtr graph, unsigned int layerIndex);
125  void ParseSoftmax(GraphPtr graph, unsigned int layerIndex);
126  void ParseSpaceToBatchNd(GraphPtr graph, unsigned int layerIndex);
127  void ParseSpaceToDepth(GraphPtr graph, unsigned int layerIndex);
128  void ParseSplitter(GraphPtr graph, unsigned int layerIndex);
129  void ParseStack(GraphPtr graph, unsigned int layerIndex);
130  void ParseStandIn(GraphPtr graph, unsigned int layerIndex);
131  void ParseStridedSlice(GraphPtr graph, unsigned int layerIndex);
132  void ParseSubtraction(GraphPtr graph, unsigned int layerIndex);
133  void ParseSwitch(GraphPtr graph, unsigned int layerIndex);
134  void ParseTranspose(GraphPtr graph, unsigned int layerIndex);
135  void ParseTransposeConvolution2d(GraphPtr graph, unsigned int layerIndex);
136 
137  void RegisterInputSlots(GraphPtr graph, uint32_t layerIndex,
138  armnn::IConnectableLayer* layer);
139  void RegisterOutputSlots(GraphPtr graph, uint32_t layerIndex,
140  armnn::IConnectableLayer* layer);
141 
142  // NOTE: the index here must come from the flatbuffer object's index property
143  void RegisterOutputSlotOfConnection(uint32_t sourceLayerIndex, uint32_t outputSlotIndex, armnn::IOutputSlot* slot);
144  void RegisterInputSlotOfConnection(uint32_t sourceLayerIndex, uint32_t outputSlotIndex, armnn::IInputSlot* slot);
145 
146  void ResetParser();
147 
148  void SetupInputLayers(GraphPtr graphPtr);
149  void SetupOutputLayers(GraphPtr graphPtr);
150 
151  /// Helper to get the index of the layer in the flatbuffer vector from its bindingId property
152  unsigned int GetInputLayerInVector(GraphPtr graph, int targetId);
153  unsigned int GetOutputLayerInVector(GraphPtr graph, int targetId);
154 
155  /// Helper to get the index of the layer in the flatbuffer vector from its index property
156  unsigned int GetLayerIndexInVector(GraphPtr graph, unsigned int index);
157 
158  struct FeatureVersions
159  {
160  // Default values to zero for backward compatibility
161  unsigned int m_BindingIdScheme = 0;
162  };
163 
164  FeatureVersions GetFeatureVersions(GraphPtr graph);
165 
166  /// The network we're building. Gets cleared after it is passed to the user
167  armnn::INetworkPtr m_Network;
168  std::vector<LayerParsingFunction> m_ParserFunctions;
169 
170  using NameToBindingInfo = std::pair<std::string, BindingPointInfo >;
171  std::vector<NameToBindingInfo> m_InputBindings;
172  std::vector<NameToBindingInfo> m_OutputBindings;
173 
174  /// This struct describes the connections for each layer
175  struct Connections
176  {
177  // Maps output slot index (property in flatbuffer object) to IOutputSlot pointer
178  std::unordered_map<unsigned int, armnn::IOutputSlot*> outputSlots;
179 
180  // Maps output slot index to IInputSlot pointer the output slot should be connected to
181  std::unordered_map<unsigned int, std::vector<armnn::IInputSlot*>> inputSlots;
182  };
183 
184  /// Maps layer index (index property in flatbuffer object) to Connections for each layer
185  std::unordered_map<unsigned int, Connections> m_GraphConnections;
186 };
187 
188 } // namespace armnnDeserializer
const armnnSerializer::LstmInputParams * LstmInputParamsPtr
static armnn::LstmDescriptor GetLstmDescriptor(LstmDescriptorPtr lstmDescriptor)
const armnnSerializer::QuantizedLstmInputParams * QunatizedLstmInputParamsPtr
Interface for a layer that is connectable to other layers via InputSlots and OutputSlots.
Definition: INetwork.hpp:61
std::vector< LayerBaseRawPtr > LayerBaseRawPtrVector
static GraphPtr LoadGraphFromBinary(const uint8_t *binaryContent, size_t len)
static armnn::NormalizationDescriptor GetNormalizationDescriptor(NormalizationDescriptorPtr normalizationDescriptor, unsigned int layerIndex)
const armnnSerializer::TensorInfo * TensorRawPtr
const armnnSerializer::NormalizationDescriptor * NormalizationDescriptorPtr
static armnn::QLstmDescriptor GetQLstmDescriptor(QLstmDescriptorPtr qLstmDescriptorPtr)
armnn::INetworkPtr CreateNetworkFromBinary(const std::vector< uint8_t > &binaryContent) override
Create an input network from binary file contents.
static std::string GetLayerName(const GraphPtr &graph, unsigned int index)
BindingPointInfo GetNetworkInputBindingInfo(unsigned int layerId, const std::string &name) const override
Retrieve binding info (layer id and tensor info) for the network input identified by the given layer name.
static int32_t GetBindingLayerInfo(const GraphPtr &graphPtr, unsigned int layerIndex)
const armnnSerializer::Pooling2dDescriptor * PoolingDescriptor
An LstmDescriptor for the LstmLayer.
An output connection slot for a layer.
Definition: INetwork.hpp:37
static LayerBaseRawPtr GetBaseLayer(const GraphPtr &graphPtr, unsigned int layerIndex)
A QLstmDescriptor for the QLstmLayer.
const armnnSerializer::LayerBase * LayerRawPtr
BindingPointInfo GetNetworkOutputBindingInfo(unsigned int layerId, const std::string &name) const override
Retrieve binding info (layer id and tensor info) for the network output identified by the given layer name.
std::vector< TensorRawPtr > TensorRawPtrVector
static TensorRawPtrVector GetOutputs(const GraphPtr &graph, unsigned int layerIndex)
const armnnSerializer::SerializedGraph * GraphPtr
const armnnSerializer::ConstTensor * ConstTensorRawPtr
const armnnSerializer::LstmDescriptor * LstmDescriptorPtr
static armnn::Pooling2dDescriptor GetPoolingDescriptor(PoolingDescriptor pooling2dDescriptor, unsigned int layerIndex)
static armnn::LstmInputParams GetLstmInputParams(LstmDescriptorPtr lstmDescriptor, LstmInputParamsPtr lstmInputParams)
const armnnSerializer::QLstmDescriptor * QLstmDescriptorPtr
static TensorRawPtrVector GetInputs(const GraphPtr &graph, unsigned int layerIndex)
std::unique_ptr< INetwork, void(*)(INetwork *network)> INetworkPtr
Definition: INetwork.hpp:101
A Pooling2dDescriptor for the Pooling2dLayer.
const armnnSerializer::LayerBase * LayerBaseRawPtr
A NormalizationDescriptor for the NormalizationLayer.
static armnn::TensorInfo OutputShapeOfReshape(const armnn::TensorInfo &inputTensorInfo, const std::vector< uint32_t > &targetDimsIn)
An input connection slot for a layer.
Definition: INetwork.hpp:24