ArmNN
 22.02
QuantizedLstmLayer.cpp
Go to the documentation of this file.
1 //
2 // Copyright © 2017 Arm Ltd and Contributors. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 #include "QuantizedLstmLayer.hpp"
6 
7 #include "LayerCloneBase.hpp"
8 
10 #include <armnn/TypesUtils.hpp>
13 
14 namespace armnn
15 {
16 
18  : Layer(3, 2, LayerType::QuantizedLstm, name)
19 {
20 }
21 
22 std::unique_ptr<IWorkload> QuantizedLstmLayer::CreateWorkload(const IWorkloadFactory& factory) const
23 {
25 
26  // QuantizedLstmLayer parameters - there are no optional params
31 
36 
41 
42  SetAdditionalInfo(descriptor);
43 
44  return factory.CreateWorkload(LayerType::QuantizedLstm, descriptor, PrepInfoAndDesc(descriptor));
45 }
46 
48 {
49  auto layer = CloneBase<QuantizedLstmLayer>(graph, GetName());
50 
53  layer->m_QuantizedLstmParameters.m_InputToForgetWeights = m_QuantizedLstmParameters.m_InputToForgetWeights ?
55  layer->m_QuantizedLstmParameters.m_InputToCellWeights = m_QuantizedLstmParameters.m_InputToCellWeights ?
57  layer->m_QuantizedLstmParameters.m_InputToOutputWeights = m_QuantizedLstmParameters.m_InputToOutputWeights ?
59 
60  layer->m_QuantizedLstmParameters.m_RecurrentToInputWeights = m_QuantizedLstmParameters.m_RecurrentToInputWeights ?
62  layer->m_QuantizedLstmParameters.m_RecurrentToForgetWeights = m_QuantizedLstmParameters.m_RecurrentToForgetWeights
64  layer->m_QuantizedLstmParameters.m_RecurrentToCellWeights = m_QuantizedLstmParameters.m_RecurrentToCellWeights ?
66  layer->m_QuantizedLstmParameters.m_RecurrentToOutputWeights = m_QuantizedLstmParameters.m_RecurrentToOutputWeights
68 
69  layer->m_QuantizedLstmParameters.m_InputGateBias = m_QuantizedLstmParameters.m_InputGateBias ?
71  layer->m_QuantizedLstmParameters.m_ForgetGateBias = m_QuantizedLstmParameters.m_ForgetGateBias ?
73  layer->m_QuantizedLstmParameters.m_CellBias = m_QuantizedLstmParameters.m_CellBias ?
75  layer->m_QuantizedLstmParameters.m_OutputGateBias = m_QuantizedLstmParameters.m_OutputGateBias ?
77 
78  return std::move(layer);
79 }
80 
81 std::vector<TensorShape> QuantizedLstmLayer::InferOutputShapes(const std::vector<TensorShape>& inputShapes) const
82 {
83  ARMNN_ASSERT(inputShapes.size() == 3);
84 
85  // Get input values for validation
86  unsigned int numBatches = inputShapes[0][0];
87  unsigned int outputSize = inputShapes[1][1];
88 
89  std::vector<TensorShape> outShapes;
90  outShapes.push_back(TensorShape({numBatches, outputSize})); // cellStateOut
91  outShapes.push_back(TensorShape({numBatches, outputSize})); // output
92 
93  return outShapes;
94 }
95 
97 {
99 
100  const TensorShape& outputShape = GetOutputSlot(0).GetTensorInfo().GetShape();
101 
103 
104  auto inferredShapes = InferOutputShapes(
105  {
107  GetInputSlot(1).GetConnection()->GetTensorInfo().GetShape(), // previousCellStateIn
108  GetInputSlot(2).GetConnection()->GetTensorInfo().GetShape() // previousOutputIn
109  });
110 
111  ARMNN_ASSERT(inferredShapes.size() == 2);
112 
113  // Check weights and bias for nullptr
115  "QuantizedLstmLayer: m_QuantizedLstmParameters.m_InputToInputWeights should not be null.");
117  "QuantizedLstmLayer: m_QuantizedLstmParameters.m_InputToForgetWeights should not be null.");
119  "QuantizedLstmLayer: m_QuantizedLstmParameters.m_InputToCellWeights should not be null.");
121  "QuantizedLstmLayer: m_QuantizedLstmParameters.m_InputToOutputWeights should not be null.");
122 
124  "QuantizedLstmLayer: m_QuantizedLstmParameters.m_RecurrentToInputWeights should not be null.");
126  "QuantizedLstmLayer: m_QuantizedLstmParameters.m_RecurrentToForgetWeights should not be null.");
128  "QuantizedLstmLayer: m_QuantizedLstmParameters.m_RecurrentToCellWeights should not be null.");
130  "QuantizedLstmLayer: m_QuantizedLstmParameters.m_RecurrentToOutputWeights should not be null.");
131 
133  "QuantizedLstmLayer: m_QuantizedLstmParameters.m_InputGateBias should not be null.");
135  "QuantizedLstmLayer: m_QuantizedLstmParameters.m_ForgetGateBias should not be null.");
137  "QuantizedLstmLayer: m_QuantizedLstmParameters.m_CellBias should not be null.");
139  "QuantizedLstmLayer: m_QuantizedLstmParameters.m_OutputGateBias should not be null.");
140 
141  // Check output TensorShape(s) match inferred shape
142  ValidateAndCopyShape(outputShape, inferredShapes[0], m_ShapeInferenceMethod, "QuantizedLstmLayer");
143 
145  inferredShapes[1],
147  "QuantizedLstmLayer",
148  1);
149 }
150 
152 {
153  // For API stability DO NOT ALTER order and add new members to the end of vector
154  return
155  {
160 
165 
170  };
171 }
172 
174 void QuantizedLstmLayer::Accept(ILayerVisitor& visitor) const
175 {
176  QuantizedLstmInputParams inputParams;
177 
182 
187 
192 
193  // InputToX weight tensors
194  ConstTensor inputToInputWeightsTensor;
196  {
197  ConstTensor inputToInputWeightsTensorCopy(managedInputToInputWeights.GetTensorInfo(),
198  managedInputToInputWeights.Map());
199  inputToInputWeightsTensor = inputToInputWeightsTensorCopy;
200  inputParams.m_InputToInputWeights = &inputToInputWeightsTensor;
201  }
202 
203  ConstTensor inputToForgetWeightsTensor;
205  {
206  ConstTensor inputToForgetWeightsTensorCopy(managedInputToForgetWeights.GetTensorInfo(),
207  managedInputToForgetWeights.Map());
208  inputToForgetWeightsTensor = inputToForgetWeightsTensorCopy;
209  inputParams.m_InputToForgetWeights = &inputToForgetWeightsTensor;
210  }
211 
212  ConstTensor inputToCellWeightsTensor;
214  {
215  ConstTensor inputToCellWeightsTensorCopy(managedInputToCellWeights.GetTensorInfo(),
216  managedInputToCellWeights.Map());
217  inputToCellWeightsTensor = inputToCellWeightsTensorCopy;
218  inputParams.m_InputToCellWeights = &inputToCellWeightsTensor;
219  }
220 
221  ConstTensor inputToOutputWeightsTensor;
223  {
224  ConstTensor inputToOutputWeightsTensorCopy(managedInputToOutputWeights.GetTensorInfo(),
225  managedInputToOutputWeights.Map());
226  inputToOutputWeightsTensor = inputToOutputWeightsTensorCopy;
227  inputParams.m_InputToOutputWeights = &inputToOutputWeightsTensor;
228  }
229 
230  // RecurrentToX weight tensors
231  ConstTensor recurrentToInputWeightsTensor;
233  {
234  ConstTensor recurrentToInputWeightsTensorCopy(
235  managedRecurrentToInputWeights.GetTensorInfo(),
236  managedRecurrentToInputWeights.Map());
237  recurrentToInputWeightsTensor = recurrentToInputWeightsTensorCopy;
238  inputParams.m_RecurrentToInputWeights = &recurrentToInputWeightsTensor;
239  }
240 
241  ConstTensor recurrentToForgetWeightsTensor;
243  {
244  ConstTensor recurrentToForgetWeightsTensorCopy(
245  managedRecurrentToForgetWeights.GetTensorInfo(),
246  managedRecurrentToForgetWeights.Map());
247  recurrentToForgetWeightsTensor = recurrentToForgetWeightsTensorCopy;
248  inputParams.m_RecurrentToForgetWeights = &recurrentToForgetWeightsTensor;
249  }
250 
251  ConstTensor recurrentToCellWeightsTensor;
253  {
254  ConstTensor recurrentToCellWeightsTensorCopy(
255  managedRecurrentToCellWeights.GetTensorInfo(),
256  managedRecurrentToCellWeights.Map());
257  recurrentToCellWeightsTensor = recurrentToCellWeightsTensorCopy;
258  inputParams.m_RecurrentToCellWeights = &recurrentToCellWeightsTensor;
259  }
260 
261  ConstTensor recurrentToOutputWeightsTensor;
263  {
264  ConstTensor recurrentToOutputWeightsTensorCopy(
265  managedRecurrentToOutputWeights.GetTensorInfo(),
266  managedRecurrentToOutputWeights.Map());
267  recurrentToOutputWeightsTensor = recurrentToOutputWeightsTensorCopy;
268  inputParams.m_RecurrentToOutputWeights = &recurrentToOutputWeightsTensor;
269  }
270 
271  // Bias tensors
272  ConstTensor inputGateBiasTensor;
274  {
275  ConstTensor inputGateBiasTensorCopy(managedInputGateBias.GetTensorInfo(),
276  managedInputGateBias.Map());
277  inputGateBiasTensor = inputGateBiasTensorCopy;
278  inputParams.m_InputGateBias = &inputGateBiasTensor;
279  }
280 
281  ConstTensor forgetGateBiasTensor;
283  {
284  ConstTensor forgetGateBiasTensorCopy(managedForgetGateBias.GetTensorInfo(),
285  managedForgetGateBias.Map());
286  forgetGateBiasTensor = forgetGateBiasTensorCopy;
287  inputParams.m_ForgetGateBias = &forgetGateBiasTensor;
288  }
289 
290  ConstTensor cellBiasTensor;
291  if (m_QuantizedLstmParameters.m_CellBias != nullptr)
292  {
293  ConstTensor cellBiasTensorCopy(managedCellBias.GetTensorInfo(),
294  managedCellBias.Map());
295  cellBiasTensor = cellBiasTensorCopy;
296  inputParams.m_CellBias = &cellBiasTensor;
297  }
298 
299  ConstTensor outputGateBiasTensor;
301  {
302  ConstTensor outputGateBiasCopy(managedOutputGateBias.GetTensorInfo(),
303  managedOutputGateBias.Map());
304  outputGateBiasTensor = outputGateBiasCopy;
305  inputParams.m_OutputGateBias = &outputGateBiasTensor;
306  }
307 
308  visitor.VisitQuantizedLstmLayer(this, inputParams, GetName());
309 }
311 
313 {
314  std::vector<ConstTensor> constTensors;
315 
320 
325 
330 
331  // InputToX weight tensors
333  {
334  constTensors.emplace_back(ConstTensor(managedInputToInputWeights.GetTensorInfo(),
335  managedInputToInputWeights.Map()));
336  }
337 
339  {
340  constTensors.emplace_back(ConstTensor(managedInputToForgetWeights.GetTensorInfo(),
341  managedInputToForgetWeights.Map()));
342  }
343 
345  {
346  constTensors.emplace_back(ConstTensor(managedInputToCellWeights.GetTensorInfo(),
347  managedInputToCellWeights.Map()));
348  }
349 
351  {
352  constTensors.emplace_back(ConstTensor(managedInputToOutputWeights.GetTensorInfo(),
353  managedInputToOutputWeights.Map()));
354  }
355 
356  // RecurrentToX weight tensors
358  {
359  constTensors.emplace_back(ConstTensor(
360  managedRecurrentToInputWeights.GetTensorInfo(),
361  managedRecurrentToInputWeights.Map()));
362  }
363 
365  {
366  constTensors.emplace_back(ConstTensor(
367  managedRecurrentToForgetWeights.GetTensorInfo(),
368  managedRecurrentToForgetWeights.Map()));
369  }
370 
372  {
373  constTensors.emplace_back(ConstTensor(
374  managedRecurrentToCellWeights.GetTensorInfo(),
375  managedRecurrentToCellWeights.Map()));
376  }
377 
379  {
380  constTensors.emplace_back(ConstTensor(
381  managedRecurrentToOutputWeights.GetTensorInfo(),
382  managedRecurrentToOutputWeights.Map()));
383  }
384 
385  // Bias tensors
387  {
388  constTensors.emplace_back(ConstTensor(managedInputGateBias.GetTensorInfo(),
389  managedInputGateBias.Map()));
390  }
391 
393  {
394  constTensors.emplace_back(ConstTensor(managedForgetGateBias.GetTensorInfo(),
395  managedForgetGateBias.Map()));
396  }
397 
398  if (m_QuantizedLstmParameters.m_CellBias != nullptr)
399  {
400  constTensors.emplace_back(ConstTensor(managedCellBias.GetTensorInfo(),
401  managedCellBias.Map()));
402  }
403 
405  {
406  constTensors.emplace_back(ConstTensor(managedOutputGateBias.GetTensorInfo(),
407  managedOutputGateBias.Map()));
408  }
409 
410 
411  strategy.ExecuteStrategy(this, BaseDescriptor(), constTensors, GetName());
412 }
413 
414 } // namespace armnn
Layer::ConstantTensors GetConstantTensorsByRef() override
Retrieve the handles to the constant values stored by the layer.
std::shared_ptr< ConstTensorHandle > m_ForgetGateBias
A shared pointer to represent 1D bias tensor with dimensions [outputSize] (int32).
QuantizedLstmParameters m_QuantizedLstmParameters
const TensorShape & GetShape() const
Definition: Tensor.hpp:191
const ConstTensor * m_RecurrentToOutputWeights
std::shared_ptr< ConstTensorHandle > m_InputToForgetWeights
A shared pointer to represent 2D weights tensor with dimensions [outputSize, inputSize] (QAsymm8)...
#define ARMNN_NO_DEPRECATE_WARN_BEGIN
Definition: Deprecated.hpp:33
const ConstTensor * m_RecurrentToForgetWeights
std::shared_ptr< ConstTensorHandle > m_InputGateBias
A shared pointer to represent 1D bias tensor with dimensions [outputSize] (int32).
QuantizedLstmLayer * Clone(Graph &graph) const override
Creates a dynamically-allocated copy of this layer.
virtual void ExecuteStrategy(const armnn::IConnectableLayer *layer, const armnn::BaseDescriptor &descriptor, const std::vector< armnn::ConstTensor > &constants, const char *name, const armnn::LayerBindingId id=0)=0
const ConstTensorHandle * m_InputGateBias
void VerifyShapeInferenceType(const TensorShape &outputShape, ShapeInferenceMethod shapeInferenceMethod)
Definition: Layer.cpp:436
void ValidateTensorShapesFromInputs() override
Check if the input tensor shape(s) will lead to a valid configuration of QuantizedLstmLayer.
const TensorInfo & GetTensorInfo() const
Copyright (c) 2021 ARM Limited and Contributors.
std::shared_ptr< ConstTensorHandle > m_InputToOutputWeights
A shared pointer to represent 2D weights tensor with dimensions [outputSize, inputSize] (QAsymm8)...
const IOutputSlot * GetConnection() const override
Definition: Layer.hpp:204
const ConstTensorHandle * m_RecurrentToInputWeights
QuantizedLstmLayer(const char *name)
Constructor to create a QuantizedLstmLayer.
std::shared_ptr< ConstTensorHandle > m_CellBias
A shared pointer to represent 1D bias tensor with dimensions [outputSize] (int32).
void ValidateAndCopyShape(const TensorShape &outputShape, const TensorShape &inferredShape, const ShapeInferenceMethod shapeInferenceMethod, const std::string &layerName, const unsigned int outputSlotIndex=0)
Definition: Layer.cpp:396
std::shared_ptr< ConstTensorHandle > m_RecurrentToOutputWeights
A shared pointer to represent 2D weights tensor with dimensions [outputSize, outputSize] (QAsymm8)...
std::shared_ptr< ConstTensorHandle > m_RecurrentToInputWeights
A shared pointer to represent 2D weights tensor with dimensions [outputSize, outputSize] (QAsymm8)...
Base class for all descriptors.
Definition: Descriptors.hpp:22
void VerifyLayerConnections(unsigned int expectedConnections, const CheckLocation &location) const
Definition: Layer.cpp:352
std::shared_ptr< ConstTensorHandle > m_InputToCellWeights
A shared pointer to represent 2D weights tensor with dimensions [outputSize, inputSize] (QAsymm8)...
const InputSlot & GetInputSlot(unsigned int index) const override
Get a const input slot handle by slot index.
Definition: Layer.hpp:321
const ConstTensorHandle * m_InputToForgetWeights
std::vector< std::reference_wrapper< std::shared_ptr< ConstTensorHandle > >> ConstantTensors
Definition: INetwork.hpp:124
#define ARMNN_NO_DEPRECATE_WARN_END
Definition: Deprecated.hpp:34
#define ARMNN_ASSERT_MSG(COND, MSG)
Definition: Assert.hpp:15
This layer represents a QuantizedLstm operation.
WorkloadInfo PrepInfoAndDesc(QueueDescriptor &descriptor) const
Helper function to reduce duplication in *LayerCreateWorkload.
Definition: Layer.hpp:388
const ConstTensor * m_InputToForgetWeights
const ConstTensorHandle * m_RecurrentToCellWeights
A tensor defined by a TensorInfo (shape and data type) and an immutable backing store.
Definition: Tensor.hpp:327
const ConstTensorHandle * m_ForgetGateBias
#define ARMNN_ASSERT(COND)
Definition: Assert.hpp:14
const ConstTensorHandle * m_RecurrentToOutputWeights
virtual std::unique_ptr< IWorkload > CreateWorkload(const IWorkloadFactory &factory) const override
Makes a workload for the QuantizedLstm type.
const ConstTensorHandle * m_OutputGateBias
#define CHECK_LOCATION()
Definition: Exceptions.hpp:209
const ConstTensorHandle * m_RecurrentToForgetWeights
const ConstTensor * m_RecurrentToInputWeights
std::shared_ptr< ConstTensorHandle > m_OutputGateBias
A shared pointer to represent 1D bias tensor with dimensions [outputSize] (int32).
void SetAdditionalInfo(QueueDescriptor &descriptor) const
Definition: Layer.cpp:248
std::shared_ptr< ConstTensorHandle > m_RecurrentToCellWeights
A shared pointer to represent 2D weights tensor with dimensions [outputSize, outputSize] (QAsymm8)...
ARMNN_NO_DEPRECATE_WARN_BEGIN void Accept(ILayerVisitor &visitor) const override
const ConstTensorHandle * m_InputToOutputWeights
const ConstTensorHandle * m_InputToInputWeights
const ConstTensorHandle * m_CellBias
const ConstTensor * m_RecurrentToCellWeights
const ConstTensor * m_InputToOutputWeights
const OutputSlot & GetOutputSlot(unsigned int index=0) const override
Get the const output slot handle by slot index.
Definition: Layer.hpp:323
virtual const TensorInfo & GetTensorInfo() const =0
const char * GetName() const override
Returns the name of the layer.
Definition: Layer.hpp:316
const void * Map(bool blocking=true)
RAII-managed resource: unmaps the MemoryArea once out of scope.
const TensorInfo & GetTensorInfo(const ITensorHandle *tensorHandle)
float32 helpers
std::shared_ptr< ConstTensorHandle > m_RecurrentToForgetWeights
A shared pointer to represent 2D weights tensor with dimensions [outputSize, outputSize] (QAsymm8)...
const ConstTensorHandle * m_InputToCellWeights
virtual std::unique_ptr< IWorkload > CreateWorkload(LayerType type, const QueueDescriptor &descriptor, const WorkloadInfo &info) const
std::shared_ptr< ConstTensorHandle > m_InputToInputWeights
A shared pointer to represent 2D weights tensor with dimensions [outputSize, inputSize] (QAsymm8)...
const TensorInfo & GetTensorInfo() const override
Definition: Layer.cpp:66
std::vector< TensorShape > InferOutputShapes(const std::vector< TensorShape > &inputShapes) const override
By default returns inputShapes if the number of inputs is equal to the number of outputs; otherwise infers the output shapes from the given input shapes and layer properties.
ARMNN_NO_DEPRECATE_WARN_END void ExecuteStrategy(IStrategy &strategy) const override
Apply a visitor to this layer.
ShapeInferenceMethod m_ShapeInferenceMethod
Definition: Layer.hpp:415
LayerType
When adding a new layer, also adapt the LastLayer enum value in the enum class LayerType below...
Definition: Types.hpp:458