aboutsummaryrefslogtreecommitdiff
path: root/src/runtime/NEON/functions/NEQLSTMLayer.cpp
diff options
context:
space:
mode:
authorSang-Hoon Park <sang-hoon.park@arm.com>2020-09-23 13:24:13 +0100
committerGeorgios Pinitas <georgios.pinitas@arm.com>2020-09-23 18:15:29 +0000
commit840a72cc745c60eccbd26fe192b035ec68b2ee41 (patch)
tree3b5d0cfc222249ffe49373ce0387525075e370ca /src/runtime/NEON/functions/NEQLSTMLayer.cpp
parent1643a45557fde79ee209f55c507860307ffe627c (diff)
downloadComputeLibrary-840a72cc745c60eccbd26fe192b035ec68b2ee41.tar.gz
COMPMID-3773: Fix the accumulation of projection in QLSTM
The "output_state_in" (previous output state) tensor is used for accumulation of projection. The argument for the tensor given to configure() has to be changed to non-const since CLTensor needs to be non-const for map() function call for data copying. Even though NEON-side doesn't need the same change, it has been done for consistency. Change-Id: Ifba0ab6dc8260c468e9f087bf51824daefbab7a3 Signed-off-by: Sang-Hoon Park <sang-hoon.park@arm.com> Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/4018 Tested-by: Arm Jenkins <bsgcomp@arm.com> Reviewed-by: Georgios Pinitas <georgios.pinitas@arm.com>
Diffstat (limited to 'src/runtime/NEON/functions/NEQLSTMLayer.cpp')
-rw-r--r--src/runtime/NEON/functions/NEQLSTMLayer.cpp8
1 files changed, 4 insertions, 4 deletions
diff --git a/src/runtime/NEON/functions/NEQLSTMLayer.cpp b/src/runtime/NEON/functions/NEQLSTMLayer.cpp
index cb45b647c7..5a6b51337a 100644
--- a/src/runtime/NEON/functions/NEQLSTMLayer.cpp
+++ b/src/runtime/NEON/functions/NEQLSTMLayer.cpp
@@ -105,7 +105,7 @@ void NEQLSTMLayer::configure(const ITensor *input,
const ITensor *input_to_forget_weights, const ITensor *input_to_cell_weights, const ITensor *input_to_output_weights,
const ITensor *recurrent_to_forget_weights, const ITensor *recurrent_to_cell_weights, const ITensor *recurrent_to_output_weights,
const ITensor *forget_gate_bias, const ITensor *cell_bias, const ITensor *output_gate_bias,
- const ITensor *cell_state_in, const ITensor *output_state_in,
+ const ITensor *cell_state_in, ITensor *output_state_in,
ITensor *cell_state_out, ITensor *output_state_out, ITensor *output,
const LSTMParams<ITensor> &lstm_params)
{
@@ -477,9 +477,9 @@ void NEQLSTMLayer::configure(const ITensor *input,
if(_projection_tensor_copy_required)
{
_hidden_gate.allocator()->allocate();
- _projection_accumulate_res.allocator()->init(*output_state_out->info());
+ _projection_accumulate_res.allocator()->init(*output_state_in->info());
_projection_accumulate_res.info()->set_tensor_shape(_projection_outstage_res.info()->tensor_shape());
- _projection_output_to_accumulate_copy.configure(*output_state_out, _projection_accumulate_res);
+ _projection_output_to_accumulate_copy.configure(*output_state_in, _projection_accumulate_res);
accumulate_destination = &_projection_accumulate_res;
}
@@ -834,7 +834,7 @@ Status NEQLSTMLayer::validate(const ITensorInfo *input,
if(projection_tensor_copy_required)
{
- ARM_COMPUTE_RETURN_ON_ERROR(NEQLSTMLayer::TensorCopyKernel::validate(*output_state_out, projection_outstage_info));
+ ARM_COMPUTE_RETURN_ON_ERROR(NEQLSTMLayer::TensorCopyKernel::validate(*output_state_in, projection_outstage_info));
}
ARM_COMPUTE_RETURN_ON_ERROR(NEArithmeticAddition::validate(output_state_out, output_state_out, output_state_out, ConvertPolicy::SATURATE));