aboutsummaryrefslogtreecommitdiff
path: root/src/backends/cl/workloads/ClLstmFloatWorkload.cpp
diff options
context:
space:
mode:
author: Matteo Martincigh <matteo.martincigh@arm.com> 2018-11-14 12:39:55 +0000
committer: Matteo Martincigh <matteo.martincigh@arm.com> 2018-11-16 09:05:24 +0000
commit: a65b7aeafc0ef6acf40e4a8a6d36206bf53d717c (patch)
tree: d62257a911f3a4a4ed99243d4860a2453e95ec98 /src/backends/cl/workloads/ClLstmFloatWorkload.cpp
parent: 74ba3dc7113e51cf11ab772ee1eb030c07a7dda5 (diff)
download: armnn-a65b7aeafc0ef6acf40e4a8a6d36206bf53d717c.tar.gz
IVGCVSW-2092 Port LSTMCell::Eval to ArmNN
* Ported Google's LSTM implementation to RefLstmFloat32Workload
* Fixed the code throughout because of an error in the docs around the scratch buffer size
* Updated IsLstmSupported
* Added the unit tests

!android-nn-driver:127

Change-Id: I5577b7e39ca52df1a7f102a9b437df6aa99520b6
Diffstat (limited to 'src/backends/cl/workloads/ClLstmFloatWorkload.cpp')
-rw-r--r-- src/backends/cl/workloads/ClLstmFloatWorkload.cpp 8
1 files changed, 4 insertions, 4 deletions
diff --git a/src/backends/cl/workloads/ClLstmFloatWorkload.cpp b/src/backends/cl/workloads/ClLstmFloatWorkload.cpp
index 2a664454e1..f4d8974226 100644
--- a/src/backends/cl/workloads/ClLstmFloatWorkload.cpp
+++ b/src/backends/cl/workloads/ClLstmFloatWorkload.cpp
@@ -116,14 +116,14 @@ ClLstmFloatWorkload::ClLstmFloatWorkload(const LstmQueueDescriptor &descriptor,
m_ScratchBuffer = std::make_unique<arm_compute::CLTensor>();
if (m_Data.m_Parameters.m_CifgEnabled)
{
- // 2D tensor with dimensions [num_units * 4, batch_size] with CIFG
- armnn::TensorInfo scratchBuffer1({ batch_size, num_units * 4 }, DataType::Float32);
+ // 2D tensor with dimensions [num_units * 3, batch_size] with CIFG
+ armnn::TensorInfo scratchBuffer1({ batch_size, num_units * 3 }, DataType::Float32);
BuildArmComputeTensor(*m_ScratchBuffer, scratchBuffer1);
}
else
{
- // scratch_buffer [num_units * 3, batch_size] without CIFG
- armnn::TensorInfo scratchBuffer2({ batch_size, num_units * 3 }, DataType::Float32);
+ // scratch_buffer [num_units * 4, batch_size] without CIFG
+ armnn::TensorInfo scratchBuffer2({ batch_size, num_units * 4 }, DataType::Float32);
BuildArmComputeTensor(*m_ScratchBuffer, scratchBuffer2);
}