From b8181f72b8c7c9132373dbcf7f8709ec2c0f23c0 Mon Sep 17 00:00:00 2001 From: Finn Williams Date: Wed, 7 Apr 2021 10:23:21 +0100 Subject: IVGCVSW-5787 Add/Update Execute() implementations in RefActivationWorkload * Added multithreaded StridedSliceEndToEndTest Signed-off-by: Finn Williams Change-Id: I4579db7b5959e0a22256f1bda00238c22e611dec --- .../reference/workloads/RefLstmWorkload.cpp | 46 +++++++++++++--------- 1 file changed, 28 insertions(+), 18 deletions(-) (limited to 'src/backends/reference/workloads/RefLstmWorkload.cpp') diff --git a/src/backends/reference/workloads/RefLstmWorkload.cpp b/src/backends/reference/workloads/RefLstmWorkload.cpp index 7c37301d1d..09423547da 100644 --- a/src/backends/reference/workloads/RefLstmWorkload.cpp +++ b/src/backends/reference/workloads/RefLstmWorkload.cpp @@ -39,26 +39,36 @@ RefLstmWorkload::RefLstmWorkload(const LstmQueueDescriptor &descriptor, const Wo {} void RefLstmWorkload::Execute() const +{ + Execute(m_Data.m_Inputs, m_Data.m_Outputs); +} + +void RefLstmWorkload::ExecuteAsync(WorkingMemDescriptor &workingMemDescriptor) +{ + Execute(workingMemDescriptor.m_Inputs, workingMemDescriptor.m_Outputs); +} + +void RefLstmWorkload::Execute(std::vector<ITensorHandle*> inputs, std::vector<ITensorHandle*> outputs) const { // This is a porting of the LSTM::Eval() method in the Android code base // Refer to: android/frameworks/ml/nn/common/operations/LSTM.cpp - const TensorInfo& inputInfo = GetTensorInfo(m_Data.m_Inputs[0]); - const TensorInfo& outputInfo = GetTensorInfo(m_Data.m_Outputs[0]); + const TensorInfo& inputInfo = GetTensorInfo(inputs[0]); + const TensorInfo& outputInfo = GetTensorInfo(outputs[0]); const TensorShape& inputShape = inputInfo.GetShape(); const DataType& outputType = outputInfo.GetDataType(); - std::unique_ptr<Encoder<float>> outputStateOut = MakeEncoder<float>(outputInfo, m_Data.m_Outputs[1]->Map()); - std::unique_ptr<Encoder<float>> cellStateOut = MakeEncoder<float>(outputInfo, m_Data.m_Outputs[2]->Map()); - std::unique_ptr<Encoder<float>> output = MakeEncoder<float>(outputInfo, 
m_Data.m_Outputs[3]->Map()); + std::unique_ptr<Encoder<float>> outputStateOut = MakeEncoder<float>(outputInfo, outputs[1]->Map()); + std::unique_ptr<Encoder<float>> cellStateOut = MakeEncoder<float>(outputInfo, outputs[2]->Map()); + std::unique_ptr<Encoder<float>> output = MakeEncoder<float>(outputInfo, outputs[3]->Map()); - std::unique_ptr<Decoder<float>> cellStateOutDecoder = MakeDecoder<float>(outputInfo, m_Data.m_Outputs[2]->Map()); - std::unique_ptr<Decoder<float>> outputDecoder = MakeDecoder<float>(outputInfo, m_Data.m_Outputs[3]->Map()); + std::unique_ptr<Decoder<float>> cellStateOutDecoder = MakeDecoder<float>(outputInfo, outputs[2]->Map()); + std::unique_ptr<Decoder<float>> outputDecoder = MakeDecoder<float>(outputInfo, outputs[3]->Map()); - std::unique_ptr<Decoder<float>> inputData = MakeDecoder<float>(inputInfo, m_Data.m_Inputs[0]->Map()); - std::unique_ptr<Decoder<float>> outputStateIn = MakeDecoder<float>(inputInfo, m_Data.m_Inputs[1]->Map()); - std::unique_ptr<Decoder<float>> cellStateIn = MakeDecoder<float>(inputInfo, m_Data.m_Inputs[2]->Map()); + std::unique_ptr<Decoder<float>> inputData = MakeDecoder<float>(inputInfo, inputs[0]->Map()); + std::unique_ptr<Decoder<float>> outputStateIn = MakeDecoder<float>(inputInfo, inputs[1]->Map()); + std::unique_ptr<Decoder<float>> cellStateIn = MakeDecoder<float>(inputInfo, inputs[2]->Map()); const uint32_t nBatch = inputShape[0]; const uint32_t nInput = inputShape[1]; @@ -71,19 +81,19 @@ void RefLstmWorkload::Execute() const const bool useLayerNorm = m_Data.m_Parameters.m_LayerNormEnabled; // Index the scratch buffers pointers to the global scratch buffer. 
- std::unique_ptr<Encoder<float>> inputGateScratch = MakeEncoder<float>(outputInfo, m_Data.m_Outputs[0]->Map()); - std::unique_ptr<Encoder<float>> cellScratch = MakeEncoder<float>(outputInfo, m_Data.m_Outputs[0]->Map()); - std::unique_ptr<Encoder<float>> forgetGateScratch = MakeEncoder<float>(outputInfo, m_Data.m_Outputs[0]->Map()); - std::unique_ptr<Encoder<float>> outputGateScratch = MakeEncoder<float>(outputInfo, m_Data.m_Outputs[0]->Map()); + std::unique_ptr<Encoder<float>> inputGateScratch = MakeEncoder<float>(outputInfo, outputs[0]->Map()); + std::unique_ptr<Encoder<float>> cellScratch = MakeEncoder<float>(outputInfo, outputs[0]->Map()); + std::unique_ptr<Encoder<float>> forgetGateScratch = MakeEncoder<float>(outputInfo, outputs[0]->Map()); + std::unique_ptr<Encoder<float>> outputGateScratch = MakeEncoder<float>(outputInfo, outputs[0]->Map()); std::unique_ptr<Decoder<float>> inputGateScratchDecoder = - MakeDecoder<float>(outputInfo, m_Data.m_Outputs[0]->Map()); + MakeDecoder<float>(outputInfo, outputs[0]->Map()); std::unique_ptr<Decoder<float>> cellScratchDecoder = - MakeDecoder<float>(outputInfo, m_Data.m_Outputs[0]->Map()); + MakeDecoder<float>(outputInfo, outputs[0]->Map()); std::unique_ptr<Decoder<float>> forgetGateScratchDecoder = - MakeDecoder<float>(outputInfo, m_Data.m_Outputs[0]->Map()); + MakeDecoder<float>(outputInfo, outputs[0]->Map()); std::unique_ptr<Decoder<float>> outputGateScratchDecoder = - MakeDecoder<float>(outputInfo, m_Data.m_Outputs[0]->Map()); + MakeDecoder<float>(outputInfo, outputs[0]->Map()); if (useCifg) { -- cgit v1.2.1