From e2af6f4322a1e2b8b3c391fb721a6a80c281477f Mon Sep 17 00:00:00 2001
From: Narumol Prangnawarat
Date: Fri, 28 Jan 2022 17:59:18 +0000
Subject: IVGCVSW-6552 Add support of aligned host memory

 * Add AllocatedData functions to OutputHandler
 * Enable import aligned memory in ImportInputs
 * Enable import aligned memory in ImportOutputs
 * Allow to import input and output if the memory is aligned
 * Implement Reconfigure function on ClConvolution2dWorkload
 * End-to-end test on Ref and Cl to ensure that input and output memory
   are imported when aligned

Signed-off-by: Narumol Prangnawarat
Change-Id: I9e5e4c26d1ac2f1d806803ade5f64c6479c51718
---
 src/backends/cl/test/ClCreateWorkloadTests.cpp | 61 ++++++++++++++++++++++++++
 1 file changed, 61 insertions(+)

(limited to 'src/backends/cl/test/ClCreateWorkloadTests.cpp')

Review notes (not part of the original commit):
 * This text was recovered from a web rendering of the patch. Line breaks were
   collapsed and everything written inside angle brackets was lost (e-mail
   addresses, #include targets, template arguments).
 * NOTE(review): the template arguments in the second hunk are restored from
   context (the test's own comments and the way the values are used) - confirm
   them against the upstream file before applying.
 * NOTE(review): the #include targets and the blank lines of the first hunk
   could not be recovered and are left exactly as found, so that hunk will not
   apply as-is.
 * Fix: the second pointer-identity CHECK repeated the input comparison, so the
   output handle was never compared with outputImportHandle. It now compares
   the output handles.

diff --git a/src/backends/cl/test/ClCreateWorkloadTests.cpp b/src/backends/cl/test/ClCreateWorkloadTests.cpp
index d8b2d4f786..4a28205ade 100644
--- a/src/backends/cl/test/ClCreateWorkloadTests.cpp
+++ b/src/backends/cl/test/ClCreateWorkloadTests.cpp
@@ -11,11 +11,14 @@
 #include
 #include
 #include
+#include
 #include
 #include
 #include
+#include
+#include
 #include
 #include
 #include
@@ -355,6 +358,64 @@ TEST_CASE_FIXTURE(ClContextControlFixture, "CreateConvolution2dFastMathEnabledWo
     ARMNN_ASSERT(conv2dWorkload->GetConvolutionMethod() == arm_compute::ConvolutionMethod::WINOGRAD);
 }
 
+TEST_CASE_FIXTURE(ClContextControlFixture, "ClReplaceInputOutputConvolution2dWorkload")
+{
+    // Create a Convolution2dWorkload whose input and output are ClTensorHandle,
+    // then replace both with ClImportTensorHandle and check the workload picks them up.
+    Graph graph;
+    ClWorkloadFactory factory =
+        ClWorkloadFactoryHelper::GetFactory(ClWorkloadFactoryHelper::GetMemoryManager());
+
+    auto workload =
+        CreateConvolution2dWorkloadTest<ClConvolution2dWorkload, DataType::Float32>(factory,
+                                                                                    graph,
+                                                                                    DataLayout::NHWC);
+
+    TensorShape inputShape  = std::initializer_list<unsigned int>({2, 8, 16, 3});
+    TensorShape outputShape = std::initializer_list<unsigned int>({2, 2, 10, 2});
+
+    // Checks that outputs and inputs are as we expect them (see definition of CreateConvolution2dWorkloadTest).
+    Convolution2dQueueDescriptor queueDescriptor = workload->GetData();
+    auto inputHandle  = PolymorphicDowncast<ITensorHandle*>(queueDescriptor.m_Inputs[0]);
+    auto outputHandle = PolymorphicDowncast<ITensorHandle*>(queueDescriptor.m_Outputs[0]);
+    CHECK((inputHandle->GetShape() == inputShape));
+    CHECK((outputHandle->GetShape() == outputShape));
+    // Before the replacement both handles are plain ClTensorHandle instances
+    CHECK((dynamic_cast<ClTensorHandle*>(inputHandle) != nullptr));
+    CHECK((dynamic_cast<ClTensorHandle*>(outputHandle) != nullptr));
+
+    // Replace with ImportTensorHandle
+    ClImportTensorHandleFactory importFactory(static_cast<MemorySourceFlags>(MemorySource::Malloc),
+                                              static_cast<MemorySourceFlags>(MemorySource::Malloc));
+
+    TensorInfo inputInfo({ 2, 8, 16, 3 }, DataType::Float32);
+    TensorInfo outputInfo({ 2, 2, 10, 2 }, DataType::Float32);
+
+    // Create the tensor handles used for memory import (same shapes as the originals)
+    auto inputImportHandle = importFactory.CreateTensorHandle(inputInfo);
+    auto outputImportHandle = importFactory.CreateTensorHandle(outputInfo);
+
+    // Calling ReplaceInputTensorHandle and ReplaceOutputTensorHandle does not throw exception
+    // as Reconfigure function is implemented
+    workload->ReplaceInputTensorHandle(inputImportHandle.get(), 0);
+    workload->ReplaceOutputTensorHandle(outputImportHandle.get(), 0);
+
+    // The descriptor must now expose the import handles: same shapes, same pointers, import type
+    queueDescriptor = workload->GetData();
+    auto replacedInputHandle  = PolymorphicDowncast<ITensorHandle*>(queueDescriptor.m_Inputs[0]);
+    auto replacedOutputHandle = PolymorphicDowncast<ITensorHandle*>(queueDescriptor.m_Outputs[0]);
+    CHECK((replacedInputHandle->GetShape() == inputShape));
+    CHECK((replacedOutputHandle->GetShape() == outputShape));
+
+    CHECK((inputImportHandle.get() == replacedInputHandle));
+    CHECK((outputImportHandle.get() == replacedOutputHandle));
+
+    CHECK((dynamic_cast<ClTensorHandle*>(replacedInputHandle) == nullptr));
+    CHECK((dynamic_cast<ClImportTensorHandle*>(replacedInputHandle) != nullptr));
+    CHECK((dynamic_cast<ClTensorHandle*>(replacedOutputHandle) == nullptr));
+    CHECK((dynamic_cast<ClImportTensorHandle*>(replacedOutputHandle) != nullptr));
+}
+
 TEST_CASE_FIXTURE(ClContextControlFixture, "CreateConvolution2dClCompiledContextWorkload")
 {
     using namespace armnn;
-- 
cgit v1.2.1