From 60ab9765329b1449b509b32b07f0b0abb3b532f2 Mon Sep 17 00:00:00 2001
From: Nikhil Raj
Date: Thu, 13 Jan 2022 09:34:44 +0000
Subject: IVGCVSW-6673 Implement CanBeImported function to ClTensorHandle

* Added Unittests

Signed-off-by: Nikhil Raj
Signed-off-by: David Monahan
Change-Id: If7c0add39583a7e47b43fd79f93c620f86f80fc1
---
 src/backends/cl/ClImportTensorHandle.hpp | 61 +++++++++++++++++++++++++++++++-
 1 file changed, 60 insertions(+), 1 deletion(-)

(limited to 'src/backends/cl/ClImportTensorHandle.hpp')

diff --git a/src/backends/cl/ClImportTensorHandle.hpp b/src/backends/cl/ClImportTensorHandle.hpp
index a24ab5656e..18cd1ffeb4 100644
--- a/src/backends/cl/ClImportTensorHandle.hpp
+++ b/src/backends/cl/ClImportTensorHandle.hpp
@@ -192,12 +192,71 @@ public:
         }
     }

+    virtual bool CanBeImported(void* memory, MemorySource source) override
+    {
+        if (m_ImportFlags & static_cast<FlagsType>(source))
+        {
+            if (source == MemorySource::Malloc)
+            {
+                const cl_import_properties_arm importProperties[] =
+                {
+                    CL_IMPORT_TYPE_ARM,
+                    CL_IMPORT_TYPE_HOST_ARM,
+                    0
+                };
+
+                size_t totalBytes = m_Tensor.info()->total_size();
+
+                // Round the size of the mapping to match the CL_DEVICE_GLOBAL_MEM_CACHELINE_SIZE
+                // This does not change the size of the buffer, only the size of the mapping the buffer is mapped to
+                // We do this to match the behaviour of the Import function later on.
+                auto cachelineAlignment =
+                        arm_compute::CLKernelLibrary::get().get_device().getInfo<CL_DEVICE_GLOBAL_MEM_CACHELINE_SIZE>();
+                auto roundedSize = cachelineAlignment + totalBytes - (totalBytes % cachelineAlignment);
+
+                cl_int error = CL_SUCCESS;
+                cl_mem buffer;
+                buffer = clImportMemoryARM(arm_compute::CLKernelLibrary::get().context().get(),
+                                           CL_MEM_READ_WRITE, importProperties, memory, roundedSize, &error);
+
+                // If we fail to map we know the import will not succeed and can return false.
+                // There is no memory to be released if error is not CL_SUCCESS
+                if (error != CL_SUCCESS)
+                {
+                    return false;
+                }
+                else
+                {
+                    // If import was successful we can release the mapping knowing import will succeed at workload
+                    // execution and return true
+                    error = clReleaseMemObject(buffer);
+                    if (error == CL_SUCCESS)
+                    {
+                        return true;
+                    }
+                    else
+                    {
+                        // If we couldn't release the mapping this constitutes a memory leak and throw an exception
+                        throw MemoryImportException("ClImportTensorHandle::Failed to unmap cl_mem buffer: "
+                                                    + std::to_string(error));
+                    }
+                }
+            }
+        }
+        else
+        {
+            throw MemoryImportException("ClImportTensorHandle::Incorrect import flag");
+        }
+        return false;
+    }
+
 private:
     bool ClImport(const cl_import_properties_arm* importProperties, void* memory, bool isProtected = false)
     {
         size_t totalBytes = m_Tensor.info()->total_size();

-        // Round the size of the buffer to a multiple of the CL_DEVICE_GLOBAL_MEM_CACHELINE_SIZE
+        // Round the size of the mapping to match the CL_DEVICE_GLOBAL_MEM_CACHELINE_SIZE
+        // This does not change the size of the buffer, only the size of the mapping the buffer is mapped to
         auto cachelineAlignment =
                 arm_compute::CLKernelLibrary::get().get_device().getInfo<CL_DEVICE_GLOBAL_MEM_CACHELINE_SIZE>();
         auto roundedSize = cachelineAlignment + totalBytes - (totalBytes % cachelineAlignment);
--
cgit v1.2.1