ArmNN
 21.08
ClCustomAllocatorTests.cpp File Reference
#include <armnn/backends/ICustomAllocator.hpp>
#include <armnn/Descriptors.hpp>
#include <armnn/Exceptions.hpp>
#include <armnn/INetwork.hpp>
#include <armnn/IRuntime.hpp>
#include <armnn/Utils.hpp>
#include <armnn/BackendRegistry.hpp>
#include <cl/ClBackend.hpp>
#include <neon/NeonBackend.hpp>
#include <doctest/doctest.h>
#include <arm_compute/core/CL/CLKernelLibrary.h>
#include <CL/cl_ext.h>
#include <arm_compute/runtime/CL/CLScheduler.h>

Go to the source code of this file.

Functions

armnn::INetworkPtr CreateTestNetwork (armnn::TensorInfo &inputTensorInfo)
 
 TEST_SUITE ("ClCustomAllocatorTests")
 

Function Documentation

◆ CreateTestNetwork()

armnn::INetworkPtr CreateTestNetwork ( armnn::TensorInfo & inputTensorInfo)

Definition at line 63 of file ClCustomAllocatorTests.cpp.

References ARMNN_NO_DEPRECATE_WARN_BEGIN, ARMNN_NO_DEPRECATE_WARN_END, OutputSlot::Connect(), IConnectableLayer::GetInputSlot(), Layer::GetOutputSlot(), and TensorInfo::SetConstant().

Referenced by TEST_SUITE().

64 {
65  using namespace armnn;
66  INetworkPtr myNetwork = INetwork::Create();
67 
68  armnn::FullyConnectedDescriptor fullyConnectedDesc;
69  float weightsData[] = {1.0f}; // Identity
70  TensorInfo weightsInfo(TensorShape({1, 1}), DataType::Float32);
71  weightsInfo.SetConstant(true);
72  armnn::ConstTensor weights(weightsInfo, weightsData);
73 
74  ARMNN_NO_DEPRECATE_WARN_BEGIN
75  IConnectableLayer* fullyConnected = myNetwork->AddFullyConnectedLayer(fullyConnectedDesc,
76  weights,
77  EmptyOptional(),
78  "fully connected");
79  ARMNN_NO_DEPRECATE_WARN_END
80  IConnectableLayer* InputLayer = myNetwork->AddInputLayer(0);
81  IConnectableLayer* OutputLayer = myNetwork->AddOutputLayer(0);
82  InputLayer->GetOutputSlot(0).Connect(fullyConnected->GetInputSlot(0));
83  fullyConnected->GetOutputSlot(0).Connect(OutputLayer->GetInputSlot(0));
84 
85  //Set the tensors in the network.
86 
87  InputLayer->GetOutputSlot(0).SetTensorInfo(inputTensorInfo);
88 
89  TensorInfo outputTensorInfo(TensorShape({1, 1}), DataType::Float32);
90  fullyConnected->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
91 
92  return myNetwork;
93 }
Interface for a layer that is connectable to other layers via InputSlots and OutputSlots.
Definition: INetwork.hpp:61
#define ARMNN_NO_DEPRECATE_WARN_BEGIN
Definition: Deprecated.hpp:33
int Connect(InputSlot &destination)
Definition: Layer.cpp:83
Copyright (c) 2021 ARM Limited and Contributors.
A layer user-provided data can be bound to (e.g. inputs, outputs).
Definition: OutputLayer.hpp:13
#define ARMNN_NO_DEPRECATE_WARN_END
Definition: Deprecated.hpp:34
A FullyConnectedDescriptor for the FullyConnectedLayer.
A tensor defined by a TensorInfo (shape and data type) and an immutable backing store.
Definition: Tensor.hpp:327
EmptyOptional is used to initialize the Optional class in case we want to have default value for an O...
Definition: Optional.hpp:32
A layer user-provided data can be bound to (e.g. inputs, outputs).
Definition: InputLayer.hpp:13
virtual const IInputSlot & GetInputSlot(unsigned int index) const =0
Get a const input slot handle by slot index.
const OutputSlot & GetOutputSlot(unsigned int index=0) const override
Get the const output slot handle by slot index.
Definition: Layer.hpp:318
std::unique_ptr< INetwork, void(*)(INetwork *network)> INetworkPtr
Definition: INetwork.hpp:172
static INetworkPtr Create(NetworkOptions networkOptions={})
Definition: Network.cpp:530

◆ TEST_SUITE()

TEST_SUITE ( "ClCustomAllocatorTests"  )

Definition at line 95 of file ClCustomAllocatorTests.cpp.

References CreateTestNetwork(), and IRuntime::CreationOptions::m_CustomAllocatorMap.

96 {
97 
98 // This is a copy of the SimpleSample app modified to use a custom
99 // allocator for the clbackend. It creates a FullyConnected network with a single layer
100 // taking a single number as an input
101 TEST_CASE("ClCustomAllocatorTest")
102 {
103  using namespace armnn;
104 
105  float number = 3;
106 
107  // Construct ArmNN network
108  armnn::NetworkId networkIdentifier;
109 
110  TensorInfo inputTensorInfo(TensorShape({1, 1}), DataType::Float32);
111 
112  INetworkPtr myNetwork = CreateTestNetwork(inputTensorInfo);
113 
114  // Create ArmNN runtime
115  IRuntime::CreationOptions options; // default options
116  auto customAllocator = std::make_shared<SampleClBackendCustomAllocator>();
117  options.m_CustomAllocatorMap = {{"GpuAcc", std::move(customAllocator)}};
118  IRuntimePtr run = IRuntime::Create(options);
119 
120  // Optimise ArmNN network
121  OptimizerOptions optOptions;
122  optOptions.m_ImportEnabled = true;
123  armnn::IOptimizedNetworkPtr optNet = Optimize(*myNetwork, {"GpuAcc"}, run->GetDeviceSpec(), optOptions);
124  CHECK(optNet);
125 
126  // Load graph into runtime
127  std::string ignoredErrorMessage;
128  INetworkProperties networkProperties(false, MemorySource::Malloc, MemorySource::Malloc);
129  run->LoadNetwork(networkIdentifier, std::move(optNet), ignoredErrorMessage, networkProperties);
130 
131  // Creates structures for input & output
132  unsigned int numElements = inputTensorInfo.GetNumElements();
133  size_t totalBytes = numElements * sizeof(float);
134 
135  const size_t alignment =
136  arm_compute::CLKernelLibrary::get().get_device().getInfo<CL_DEVICE_GLOBAL_MEM_CACHELINE_SIZE>();
137 
138  void* alignedInputPtr = options.m_CustomAllocatorMap["GpuAcc"]->allocate(totalBytes, alignment);
139 
140  // Input with negative values
141  auto* inputPtr = reinterpret_cast<float*>(alignedInputPtr);
142  std::fill_n(inputPtr, numElements, number);
143 
144  void* alignedOutputPtr = options.m_CustomAllocatorMap["GpuAcc"]->allocate(totalBytes, alignment);
145  auto* outputPtr = reinterpret_cast<float*>(alignedOutputPtr);
146  std::fill_n(outputPtr, numElements, -10.0f);
147 
148  armnn::InputTensors inputTensors
149  {
150  {0, armnn::ConstTensor(run->GetInputTensorInfo(networkIdentifier, 0), alignedInputPtr)},
151  };
152  armnn::OutputTensors outputTensors
153  {
154  {0, armnn::Tensor(run->GetOutputTensorInfo(networkIdentifier, 0), alignedOutputPtr)}
155  };
156 
157  // Execute network
158  run->EnqueueWorkload(networkIdentifier, inputTensors, outputTensors);
159  run->UnloadNetwork(networkIdentifier);
160 
161 
162  // Tell the CLBackend to sync memory so we can read the output.
163  arm_compute::CLScheduler::get().sync();
164  auto* outputResult = reinterpret_cast<float*>(alignedOutputPtr);
165 
166  run->UnloadNetwork(networkIdentifier);
167  CHECK(outputResult[0] == number);
168  auto& backendRegistry = armnn::BackendRegistryInstance();
169  backendRegistry.DeregisterAllocator(ClBackend::GetIdStatic());
170 }
171 
172 // Only run this test if NEON is enabled
173 #if defined(ARMCOMPUTENEON_ENABLED)
174 
175 TEST_CASE("ClCustomAllocatorCpuAccNegativeTest")
176 {
177  using namespace armnn;
178 
179  // Create ArmNN runtime
180  IRuntime::CreationOptions options; // default options
181  auto customAllocator = std::make_shared<SampleClBackendCustomAllocator>();
182  options.m_CustomAllocatorMap = {{"CpuAcc", std::move(customAllocator)}};
183  IRuntimePtr run = IRuntime::Create(options);
184  TensorInfo inputTensorInfo(TensorShape({1, 1}), DataType::Float32);
185  INetworkPtr myNetwork = CreateTestNetwork(inputTensorInfo);
186 
187  // Optimise ArmNN network
188  OptimizerOptions optOptions;
189  optOptions.m_ImportEnabled = true;
190  IOptimizedNetworkPtr optNet(nullptr, nullptr);
191  std::vector<std::string> errMessages;
192 
193  CHECK_THROWS_AS_MESSAGE(Optimize(*myNetwork, {"CpuAcc"}, run->GetDeviceSpec(), optOptions, errMessages),
194  armnn::Exception,
195  "Expected an exception as GetAvailablePreferredBackends() should be empty in Optimize().");
196 
197  auto& backendRegistry = armnn::BackendRegistryInstance();
198  backendRegistry.DeregisterAllocator(NeonBackend::GetIdStatic());
199 }
200 
201 #endif
202 
203 TEST_CASE("ClCustomAllocatorGpuAccNullptrTest")
204 {
205  using namespace armnn;
206 
207  // Create ArmNN runtime
208  IRuntime::CreationOptions options; // default options
209  auto customAllocator = std::make_shared<SampleClBackendCustomAllocator>();
210  options.m_CustomAllocatorMap = {{"GpuAcc", nullptr}};
211 
212  CHECK_THROWS_AS_MESSAGE(IRuntimePtr run = IRuntime::Create(options),
213  armnn::Exception,
214  "Expected exception in RuntimeImpl::RuntimeImpl() as allocator was nullptr.");
215 }
216 
217 }
static IRuntimePtr Create(const CreationOptions &options)
Definition: Runtime.cpp:39
std::unique_ptr< IRuntime, void(*)(IRuntime *runtime)> IRuntimePtr
Definition: IRuntime.hpp:30
BackendRegistry & BackendRegistryInstance()
std::vector< std::pair< LayerBindingId, class ConstTensor > > InputTensors
Definition: Tensor.hpp:360
Copyright (c) 2021 ARM Limited and Contributors.
A tensor defined by a TensorInfo (shape and data type) and a mutable backing store.
Definition: Tensor.hpp:319
IOptimizedNetworkPtr Optimize(const INetwork &network, const std::vector< BackendId > &backendPreferences, const IDeviceSpec &deviceSpec, const OptimizerOptions &options=OptimizerOptions(), Optional< std::vector< std::string > &> messages=EmptyOptional())
Create an optimized version of the network.
Definition: Network.cpp:1613
int NetworkId
Definition: IRuntime.hpp:24
A tensor defined by a TensorInfo (shape and data type) and an immutable backing store.
Definition: Tensor.hpp:327
std::vector< std::pair< LayerBindingId, class Tensor > > OutputTensors
Definition: Tensor.hpp:361
std::unique_ptr< IOptimizedNetwork, void(*)(IOptimizedNetwork *network)> IOptimizedNetworkPtr
Definition: INetwork.hpp:173
std::map< BackendId, std::shared_ptr< ICustomAllocator > > m_CustomAllocatorMap
A map to define a custom memory allocator for specific backend Ids.
Definition: IRuntime.hpp:136
Base class for all ArmNN exceptions so that users can filter to just those.
Definition: Exceptions.hpp:46
static const BackendId & GetIdStatic()
Definition: NeonBackend.cpp:43
armnn::INetworkPtr CreateTestNetwork(armnn::TensorInfo &inputTensorInfo)
std::unique_ptr< INetwork, void(*)(INetwork *network)> INetworkPtr
Definition: INetwork.hpp:172
static const BackendId & GetIdStatic()
Definition: ClBackend.cpp:44