diff options
Diffstat (limited to 'src/backends/gpuFsa/test/GpuFsaOptimizedNetworkTests.cpp')
-rw-r--r-- | src/backends/gpuFsa/test/GpuFsaOptimizedNetworkTests.cpp | 46 |
1 files changed, 46 insertions, 0 deletions
diff --git a/src/backends/gpuFsa/test/GpuFsaOptimizedNetworkTests.cpp b/src/backends/gpuFsa/test/GpuFsaOptimizedNetworkTests.cpp index 6ddb942dea..1e5c976c00 100644 --- a/src/backends/gpuFsa/test/GpuFsaOptimizedNetworkTests.cpp +++ b/src/backends/gpuFsa/test/GpuFsaOptimizedNetworkTests.cpp @@ -15,6 +15,52 @@ using namespace armnn; TEST_SUITE("GpuFsaOptimizedNetwork") { +TEST_CASE("BatchMatMulSupportedOptimizedNetwork") +{ + using namespace armnn; + + const float qScale = 1.0f; + const int32_t qOffset = 0; + + const TensorShape& input1Shape = { 2, 2 }; + const TensorShape& input2Shape = { 2, 2 }; + const TensorShape& outputShape = { 2, 2 }; + + TensorInfo input1TensorInfo(input1Shape, DataType::Float32, qScale, qOffset, true); + TensorInfo input2TensorInfo(input2Shape, DataType::Float32, qScale, qOffset, true); + TensorInfo outputTensorInfo(outputShape, DataType::Float32, qScale, qOffset); + + IRuntime::CreationOptions options; + IRuntimePtr runtime(IRuntime::Create(options)); + INetworkPtr network(INetwork::Create()); + + BatchMatMulDescriptor desc{}; + + IConnectableLayer* input1 = network->AddInputLayer(0, "input0"); + IConnectableLayer* input2 = network->AddInputLayer(1, "input1"); + IConnectableLayer* batchMatMulLayer = network->AddBatchMatMulLayer(desc, "batchMatMul"); + IConnectableLayer* output = network->AddOutputLayer(2, "output"); + + Connect(input1, batchMatMulLayer, input1TensorInfo, 0, 0); + Connect(input2, batchMatMulLayer, input2TensorInfo, 0, 1); + Connect(batchMatMulLayer, output, outputTensorInfo, 0, 0); + + std::vector<BackendId> backends = { "GpuFsa" }; + + OptimizerOptionsOpaque optimizedOptions; + IOptimizedNetworkPtr optNet = Optimize(*network, backends, runtime->GetDeviceSpec(), optimizedOptions); + CHECK(optNet); + + Graph& graph = GetGraphForTesting(optNet.get()); + + // Check graph layer sequence to ensure that the network has been replaced with a PreCompiledLayer + CHECK(CheckSequence(graph.cbegin(), graph.cend(), + &IsLayerOfType<InputLayer>, + &IsLayerOfType<InputLayer>, + &IsLayerOfType<PreCompiledLayer>, + &IsLayerOfType<OutputLayer>)); +} + TEST_CASE("CastSupportedOptimizedNetwork") { using namespace armnn; |