// // Copyright © 2022 Arm Ltd and Contributors. All rights reserved. // SPDX-License-Identifier: MIT // #pragma once #include "TestUtils.hpp" #include #include #include #include #include #include #include #include namespace { std::vector CreateBatchMatMulTfLiteModel( tflite::BuiltinOperator bmmOperatorCode, tflite::TensorType tensorType, const std::vector & LHSInputTensorShape, const std::vector & RHSInputTensorShape, const std::vector & outputTensorShape, bool adjX = false, bool adjY = false, float quantScale = 1.0f, int quantOffset = 0) { using namespace tflite; flatbuffers::FlatBufferBuilder flatBufferBuilder; std::vector> buffers; buffers.push_back(CreateBuffer(flatBufferBuilder, flatBufferBuilder.CreateVector({}))); auto quantizationParameters = CreateQuantizationParameters(flatBufferBuilder, 0, 0, flatBufferBuilder.CreateVector({ quantScale }), flatBufferBuilder.CreateVector({ quantOffset })); std::array, 3> tensors; tensors[0] = CreateTensor(flatBufferBuilder, flatBufferBuilder.CreateVector(LHSInputTensorShape.data(), LHSInputTensorShape.size()), tensorType, 0, flatBufferBuilder.CreateString("LHSInput"), quantizationParameters); tensors[1] = CreateTensor(flatBufferBuilder, flatBufferBuilder.CreateVector(RHSInputTensorShape.data(), RHSInputTensorShape.size()), tensorType, 0, flatBufferBuilder.CreateString("RHSInput"), quantizationParameters); tensors[2] = CreateTensor(flatBufferBuilder, flatBufferBuilder.CreateVector(outputTensorShape.data(), outputTensorShape.size()), tensorType, 0, flatBufferBuilder.CreateString("output"), quantizationParameters); // create operator tflite::BuiltinOptions operatorBuiltinOptionsType = BuiltinOptions_BatchMatMulOptions; flatbuffers::Offset operatorBuiltinOptions = CreateBatchMatMulOptions(flatBufferBuilder, adjX, adjY).Union(); const std::vector operatorInputs{{0, 1}}; const std::vector operatorOutputs{2}; flatbuffers::Offset bmmOperator = CreateOperator(flatBufferBuilder, 0, flatBufferBuilder.CreateVector(operatorInputs.data(), operatorInputs.size()), flatBufferBuilder.CreateVector(operatorOutputs.data(), operatorOutputs.size()), operatorBuiltinOptionsType, operatorBuiltinOptions); const std::vector subgraphInputs{{0, 1}}; const std::vector subgraphOutputs{2}; flatbuffers::Offset subgraph = CreateSubGraph(flatBufferBuilder, flatBufferBuilder.CreateVector(tensors.data(), tensors.size()), flatBufferBuilder.CreateVector(subgraphInputs.data(), subgraphInputs.size()), flatBufferBuilder.CreateVector(subgraphOutputs.data(), subgraphOutputs.size()), flatBufferBuilder.CreateVector(&bmmOperator, 1)); flatbuffers::Offset modelDescription = flatBufferBuilder.CreateString("ArmnnDelegate: BatchMatMul Operator Model"); flatbuffers::Offset operatorCode = CreateOperatorCode(flatBufferBuilder, bmmOperatorCode); flatbuffers::Offset flatbufferModel = CreateModel(flatBufferBuilder, TFLITE_SCHEMA_VERSION, flatBufferBuilder.CreateVector(&operatorCode, 1), flatBufferBuilder.CreateVector(&subgraph, 1), modelDescription, flatBufferBuilder.CreateVector(buffers.data(), buffers.size())); flatBufferBuilder.Finish(flatbufferModel); return std::vector(flatBufferBuilder.GetBufferPointer(), flatBufferBuilder.GetBufferPointer() + flatBufferBuilder.GetSize()); } template void BatchMatMulTest(tflite::BuiltinOperator bmmOperatorCode, tflite::TensorType tensorType, std::vector& backends, std::vector& LHSInputShape, std::vector& RHSInputShape, std::vector& outputShape, std::vector& LHSInputValues, std::vector& RHSInputValues, std::vector& expectedOutputValues, bool adjX = false, bool adjY = false, float quantScale = 1.0f, int quantOffset = 0) { using namespace tflite; std::vector modelBuffer = CreateBatchMatMulTfLiteModel(bmmOperatorCode, tensorType, LHSInputShape, RHSInputShape, outputShape, adjX, adjY, quantScale, quantOffset); const Model* tfLiteModel = GetModel(modelBuffer.data()); CHECK(tfLiteModel != nullptr); // Create TfLite Interpreters std::unique_ptr armnnDelegateInterpreter; CHECK(InterpreterBuilder(tfLiteModel, ::tflite::ops::builtin::BuiltinOpResolver()) (&armnnDelegateInterpreter) == kTfLiteOk); CHECK(armnnDelegateInterpreter != nullptr); CHECK(armnnDelegateInterpreter->AllocateTensors() == kTfLiteOk); std::unique_ptr tfLiteInterpreter; CHECK(InterpreterBuilder(tfLiteModel, ::tflite::ops::builtin::BuiltinOpResolver()) (&tfLiteInterpreter) == kTfLiteOk); CHECK(tfLiteInterpreter != nullptr); CHECK(tfLiteInterpreter->AllocateTensors() == kTfLiteOk); // Create the ArmNN Delegate armnnDelegate::DelegateOptions delegateOptions(backends); std::unique_ptr theArmnnDelegate(armnnDelegate::TfLiteArmnnDelegateCreate(delegateOptions), armnnDelegate::TfLiteArmnnDelegateDelete); CHECK(theArmnnDelegate != nullptr); // Modify armnnDelegateInterpreter to use armnnDelegate CHECK(armnnDelegateInterpreter->ModifyGraphWithDelegate(theArmnnDelegate.get()) == kTfLiteOk); // Set input data auto tfLiteDelegateLHSInputId = tfLiteInterpreter->inputs()[0]; auto tfLiteDelegateLHSInputData = tfLiteInterpreter->typed_tensor(tfLiteDelegateLHSInputId); auto tfLiteDelegateRHSInputId = tfLiteInterpreter->inputs()[1]; auto tfLiteDelegateRHSInputData = tfLiteInterpreter->typed_tensor(tfLiteDelegateRHSInputId); for (unsigned int i = 0; i < LHSInputValues.size(); ++i) { tfLiteDelegateLHSInputData[i] = LHSInputValues[i]; } for (unsigned int i = 0; i < RHSInputValues.size(); ++i) { tfLiteDelegateRHSInputData[i] = RHSInputValues[i]; } auto armnnDelegateLHSInputId = armnnDelegateInterpreter->inputs()[0]; auto armnnDelegateLHSInputData = armnnDelegateInterpreter->typed_tensor(armnnDelegateLHSInputId); auto armnnDelegateRHSInputId = armnnDelegateInterpreter->inputs()[1]; auto armnnDelegateRHSInputData = armnnDelegateInterpreter->typed_tensor(armnnDelegateRHSInputId); for (unsigned int i = 0; i < LHSInputValues.size(); ++i) { armnnDelegateLHSInputData[i] = LHSInputValues[i]; } for (unsigned int i = 0; i < RHSInputValues.size(); ++i) { armnnDelegateRHSInputData[i] = RHSInputValues[i]; } // Run EnqueueWorkload CHECK(tfLiteInterpreter->Invoke() == kTfLiteOk); CHECK(armnnDelegateInterpreter->Invoke() == kTfLiteOk); armnnDelegate::CompareOutputData(tfLiteInterpreter, armnnDelegateInterpreter, outputShape, expectedOutputValues); } } // anonymous namespace