//
// Copyright © 2021, 2023-2024 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//

#pragma once

#include "TestUtils.hpp"

#include <armnn_delegate.hpp>
#include <DelegateTestInterpreter.hpp>

#include <tensorflow/lite/version.h>

namespace
{

// RAII helper: swaps a stream's buffer on construction and restores the
// original buffer on destruction.
struct StreamRedirector
{
public:
    StreamRedirector(std::ostream& stream, std::streambuf* newStreamBuffer)
        : m_Stream(stream)
        , m_BackupBuffer(m_Stream.rdbuf(newStreamBuffer))
    {}

    ~StreamRedirector()
    {
        m_Stream.rdbuf(m_BackupBuffer);
    }

private:
    std::ostream& m_Stream;
    std::streambuf* m_BackupBuffer;
};

std::vector<char> CreateAddDivTfLiteModel(tflite::TensorType tensorType,
                                          const std::vector<int32_t>& tensorShape,
                                          float quantScale = 1.0f,
                                          int quantOffset = 0)
{
    using namespace tflite;
    flatbuffers::FlatBufferBuilder flatBufferBuilder;

    std::vector<flatbuffers::Offset<tflite::Buffer>> buffers;
    buffers.push_back(CreateBuffer(flatBufferBuilder));
    buffers.push_back(CreateBuffer(flatBufferBuilder));
    buffers.push_back(CreateBuffer(flatBufferBuilder));
    buffers.push_back(CreateBuffer(flatBufferBuilder));
    buffers.push_back(CreateBuffer(flatBufferBuilder));
    buffers.push_back(CreateBuffer(flatBufferBuilder));

    auto quantizationParameters =
        CreateQuantizationParameters(flatBufferBuilder,
                                     0,
                                     0,
                                     flatBufferBuilder.CreateVector<float>({ quantScale }),
                                     flatBufferBuilder.CreateVector<int64_t>({ quantOffset }));

    std::array<flatbuffers::Offset<Tensor>, 5> tensors;
    tensors[0] = CreateTensor(flatBufferBuilder,
                              flatBufferBuilder.CreateVector<int32_t>(tensorShape.data(),
                                                                      tensorShape.size()),
                              tensorType,
                              1,
                              flatBufferBuilder.CreateString("input_0"),
                              quantizationParameters);

    tensors[1] = CreateTensor(flatBufferBuilder,
                              flatBufferBuilder.CreateVector<int32_t>(tensorShape.data(),
                                                                      tensorShape.size()),
                              tensorType,
                              2,
                              flatBufferBuilder.CreateString("input_1"),
                              quantizationParameters);

    tensors[2] = CreateTensor(flatBufferBuilder,
                              flatBufferBuilder.CreateVector<int32_t>(tensorShape.data(),
                                                                      tensorShape.size()),
                              tensorType,
                              3,
                              flatBufferBuilder.CreateString("input_2"),
                              quantizationParameters);

    tensors[3] = CreateTensor(flatBufferBuilder,
                              flatBufferBuilder.CreateVector<int32_t>(tensorShape.data(),
                                                                      tensorShape.size()),
                              tensorType,
                              4,
                              flatBufferBuilder.CreateString("add"),
                              quantizationParameters);

    tensors[4] = CreateTensor(flatBufferBuilder,
                              flatBufferBuilder.CreateVector<int32_t>(tensorShape.data(),
                                                                      tensorShape.size()),
                              tensorType,
                              5,
                              flatBufferBuilder.CreateString("output"),
                              quantizationParameters);

    // Create the operators. Each operator's union type tag must match the
    // options table it carries: AddOptions for ADD, DivOptions for DIV.
    tflite::BuiltinOptions addBuiltinOptionsType = tflite::BuiltinOptions_AddOptions;
    flatbuffers::Offset<void> addBuiltinOptions =
        CreateAddOptions(flatBufferBuilder, ActivationFunctionType_NONE).Union();

    tflite::BuiltinOptions divBuiltinOptionsType = tflite::BuiltinOptions_DivOptions;
    flatbuffers::Offset<void> divBuiltinOptions =
        CreateDivOptions(flatBufferBuilder, ActivationFunctionType_NONE).Union();

    std::array<flatbuffers::Offset<Operator>, 2> operators;

    const std::vector<int32_t> addInputs{ 0, 1 };
    const std::vector<int32_t> addOutputs{ 3 };
    operators[0] = CreateOperator(flatBufferBuilder,
                                  0,
                                  flatBufferBuilder.CreateVector<int32_t>(addInputs.data(),
                                                                          addInputs.size()),
                                  flatBufferBuilder.CreateVector<int32_t>(addOutputs.data(),
                                                                          addOutputs.size()),
                                  addBuiltinOptionsType,
                                  addBuiltinOptions);

    const std::vector<int32_t> divInputs{ 3, 2 };
    const std::vector<int32_t> divOutputs{ 4 };
    operators[1] = CreateOperator(flatBufferBuilder,
                                  1,
                                  flatBufferBuilder.CreateVector<int32_t>(divInputs.data(),
                                                                          divInputs.size()),
                                  flatBufferBuilder.CreateVector<int32_t>(divOutputs.data(),
                                                                          divOutputs.size()),
                                  divBuiltinOptionsType,
                                  divBuiltinOptions);

    const std::vector<int32_t> subgraphInputs{ 0, 1, 2 };
    const std::vector<int32_t> subgraphOutputs{ 4 };
    flatbuffers::Offset<SubGraph> subgraph =
        CreateSubGraph(flatBufferBuilder,
                       flatBufferBuilder.CreateVector(tensors.data(), tensors.size()),
                       flatBufferBuilder.CreateVector<int32_t>(subgraphInputs.data(),
                                                               subgraphInputs.size()),
                       flatBufferBuilder.CreateVector<int32_t>(subgraphOutputs.data(),
                                                               subgraphOutputs.size()),
                       flatBufferBuilder.CreateVector(operators.data(), operators.size()));

    flatbuffers::Offset<flatbuffers::String> modelDescription =
        flatBufferBuilder.CreateString("ArmnnDelegate: Add and Div Operator Model");

    std::array<flatbuffers::Offset<OperatorCode>, 2> codes;
    codes[0] = CreateOperatorCode(flatBufferBuilder, tflite::BuiltinOperator_ADD);
    codes[1] = CreateOperatorCode(flatBufferBuilder, tflite::BuiltinOperator_DIV);

    flatbuffers::Offset<Model> flatbufferModel =
        CreateModel(flatBufferBuilder,
                    TFLITE_SCHEMA_VERSION,
                    flatBufferBuilder.CreateVector(codes.data(), codes.size()),
                    flatBufferBuilder.CreateVector(&subgraph, 1),
                    modelDescription,
                    flatBufferBuilder.CreateVector(buffers.data(), buffers.size()));

    flatBufferBuilder.Finish(flatbufferModel, armnnDelegate::FILE_IDENTIFIER);

    return std::vector<char>(flatBufferBuilder.GetBufferPointer(),
                             flatBufferBuilder.GetBufferPointer() + flatBufferBuilder.GetSize());
}
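// Sketch of the graph built by CreateAddDivTfLiteModel above (tensor indices
// match the tensors array; tensor names match the CreateString() calls):
//
//   input_0 (0) ──┐
//                 ├─> ADD ──> add (3) ──┐
//   input_1 (1) ──┘                     ├─> DIV ──> output (4)
//   input_2 (2) ────────────────────────┘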
std::vector<char> CreateCosTfLiteModel(tflite::TensorType tensorType,
                                       const std::vector<int32_t>& tensorShape,
                                       float quantScale = 1.0f,
                                       int quantOffset = 0)
{
    using namespace tflite;
    flatbuffers::FlatBufferBuilder flatBufferBuilder;

    std::vector<flatbuffers::Offset<tflite::Buffer>> buffers;
    buffers.push_back(CreateBuffer(flatBufferBuilder));

    auto quantizationParameters =
        CreateQuantizationParameters(flatBufferBuilder,
                                     0,
                                     0,
                                     flatBufferBuilder.CreateVector<float>({ quantScale }),
                                     flatBufferBuilder.CreateVector<int64_t>({ quantOffset }));

    std::array<flatbuffers::Offset<Tensor>, 2> tensors;
    tensors[0] = CreateTensor(flatBufferBuilder,
                              flatBufferBuilder.CreateVector<int32_t>(tensorShape.data(),
                                                                      tensorShape.size()),
                              tensorType,
                              0,
                              flatBufferBuilder.CreateString("input"),
                              quantizationParameters);
    tensors[1] = CreateTensor(flatBufferBuilder,
                              flatBufferBuilder.CreateVector<int32_t>(tensorShape.data(),
                                                                      tensorShape.size()),
                              tensorType,
                              0,
                              flatBufferBuilder.CreateString("output"),
                              quantizationParameters);

    const std::vector<int32_t> operatorInputs({ 0 });
    const std::vector<int32_t> operatorOutputs({ 1 });

    flatbuffers::Offset<Operator> cosOperator =
        CreateOperator(flatBufferBuilder,
                       0,
                       flatBufferBuilder.CreateVector<int32_t>(operatorInputs.data(),
                                                               operatorInputs.size()),
                       flatBufferBuilder.CreateVector<int32_t>(operatorOutputs.data(),
                                                               operatorOutputs.size()),
                       BuiltinOptions_NONE);

    flatbuffers::Offset<flatbuffers::String> modelDescription =
        flatBufferBuilder.CreateString("ArmnnDelegate: COS Operator Model");
    flatbuffers::Offset<OperatorCode> operatorCode =
        CreateOperatorCode(flatBufferBuilder, tflite::BuiltinOperator_COS);

    const std::vector<int32_t> subgraphInputs({ 0 });
    const std::vector<int32_t> subgraphOutputs({ 1 });
    flatbuffers::Offset<SubGraph> subgraph =
        CreateSubGraph(flatBufferBuilder,
                       flatBufferBuilder.CreateVector(tensors.data(), tensors.size()),
                       flatBufferBuilder.CreateVector<int32_t>(subgraphInputs.data(),
                                                               subgraphInputs.size()),
                       flatBufferBuilder.CreateVector<int32_t>(subgraphOutputs.data(),
                                                               subgraphOutputs.size()),
                       flatBufferBuilder.CreateVector(&cosOperator, 1));

    flatbuffers::Offset<Model> flatbufferModel =
        CreateModel(flatBufferBuilder,
                    TFLITE_SCHEMA_VERSION,
                    flatBufferBuilder.CreateVector(&operatorCode, 1),
                    flatBufferBuilder.CreateVector(&subgraph, 1),
                    modelDescription,
                    flatBufferBuilder.CreateVector(buffers.data(), buffers.size()));

    flatBufferBuilder.Finish(flatbufferModel, armnnDelegate::FILE_IDENTIFIER);

    return std::vector<char>(flatBufferBuilder.GetBufferPointer(),
                             flatBufferBuilder.GetBufferPointer() + flatBufferBuilder.GetSize());
}
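// Note: COS appears to be chosen precisely because the Arm NN delegate does
// not support it (an assumption based on how DelegateOptionNoFallbackTest
// below uses this model): with TfLite-runtime fallback disabled, attempting
// to delegate the graph is expected to raise an armnn::Exception.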
template <typename T>
void DelegateOptionTest(tflite::TensorType tensorType,
                        std::vector<int32_t>& tensorShape,
                        std::vector<T>& input0Values,
                        std::vector<T>& input1Values,
                        std::vector<T>& input2Values,
                        std::vector<T>& expectedOutputValues,
                        const armnnDelegate::DelegateOptions& delegateOptions,
                        float quantScale = 1.0f,
                        int quantOffset = 0)
{
    using namespace delegateTestInterpreter;
    std::vector<char> modelBuffer = CreateAddDivTfLiteModel(tensorType,
                                                            tensorShape,
                                                            quantScale,
                                                            quantOffset);

    // Setup interpreter with just TFLite Runtime.
    auto tfLiteInterpreter = DelegateTestInterpreter(modelBuffer);
    CHECK(tfLiteInterpreter.AllocateTensors() == kTfLiteOk);
    CHECK(tfLiteInterpreter.FillInputTensor<T>(input0Values, 0) == kTfLiteOk);
    CHECK(tfLiteInterpreter.FillInputTensor<T>(input1Values, 1) == kTfLiteOk);
    CHECK(tfLiteInterpreter.FillInputTensor<T>(input2Values, 2) == kTfLiteOk);
    CHECK(tfLiteInterpreter.Invoke() == kTfLiteOk);
    std::vector<T> tfLiteOutputValues = tfLiteInterpreter.GetOutputResult<T>(0);
    std::vector<int32_t> tfLiteOutputShape = tfLiteInterpreter.GetOutputShape(0);

    // Setup interpreter with Arm NN Delegate applied.
    auto armnnInterpreter = DelegateTestInterpreter(modelBuffer, delegateOptions);
    CHECK(armnnInterpreter.AllocateTensors() == kTfLiteOk);
    CHECK(armnnInterpreter.FillInputTensor<T>(input0Values, 0) == kTfLiteOk);
    CHECK(armnnInterpreter.FillInputTensor<T>(input1Values, 1) == kTfLiteOk);
    CHECK(armnnInterpreter.FillInputTensor<T>(input2Values, 2) == kTfLiteOk);
    CHECK(armnnInterpreter.Invoke() == kTfLiteOk);
    std::vector<T> armnnOutputValues = armnnInterpreter.GetOutputResult<T>(0);
    std::vector<int32_t> armnnOutputShape = armnnInterpreter.GetOutputShape(0);

    armnnDelegate::CompareOutputData<T>(tfLiteOutputValues, armnnOutputValues, expectedOutputValues);
    armnnDelegate::CompareOutputShape(tfLiteOutputShape, armnnOutputShape, tensorShape);

    tfLiteInterpreter.Cleanup();
    armnnInterpreter.Cleanup();
}

template <typename T>
void DelegateOptionNoFallbackTest(tflite::TensorType tensorType,
                                  std::vector<int32_t>& tensorShape,
                                  std::vector<T>& inputValues,
                                  std::vector<T>& expectedOutputValues,
                                  const armnnDelegate::DelegateOptions& delegateOptions,
                                  float quantScale = 1.0f,
                                  int quantOffset = 0)
{
    using namespace delegateTestInterpreter;
    std::vector<char> modelBuffer = CreateCosTfLiteModel(tensorType,
                                                         tensorShape,
                                                         quantScale,
                                                         quantOffset);

    // Setup interpreter with just TFLite Runtime.
    auto tfLiteInterpreter = DelegateTestInterpreter(modelBuffer);
    CHECK(tfLiteInterpreter.AllocateTensors() == kTfLiteOk);
    CHECK(tfLiteInterpreter.FillInputTensor<T>(inputValues, 0) == kTfLiteOk);
    CHECK(tfLiteInterpreter.Invoke() == kTfLiteOk);
    std::vector<T> tfLiteOutputValues = tfLiteInterpreter.GetOutputResult<T>(0);
    std::vector<int32_t> tfLiteOutputShape = tfLiteInterpreter.GetOutputShape(0);
    tfLiteInterpreter.Cleanup();

    try
    {
        auto armnnInterpreter = DelegateTestInterpreter(modelBuffer, delegateOptions);
        CHECK(armnnInterpreter.AllocateTensors() == kTfLiteOk);
        CHECK(armnnInterpreter.FillInputTensor<T>(inputValues, 0) == kTfLiteOk);
        CHECK(armnnInterpreter.Invoke() == kTfLiteOk);
        std::vector<T> armnnOutputValues = armnnInterpreter.GetOutputResult<T>(0);
        std::vector<int32_t> armnnOutputShape = armnnInterpreter.GetOutputShape(0);
        armnnInterpreter.Cleanup();

        armnnDelegate::CompareOutputData<T>(tfLiteOutputValues, armnnOutputValues, expectedOutputValues);
        armnnDelegate::CompareOutputShape(tfLiteOutputShape, armnnOutputShape, tensorShape);
    }
    catch (const armnn::Exception& e)
    {
        // Forward the exception message to std::cout
        std::cout << e.what() << std::endl;
    }
}

} // anonymous namespace
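// Illustrative usage sketch (hypothetical data, not part of this header):
// a test case could drive DelegateOptionTest along these lines, assuming a
// DelegateOptions constructed for the CpuRef backend:
//
//   std::vector<int32_t> tensorShape{ 1, 2, 2, 1 };
//   std::vector<float> input0{ 1.f, 2.f, 3.f, 4.f };
//   std::vector<float> input1{ 0.f, 1.f, 2.f, 3.f };
//   std::vector<float> input2{ 1.f, 1.f, 1.f, 1.f };
//   std::vector<float> expected{ 1.f, 3.f, 5.f, 7.f }; // (input0 + input1) / input2
//
//   armnnDelegate::DelegateOptions delegateOptions(armnn::Compute::CpuRef);
//   DelegateOptionTest<float>(tflite::TensorType_FLOAT32, tensorShape,
//                             input0, input1, input2, expected, delegateOptions);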