/* * SPDX-FileCopyrightText: Copyright 2021-2022 Arm Limited and/or its affiliates * SPDX-License-Identifier: Apache-2.0 * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #include "UseCaseHandler.hpp" #include "VisualWakeWordModel.hpp" #include "Classifier.hpp" #include "InputFiles.hpp" #include "ImageUtils.hpp" #include "UseCaseCommonUtils.hpp" #include "hal.h" #include "log_macros.h" #include "VisualWakeWordProcessing.hpp" namespace arm { namespace app { /* Visual Wake Word inference handler. */ bool ClassifyImageHandler(ApplicationContext &ctx, uint32_t imgIndex, bool runAll) { auto& profiler = ctx.Get("profiler"); auto& model = ctx.Get("model"); /* If the request has a valid size, set the image index. */ if (imgIndex < NUMBER_OF_FILES) { if (!SetAppCtxIfmIdx(ctx, imgIndex,"imgIndex")) { return false; } } auto initialImgIdx = ctx.Get("imgIndex"); constexpr uint32_t dataPsnImgDownscaleFactor = 1; constexpr uint32_t dataPsnImgStartX = 10; constexpr uint32_t dataPsnImgStartY = 35; constexpr uint32_t dataPsnTxtInfStartX = 150; constexpr uint32_t dataPsnTxtInfStartY = 40; if (!model.IsInited()) { printf_err("Model is not initialised! Terminating processing.\n"); return false; } TfLiteTensor* inputTensor = model.GetInputTensor(0); TfLiteTensor* outputTensor = model.GetOutputTensor(0); if (!inputTensor->dims) { printf_err("Invalid input tensor dims\n"); return false; } else if (inputTensor->dims->size < 4) { printf_err("Input tensor dimension should be = 4\n"); return false; } /* Get input shape for displaying the image. */ TfLiteIntArray* inputShape = model.GetInputShape(0); const uint32_t nCols = inputShape->data[arm::app::VisualWakeWordModel::ms_inputColsIdx]; const uint32_t nRows = inputShape->data[arm::app::VisualWakeWordModel::ms_inputRowsIdx]; if (arm::app::VisualWakeWordModel::ms_inputChannelsIdx >= static_cast(inputShape->size)) { printf_err("Invalid channel index.\n"); return false; } /* We expect RGB images to be provided. */ const uint32_t displayChannels = 3; /* Set up pre and post-processing. */ VisualWakeWordPreProcess preProcess = VisualWakeWordPreProcess(inputTensor); std::vector results; VisualWakeWordPostProcess postProcess = VisualWakeWordPostProcess(outputTensor, ctx.Get("classifier"), ctx.Get&>("labels"), results); do { hal_lcd_clear(COLOR_BLACK); /* Strings for presentation/logging. */ std::string str_inf{"Running inference... "}; const uint8_t* imgSrc = get_img_array(ctx.Get("imgIndex")); if (nullptr == imgSrc) { printf_err("Failed to get image index %" PRIu32 " (max: %u)\n", ctx.Get("imgIndex"), NUMBER_OF_FILES - 1); return false; } /* Display this image on the LCD. */ hal_lcd_display_image( imgSrc, nCols, nRows, displayChannels, dataPsnImgStartX, dataPsnImgStartY, dataPsnImgDownscaleFactor); /* Display message on the LCD - inference running. */ hal_lcd_display_text(str_inf.c_str(), str_inf.size(), dataPsnTxtInfStartX, dataPsnTxtInfStartY, 0); /* Run inference over this image. */ info("Running inference on image %" PRIu32 " => %s\n", ctx.Get("imgIndex"), get_filename(ctx.Get("imgIndex"))); const size_t imgSz = inputTensor->bytes < IMAGE_DATA_SIZE ? inputTensor->bytes : IMAGE_DATA_SIZE; /* Run the pre-processing, inference and post-processing. */ if (!preProcess.DoPreProcess(imgSrc, imgSz)) { printf_err("Pre-processing failed."); return false; } if (!RunInference(model, profiler)) { printf_err("Inference failed."); return false; } if (!postProcess.DoPostProcess()) { printf_err("Post-processing failed."); return false; } /* Erase. */ str_inf = std::string(str_inf.size(), ' '); hal_lcd_display_text(str_inf.c_str(), str_inf.size(), dataPsnTxtInfStartX, dataPsnTxtInfStartY, 0); /* Add results to context for access outside handler. */ ctx.Set>("results", results); #if VERIFY_TEST_OUTPUT arm::app::DumpTensor(outputTensor); #endif /* VERIFY_TEST_OUTPUT */ if (!PresentInferenceResult(results)) { return false; } profiler.PrintProfilingResult(); IncrementAppCtxIfmIdx(ctx,"imgIndex"); } while (runAll && ctx.Get("imgIndex") != initialImgIdx); return true; } } /* namespace app */ } /* namespace arm */