summaryrefslogtreecommitdiff
path: root/source/application/api/use_case/vww/include/VisualWakeWordProcessing.hpp
blob: f9f9d72cf5f4de65e03f61ed6d6fc9f17acae454 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
/*
 * Copyright (c) 2022 Arm Limited. All rights reserved.
 * SPDX-License-Identifier: Apache-2.0
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
#ifndef VWW_PROCESSING_HPP
#define VWW_PROCESSING_HPP

#include "BaseProcessing.hpp"
#include "Model.hpp"
#include "Classifier.hpp"

namespace arm {
namespace app {

    /**
     * @brief   Pre-processing class for Visual Wake Word use case.
     *          Implements methods declared by BasePreProcess and anything else needed
     *          to populate input tensors ready for inference.
     */
    class VisualWakeWordPreProcess : public BasePreProcess {

    public:
        /**
         * @brief       Constructor
         * @param[in]   inputTensor   Pointer to the TFLite Micro input Tensor.
         * @param[in]   rgb2Gray      Convert image from 3 channel RGB to 1 channel grayscale.
         **/
        explicit VisualWakeWordPreProcess(TfLiteTensor* inputTensor, bool rgb2Gray=true);

        /**
         * @brief       Should perform pre-processing of 'raw' input image data and load it into
         *              TFLite Micro input tensors ready for inference
         * @param[in]   input      Pointer to the data that pre-processing will work on.
         * @param[in]   inputSize  Size of the input data.
         * @return      true if successful, false otherwise.
         **/
        bool DoPreProcess(const void* input, size_t inputSize) override;

    private:
        TfLiteTensor* m_inputTensor;
        bool m_rgb2Gray;
    };

    /**
     * @brief   Post-processing class for Visual Wake Word use case.
     *          Implements methods declared by BasePostProcess and anything else needed
     *          to populate result vector.
     */
    class VisualWakeWordPostProcess : public BasePostProcess {

    private:
        TfLiteTensor* m_outputTensor;
        Classifier& m_vwwClassifier;
        const std::vector<std::string>& m_labels;
        std::vector<ClassificationResult>& m_results;

    public:
        /**
         * @brief       Constructor
         * @param[in]   outputTensor   Pointer to the TFLite Micro output Tensor.
         * @param[in]   classifier     Classifier object used to get top N results from classification.
         * @param[in]   model          Pointer to the VWW classification Model object.
         * @param[in]   labels         Vector of string labels to identify each output of the model.
         * @param[out]  results        Vector of classification results to store decoded outputs.
         **/
        VisualWakeWordPostProcess(TfLiteTensor* outputTensor, Classifier& classifier,
                const std::vector<std::string>& labels,
                std::vector<ClassificationResult>& results);

        /**
         * @brief    Should perform post-processing of the result of inference then
         *           populate classification result data for any later use.
         * @return   true if successful, false otherwise.
         **/
        bool DoPostProcess() override;
    };

} /* namespace app */
} /* namespace arm */

#endif /* VWW_PROCESSING_HPP */