// Source path: lib/ethosu_profiler/src/ethosu_profiler.cpp
/*
 * Copyright (c) 2021 Arm Limited. All rights reserved.
 *
 * SPDX-License-Identifier: Apache-2.0
 *
 * Licensed under the Apache License, Version 2.0 (the License); you may
 * not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an AS IS BASIS, WITHOUT
 * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include "tensorflow/lite/kernels/internal/compatibility.h"
#include "tensorflow/lite/micro/micro_error_reporter.h"
#include "tensorflow/lite/micro/micro_profiler.h"
#include "tensorflow/lite/micro/micro_time.h"

#include <string.h>

#include "ethosu_profiler.hpp"
#include <ethosu_driver.h>
#include <inttypes.h>
#include <stdio.h>

namespace {

// Return the value reported by ETHOSU_PMU_Get_CCNTR_v2() for the given driver
// handle. The profiler uses it as the tick source for "ethos-u" tagged events.
uint64_t GetCurrentEthosuTicks(struct ethosu_driver *drv) {
    const uint64_t cycle_count = ETHOSU_PMU_Get_CCNTR_v2(drv);
    return cycle_count;
}

// Prepare the PMU of `drv` for a measurement, in this order:
//   1. enable the PMU,
//   2. enable event counters 1-4 together with the cycle counter,
//   3. program event counter i with ethosu_pmu_cntrs[i],
//   4. call ETHOSU_PMU_EVCNTR_ALL_Reset_v2() on the driver.
// `ethosu_pmu_cntrs` is read for indices 0 .. ETHOSU_PMU_NCOUNTERS - 1.
void InitEthosuPMUCounters(struct ethosu_driver *drv, ethosu_pmu_event_type *ethosu_pmu_cntrs) {
    const auto enabled_counters = ETHOSU_PMU_CNT1_Msk | ETHOSU_PMU_CNT2_Msk | ETHOSU_PMU_CNT3_Msk |
                                  ETHOSU_PMU_CNT4_Msk | ETHOSU_PMU_CCNT_Msk;

    ETHOSU_PMU_Enable_v2(drv);
    ETHOSU_PMU_CNTR_Enable_v2(drv, enabled_counters);

    int slot = 0;
    while (slot < ETHOSU_PMU_NCOUNTERS) {
        ETHOSU_PMU_Set_EVTYPER_v2(drv, slot, ethosu_pmu_cntrs[slot]);
        ++slot;
    }

    ETHOSU_PMU_EVCNTR_ALL_Reset_v2(drv);
}

// Return the value reported by ETHOSU_PMU_Get_EVCNTR_v2() for event counter
// number `counter` of the given driver handle.
uint32_t GetEthosuPMUEventCounter(struct ethosu_driver *drv, int counter) {
    const uint32_t event_count = ETHOSU_PMU_Get_EVCNTR_v2(drv, counter);
    return event_count;
}
} // namespace

namespace tflite {

// Create a profiler that can record up to `max_events` begin/end pairs.
//
// event0..event3 select the PMU event types that are programmed into the four
// Ethos-U event counters each time an "ethos-u" tagged event begins.
// max_events sizes the tag / start-tick / end-tick arrays; once that many
// events have been recorded BeginEvent() wraps around and overwrites from
// index 0.
EthosUProfiler::EthosUProfiler(ethosu_pmu_event_type event0,
                               ethosu_pmu_event_type event1,
                               ethosu_pmu_event_type event2,
                               ethosu_pmu_event_type event3,
                               size_t max_events) :
    max_events_(max_events) {
    tags_        = std::make_unique<const char *[]>(max_events_);
    start_ticks_ = std::make_unique<uint64_t[]>(max_events_);
    end_ticks_   = std::make_unique<uint64_t[]>(max_events_);

    // Start with an empty event log. Nothing else in this file initialises
    // num_events_, and BeginEvent()/GetTotalTicks()/Log() all read it, so make
    // the starting value explicit here rather than relying on the declaration.
    num_events_ = 0;

    // Accumulated PMU event counts start from zero.
    for (size_t i = 0; i < ETHOSU_PMU_NCOUNTERS; i++) {
        event_counters[i] = 0;
    }

    MonitorEthosuPMUEvents(event0, event1, event2, event3);
}

// Start recording an event and return the handle to pass to EndEvent().
//
// `tag` is stored by pointer (not copied), so it must stay valid for as long
// as the profiler may read it. Events tagged exactly "ethos-u" are timed with
// the NPU cycle counter: the counter is reset, configured to start on
// ETHOSU_PMU_NPU_ACTIVE and stop on ETHOSU_PMU_NPU_IDLE, and the PMU event
// counters are (re)programmed. All other events are timed with
// GetCurrentTimeTicks().
//
// When the event log is full an error is reported and recording wraps around
// to index 0, overwriting the oldest entries.
//
// NOTE: THIS PROFILER ONLY WORKS ON SYSTEMS WITH 1 NPU
uint32_t EthosUProfiler::BeginEvent(const char *tag) {
    if (num_events_ == max_events_) {
        // "%u" consumes an unsigned int from the variadic argument list, so
        // convert the size_t explicitly instead of passing it through as-is.
        tflite::GetMicroErrorReporter()->Report("Profiling event overflow, max: %u events",
                                                static_cast<unsigned int>(max_events_));
        num_events_ = 0;
    }

    tags_[num_events_] = tag;

    if (strcmp("ethos-u", tag) == 0) {
        struct ethosu_driver *ethosu_drv = ethosu_reserve_driver();
        ETHOSU_PMU_CYCCNT_Reset_v2(ethosu_drv);
        ETHOSU_PMU_PMCCNTR_CFG_Set_Start_Event_v2(ethosu_drv, ETHOSU_PMU_NPU_ACTIVE);
        ETHOSU_PMU_PMCCNTR_CFG_Set_Stop_Event_v2(ethosu_drv, ETHOSU_PMU_NPU_IDLE);
        start_ticks_[num_events_] = GetCurrentEthosuTicks(ethosu_drv);
        InitEthosuPMUCounters(ethosu_drv, ethosu_pmu_cntrs);
        ethosu_release_driver(ethosu_drv);
    } else {
        start_ticks_[num_events_] = GetCurrentTimeTicks();
    }

    // Until EndEvent() overwrites it, the end tick is one less than the start
    // tick, so an unfinished event shows up as a wrapped-around duration.
    end_ticks_[num_events_] = start_ticks_[num_events_] - 1;
    return num_events_++;
}

// NOTE: THIS PROFILER ONLY WORKS ON SYSTEMS WITH 1 NPU
void EthosUProfiler::EndEvent(uint32_t event_handle) {
    TFLITE_DCHECK(event_handle < max_events_);

    if (strcmp("ethos-u", tags_[event_handle]) == 0) {
        struct ethosu_driver *ethosu_drv = ethosu_reserve_driver();
        end_ticks_[event_handle]         = GetCurrentEthosuTicks(ethosu_drv);
        uint32_t ethosu_pmu_counter_end[ETHOSU_PMU_NCOUNTERS];
        ETHOSU_PMU_Disable_v2(ethosu_drv);
        for (size_t i = 0; i < ETHOSU_PMU_NCOUNTERS; i++) {
            ethosu_pmu_counter_end[i] = GetEthosuPMUEventCounter(ethosu_drv, i);
            tflite::GetMicroErrorReporter()->Report(
                "%s : ethosu_pmu_cntr%d : %u", tags_[event_handle], i, ethosu_pmu_counter_end[i]);

            event_counters[i] += ethosu_pmu_counter_end[i];
        }
        ethosu_release_driver(ethosu_drv);
        printf("%s : cycle_cnt : %" PRIu64 " cycles\n",
               tags_[event_handle],
               end_ticks_[event_handle] - start_ticks_[event_handle]);

    } else {
        end_ticks_[event_handle] = GetCurrentTimeTicks();
        printf("%s : cycle_cnt : %" PRIu64 " cycles\n",
               tags_[event_handle],
               end_ticks_[event_handle] - start_ticks_[event_handle]);
    }
}

// Sum (end tick - start tick) over every event currently held in the log.
// Events that were begun but never ended still carry the placeholder end tick
// written by BeginEvent(), so they contribute a wrapped-around value.
uint64_t EthosUProfiler::GetTotalTicks() const {
    uint64_t total = 0;

    int idx = 0;
    while (idx < num_events_) {
        const uint64_t elapsed = end_ticks_[idx] - start_ticks_[idx];
        total += elapsed;
        ++idx;
    }

    return total;
}

// Print one "<tag> took <n> cycles" line per recorded event, in log order.
// Compiles to an empty function when TF_LITE_STRIP_ERROR_STRINGS is defined.
void EthosUProfiler::Log() const {
#if !defined(TF_LITE_STRIP_ERROR_STRINGS)
    int idx = 0;
    while (idx < num_events_) {
        const uint64_t elapsed = end_ticks_[idx] - start_ticks_[idx];
        printf("%s took %" PRIu64 " cycles\n", tags_[idx], elapsed);
        ++idx;
    }
#endif
}

// Choose which PMU event type each of the four event counters will track.
// The selection is only stored here; it is written to the hardware the next
// time BeginEvent() is called with the "ethos-u" tag.
void EthosUProfiler::MonitorEthosuPMUEvents(ethosu_pmu_event_type event0,
                                            ethosu_pmu_event_type event1,
                                            ethosu_pmu_event_type event2,
                                            ethosu_pmu_event_type event3) {
    const ethosu_pmu_event_type requested[] = {event0, event1, event2, event3};

    size_t slot = 0;
    for (const ethosu_pmu_event_type event : requested) {
        ethosu_pmu_cntrs[slot++] = event;
    }
}

uint32_t EthosUProfiler::GetEthosuPMUCounter(int counter) {
    return event_counters[counter];
}

} // namespace tflite