/* * Copyright (c) 2019-2021 Arm Limited. All rights reserved. * * SPDX-License-Identifier: Apache-2.0 * * Licensed under the Apache License, Version 2.0 (the License); you may * not use this file except in compliance with the License. * You may obtain a copy of the License at * * www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an AS IS BASIS, WITHOUT * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ /****************************************************************************** * Includes ******************************************************************************/ #include "ethosu_driver.h" #include "ethosu_common.h" #include "ethosu_config.h" #include "ethosu_device.h" #include "ethosu_log.h" #include #include #include #include #include #include #include /****************************************************************************** * Defines ******************************************************************************/ #define MACS_PER_CYCLE_LOG2_MASK 0x000F #define SHRAM_SIZE_MASK 0xFF00 #define SHRAM_SIZE_RIGHT_SHIFT 8 #define BYTES_IN_32_BITS 4 #define CUSTOM_OPTION_LENGTH_32_BIT_WORD 1 #define DRIVER_ACTION_LENGTH_32_BIT_WORD 1 #define OPTIMIZER_CONFIG_LENGTH_32_BIT_WORD 2 #define ETHOSU_FOURCC ('1' << 24 | 'P' << 16 | 'O' << 8 | 'C') // "Custom Operator Payload 1" #define APB_START_ADDR_MASK 0x0FFF #define APB_NUM_REG_BIT_SHIFT 12 #define BYTES_1KB 1024 #define PRODUCT_MAJOR_ETHOSU55 (4) #define MASK_16_BYTE_ALIGN (0xF) #define FAST_MEMORY_BASE_ADDR_INDEX 2 /****************************************************************************** * Types ******************************************************************************/ // Driver actions enum DRIVER_ACTION_e { RESERVED = 0, OPTIMIZER_CONFIG = 1, COMMAND_STREAM = 2, READ_APB_REG = 3, DUMP_SHRAM = 4, NOP = 5, }; // Custom data struct struct custom_data_s { union { // Driver action data struct { // Driver action command (valid values in DRIVER_ACTION_e) uint8_t driver_action_command; // reserved uint8_t reserved; // Driver action data union { // DA_CMD_OPT_CFG struct { uint16_t rel_nbr : 4; uint16_t patch_nbr : 4; uint16_t opt_cfg_reserved : 8; }; // DA_CMD_CMSTRM struct { uint16_t length; }; // DA_CMD_READAPB struct { uint16_t start_address : 12; uint16_t nbr_reg_minus1 : 4; }; uint16_t driver_action_data; }; }; uint32_t word; }; }; // optimizer config struct struct opt_cfg_s { struct custom_data_s da_data; union { struct { uint32_t macs_per_cc : 4; uint32_t cmd_stream_version : 4; uint32_t shram_size : 8; uint32_t reserved0 : 11; uint32_t custom_dma : 1; uint32_t product : 4; }; uint32_t npu_cfg; }; union { struct { uint32_t version_status : 4; uint32_t version_minor : 4; uint32_t version_major : 4; uint32_t product_major : 4; uint32_t arch_patch_rev : 4; uint32_t arch_minor_rev : 8; uint32_t arch_major_rev : 4; }; uint32_t ethosu_id; }; }; /****************************************************************************** * Variables ******************************************************************************/ // Registered drivers linked list HEAD static struct ethosu_driver *registered_drivers = NULL; /****************************************************************************** * Weak functions - Cache * * Default NOP operations. Override if available on the targeted device. ******************************************************************************/ /* * Flush/clean the data cache by address and size. Passing NULL as p argument * expects the whole cache to be flushed. */ void __attribute__((weak)) ethosu_flush_dcache(uint32_t *p, size_t bytes) { UNUSED(p); UNUSED(bytes); } /* * Invalidate the data cache by address and size. Passing NULL as p argument * expects the whole cache to be invalidated. */ void __attribute__((weak)) ethosu_invalidate_dcache(uint32_t *p, size_t bytes) { UNUSED(p); UNUSED(bytes); } /****************************************************************************** * Weak functions - Semaphore/Mutex for multi NPU * * Following section handles the minimal sempahore and mutex implementation in * case of baremetal applications. Weak symbols will be overridden by RTOS * definitions and implement true thread-safety (in application layer). ******************************************************************************/ struct ethosu_semaphore_t { int count; }; static void *ethosu_mutex; static void *ethosu_semaphore; void *__attribute__((weak)) ethosu_mutex_create(void) { return NULL; } void __attribute__((weak)) ethosu_mutex_lock(void *mutex) { UNUSED(mutex); } void __attribute__((weak)) ethosu_mutex_unlock(void *mutex) { UNUSED(mutex); } // Baremetal implementation of creating a semaphore void *__attribute__((weak)) ethosu_semaphore_create(void) { struct ethosu_semaphore_t *sem = malloc(sizeof(*sem)); sem->count = 1; return sem; } // Baremetal simulation of waiting/sleeping for and then taking a semaphore using intrisics void __attribute__((weak)) ethosu_semaphore_take(void *sem) { struct ethosu_semaphore_t *s = sem; while (s->count <= 0) { __WFE(); } s->count--; } // Baremetal simulation of giving a semaphore and waking up processes using intrinsics void __attribute__((weak)) ethosu_semaphore_give(void *sem) { struct ethosu_semaphore_t *s = sem; s->count++; __SEV(); } /****************************************************************************** * Weak functions - Inference begin/end callbacks ******************************************************************************/ void __attribute__((weak)) ethosu_inference_begin(struct ethosu_driver *drv, const void *inference_data) { UNUSED(inference_data); UNUSED(drv); } void __attribute__((weak)) ethosu_inference_end(struct ethosu_driver *drv, const void *inference_data) { UNUSED(inference_data); UNUSED(drv); } /****************************************************************************** * Static functions ******************************************************************************/ static inline void wait_for_irq(struct ethosu_driver *drv) { while (1) { if (drv->irq_triggered || drv->abort_inference) { drv->irq_triggered = false; break; } ethosu_semaphore_take(drv->semaphore); } } static void npu_axi_init(struct ethosu_driver *drv) { ethosu_dev_set_qconfig(&drv->dev, NPU_QCONFIG); ethosu_dev_set_regioncfg(&drv->dev, 0, NPU_REGIONCFG_0); ethosu_dev_set_regioncfg(&drv->dev, 1, NPU_REGIONCFG_1); ethosu_dev_set_regioncfg(&drv->dev, 2, NPU_REGIONCFG_2); ethosu_dev_set_regioncfg(&drv->dev, 3, NPU_REGIONCFG_3); ethosu_dev_set_regioncfg(&drv->dev, 4, NPU_REGIONCFG_4); ethosu_dev_set_regioncfg(&drv->dev, 5, NPU_REGIONCFG_5); ethosu_dev_set_regioncfg(&drv->dev, 6, NPU_REGIONCFG_6); ethosu_dev_set_regioncfg(&drv->dev, 7, NPU_REGIONCFG_7); (void)ethosu_dev_set_axi_limit0(&drv->dev, AXI_LIMIT0_MAX_BEATS_BYTES, AXI_LIMIT0_MEM_TYPE, AXI_LIMIT0_MAX_OUTSTANDING_READS, AXI_LIMIT0_MAX_OUTSTANDING_WRITES); (void)ethosu_dev_set_axi_limit1(&drv->dev, AXI_LIMIT1_MAX_BEATS_BYTES, AXI_LIMIT1_MEM_TYPE, AXI_LIMIT1_MAX_OUTSTANDING_READS, AXI_LIMIT1_MAX_OUTSTANDING_WRITES); (void)ethosu_dev_set_axi_limit2(&drv->dev, AXI_LIMIT2_MAX_BEATS_BYTES, AXI_LIMIT2_MEM_TYPE, AXI_LIMIT2_MAX_OUTSTANDING_READS, AXI_LIMIT2_MAX_OUTSTANDING_WRITES); (void)ethosu_dev_set_axi_limit3(&drv->dev, AXI_LIMIT3_MAX_BEATS_BYTES, AXI_LIMIT3_MEM_TYPE, AXI_LIMIT3_MAX_OUTSTANDING_READS, AXI_LIMIT3_MAX_OUTSTANDING_WRITES); } static void ethosu_register_driver(struct ethosu_driver *drv) { // Register driver as new HEAD of list drv->next = registered_drivers; registered_drivers = drv; LOG_INFO("New NPU driver registered (handle: 0x%p, NPU: 0x%x)\n", drv, drv->dev.base_address); } static int ethosu_deregister_driver(struct ethosu_driver *drv) { struct ethosu_driver *cur = registered_drivers; struct ethosu_driver **prev = ®istered_drivers; while (cur != NULL) { if (cur == drv) { *prev = cur->next; LOG_INFO("NPU driver handle %p deregistered.\n", drv); return 0; } prev = &cur->next; cur = cur->next; } LOG_ERR("No NPU driver handle registered at address %p.\n", drv); return -1; } static struct ethosu_driver *ethosu_find_and_reserve_driver(void) { struct ethosu_driver *drv = registered_drivers; while (drv != NULL) { if (!drv->reserved) { drv->reserved = true; LOG_DEBUG("NPU driver handle %p reserved.\n", drv); return drv; } drv = drv->next; } LOG_DEBUG("No NPU driver handle available.\n", drv); return NULL; } static int ethosu_soft_reset_and_restore(struct ethosu_driver *drv) { if (ETHOSU_SUCCESS != ethosu_dev_soft_reset(&drv->dev)) { return -1; } set_clock_and_power_request(drv, ETHOSU_INFERENCE_REQUEST, ETHOSU_CLOCK_Q_ENABLE, ETHOSU_POWER_Q_DISABLE); npu_axi_init(drv); ethosu_dev_restore_pmu_config(&drv->dev); return 0; } static int handle_optimizer_config(struct ethosu_driver *drv, struct opt_cfg_s *opt_cfg_p) { struct ethosu_config cfg; struct ethosu_id id; int return_code = 0; LOG_INFO("Optimizer release nbr: %d patch: %d\n", opt_cfg_p->da_data.rel_nbr, opt_cfg_p->da_data.patch_nbr); LOG_INFO("Optimizer config cmd_stream_version: %d macs_per_cc: %d shram_size: %d custom_dma: %d\n", opt_cfg_p->cmd_stream_version, opt_cfg_p->macs_per_cc, opt_cfg_p->shram_size, opt_cfg_p->custom_dma); LOG_INFO("Optimizer config Ethos-U version: %d.%d.%d\n", opt_cfg_p->arch_major_rev, opt_cfg_p->arch_minor_rev, opt_cfg_p->arch_patch_rev); (void)ethosu_dev_get_config(&drv->dev, &cfg); (void)ethosu_dev_get_id(&drv->dev, &id); LOG_INFO("Ethos-U config cmd_stream_version: %" PRIu32 " macs_per_cc: %" PRIu32 " shram_size: %" PRIu32 " custom_dma: %" PRIu32 "\n", cfg.cmd_stream_version, cfg.macs_per_cc, cfg.shram_size, cfg.custom_dma); LOG_INFO("Ethos-U version: %" PRIu32 ".%" PRIu32 ".%" PRIu32 "\n", id.arch_major_rev, id.arch_minor_rev, id.arch_patch_rev); if ((cfg.macs_per_cc != opt_cfg_p->macs_per_cc) || (cfg.shram_size != opt_cfg_p->shram_size) || (cfg.cmd_stream_version != opt_cfg_p->cmd_stream_version) || (!cfg.custom_dma && opt_cfg_p->custom_dma)) { if (cfg.macs_per_cc != opt_cfg_p->macs_per_cc) { LOG_ERR("NPU config mismatch: npu.macs_per_cc=%" PRIu32 " optimizer.macs_per_cc=%d\n", cfg.macs_per_cc, opt_cfg_p->macs_per_cc); } if (cfg.shram_size != opt_cfg_p->shram_size) { LOG_ERR("NPU config mismatch: npu.shram_size=%" PRIu32 " optimizer.shram_size=%d\n", cfg.shram_size, opt_cfg_p->shram_size); } if (cfg.cmd_stream_version != opt_cfg_p->cmd_stream_version) { LOG_ERR("NPU config mismatch: npu.cmd_stream_version=%" PRIu32 " optimizer.cmd_stream_version=%d\n", cfg.cmd_stream_version, opt_cfg_p->cmd_stream_version); } if (!cfg.custom_dma && opt_cfg_p->custom_dma) { LOG_ERR("NPU config mismatch: npu.custom_dma=%" PRIu32 " optimize.custom_dma=%d\n", cfg.custom_dma, opt_cfg_p->custom_dma); } return_code = -1; } if ((id.arch_major_rev != opt_cfg_p->arch_major_rev) || (id.arch_minor_rev < opt_cfg_p->arch_minor_rev)) { LOG_ERR("NPU arch mismatch: npu.arch=%" PRIu32 ".%" PRIu32 ".%" PRIu32 " optimizer.arch=%d.%d.%d\n", id.arch_major_rev, id.arch_minor_rev, id.arch_patch_rev, opt_cfg_p->arch_major_rev, opt_cfg_p->arch_minor_rev, opt_cfg_p->arch_patch_rev); return_code = -1; } #if !defined(LOG_ENABLED) UNUSED(opt_cfg_p); #endif return return_code; } static int handle_command_stream(struct ethosu_driver *drv, const uint8_t *cmd_stream, const int cms_length, const uint64_t *base_addr, const size_t *base_addr_size, const int num_base_addr) { uint32_t qread = 0; uint32_t cms_bytes = cms_length * BYTES_IN_32_BITS; ptrdiff_t cmd_stream_ptr = (ptrdiff_t)cmd_stream; LOG_INFO("handle_command_stream: cmd_stream=%p, cms_length %d\n", cmd_stream, cms_length); if (0 != ((ptrdiff_t)cmd_stream & MASK_16_BYTE_ALIGN)) { LOG_ERR("Command stream addr %p not aligned to 16 bytes\n", cmd_stream); return -1; } bool base_addr_invalid = false; for (int i = 0; i < num_base_addr; i++) { if (0 != (base_addr[i] & MASK_16_BYTE_ALIGN)) { LOG_ERR("Base addr %d: 0x%llx not aligned to 16 bytes\n", i, base_addr[i]); base_addr_invalid = true; } } if (base_addr_invalid) { return -1; } /* Flush the cache if available on our CPU. * The upcasting to uin32_t* is ok since the pointer never is dereferenced. * The base_addr_size is null if invoking from prior to invoke_V2, in that case * the whole cache is being flushed. */ if (base_addr_size != NULL) { ethosu_flush_dcache((uint32_t *)cmd_stream_ptr, cms_bytes); for (int i = 0; i < num_base_addr; i++) { ethosu_flush_dcache((uint32_t *)(uintptr_t)base_addr[i], base_addr_size[i]); } } else { ethosu_flush_dcache(NULL, 0); } if (ETHOSU_SUCCESS != ethosu_dev_run_command_stream(&drv->dev, cmd_stream, cms_bytes, base_addr, num_base_addr)) { return -1; } wait_for_irq(drv); if (drv->status_error) { return -1; } if (base_addr_size != NULL) { for (int i = 0; i < num_base_addr; i++) { ethosu_invalidate_dcache((uint32_t *)(uintptr_t)base_addr[i], base_addr_size[i]); } } else { ethosu_invalidate_dcache(NULL, 0); } qread = ethosu_dev_get_qread(&drv->dev); if (qread != cms_bytes) { LOG_WARN("IRQ received but qread (%" PRIu32 ") not at end of stream (%" PRIu32 ").\n", qread, cms_bytes); return -1; } return 0; } static int read_apb_reg(struct ethosu_driver *drv, uint16_t da_data) { uint32_t *reg_p; uint32_t start_address = (uint32_t)(da_data & APB_START_ADDR_MASK); uint16_t num_reg = (da_data >> APB_NUM_REG_BIT_SHIFT) + 1; reg_p = (uint32_t *)malloc(num_reg * sizeof(uint32_t)); if (reg_p == NULL) { LOG_ERR("Memory allocation failed\n"); return -1; } if (ETHOSU_SUCCESS == ethosu_dev_read_apb_reg(&drv->dev, start_address, num_reg, reg_p)) { for (int i = 0; i < num_reg; i++) { LOG_INFO( "NPU_REG ADDR 0x%04" PRIu32 " = 0x%08" PRIu32 "\n", (start_address + (i * BYTES_IN_32_BITS)), reg_p[i]); } } else { free(reg_p); return -1; } free(reg_p); return 0; } static int dump_shram(struct ethosu_driver *drv) { struct ethosu_config cfg; uint32_t *shram_p; (void)ethosu_dev_get_config(&drv->dev, &cfg); LOG_INFO("dump_shram size = %" PRIu32 " KB\n", cfg.shram_size); shram_p = (uint32_t *)malloc(BYTES_1KB); if (shram_p == NULL) { LOG_ERR("Memory allocation failed for shram data\n"); return -1; } for (uint32_t i = 0; i < cfg.shram_size; i++) { ethosu_dev_get_shram_data(&drv->dev, i, (uint32_t *)shram_p); // Output 1KB of SHRAM LOG_INFO("***SHRAM SECTION %" PRIu32 "***\n", i); for (int j = 0; j < (BYTES_1KB / BYTES_IN_32_BITS); j++) { LOG_INFO("[0x%04" PRIx32 "] %" PRIx32 "\n", (i * 1024 + j * 4), shram_p[j]); } } free(shram_p); return 0; } /****************************************************************************** * Weak functions - Interrupt handler ******************************************************************************/ void __attribute__((weak)) ethosu_irq_handler(struct ethosu_driver *drv) { uint8_t irq_raised = 0; LOG_DEBUG( "Interrupt. status=0x%08x, qread=%d\n", ethosu_dev_get_status(&drv->dev), ethosu_dev_get_qread(&drv->dev)); // Verify that interrupt has been raised (void)ethosu_dev_is_irq_raised(&drv->dev, &irq_raised); assert(irq_raised == 1); drv->irq_triggered = true; // Clear interrupt (void)ethosu_dev_clear_irq_status(&drv->dev); // Verify that interrupt has been successfully cleared (void)ethosu_dev_is_irq_raised(&drv->dev, &irq_raised); assert(irq_raised == 0); if (ethosu_dev_status_has_error(&drv->dev)) { ethosu_soft_reset_and_restore(drv); drv->status_error = true; } ethosu_semaphore_give(drv->semaphore); } /****************************************************************************** * Functions API ******************************************************************************/ int ethosu_init(struct ethosu_driver *drv, const void *base_address, const void *fast_memory, const size_t fast_memory_size, uint32_t secure_enable, uint32_t privilege_enable) { int return_code = 0; LOG_INFO("Initializing NPU: base_address=%p, fast_memory=%p, fast_memory_size=%zu, secure=%" PRIu32 ", privileged=%" PRIu32 "\n", base_address, fast_memory, fast_memory_size, secure_enable, privilege_enable); if (!ethosu_mutex) { ethosu_mutex = ethosu_mutex_create(); } if (!ethosu_semaphore) { ethosu_semaphore = ethosu_semaphore_create(); } drv->fast_memory = (uint32_t)fast_memory; drv->fast_memory_size = fast_memory_size; drv->irq_triggered = false; drv->semaphore = ethosu_semaphore_create(); if (ETHOSU_SUCCESS != ethosu_dev_init(&drv->dev, base_address, secure_enable, privilege_enable)) { LOG_ERR("Failed to initialize Ethos-U device\n"); return -1; } if (ETHOSU_SUCCESS != set_clock_and_power_request(drv, ETHOSU_INFERENCE_REQUEST, ETHOSU_CLOCK_Q_DISABLE, ETHOSU_POWER_Q_DISABLE)) { LOG_ERR("Failed to disable clock-q & power-q for Ethos-U\n"); return -1; } if (ETHOSU_SUCCESS != ethosu_dev_soft_reset(&drv->dev)) { return -1; } if (ETHOSU_SUCCESS != ethosu_dev_wait_for_reset(&drv->dev)) { LOG_ERR("Failed reset of Ethos-U\n"); return -1; } drv->status_error = false; ethosu_register_driver(drv); return return_code; } void ethosu_deinit(struct ethosu_driver *drv) { ethosu_deregister_driver(drv); } void ethosu_get_driver_version(struct ethosu_driver_version *ver) { assert(ver != NULL); ver->major = ETHOSU_DRIVER_VERSION_MAJOR; ver->minor = ETHOSU_DRIVER_VERSION_MINOR; ver->patch = ETHOSU_DRIVER_VERSION_PATCH; } void ethosu_get_hw_info(struct ethosu_driver *drv, struct ethosu_hw_info *hw) { assert(hw != NULL); (void)ethosu_dev_get_id(&drv->dev, &hw->version); (void)ethosu_dev_get_config(&drv->dev, &hw->cfg); } int ethosu_invoke(struct ethosu_driver *drv, const void *custom_data_ptr, const int custom_data_size, const uint64_t *base_addr, const size_t *base_addr_size, const int num_base_addr) { const struct custom_data_s *data_ptr = custom_data_ptr; const struct custom_data_s *data_end = custom_data_ptr + custom_data_size; int return_code = 0; // First word in custom_data_ptr should contain "Custom Operator Payload 1" if (data_ptr->word != ETHOSU_FOURCC) { LOG_ERR("Custom Operator Payload: %" PRIu32 " is not correct, expected %x\n", data_ptr->word, ETHOSU_FOURCC); return -1; } // Custom data length must be a multiple of 32 bits if ((custom_data_size % BYTES_IN_32_BITS) != 0) { LOG_ERR("custom_data_size=0x%x not a multiple of 4\n", custom_data_size); return -1; } ++data_ptr; // Adjust base address to fast memory area if (drv->fast_memory != 0 && num_base_addr >= FAST_MEMORY_BASE_ADDR_INDEX) { uint64_t *fast_memory = (uint64_t *)&base_addr[FAST_MEMORY_BASE_ADDR_INDEX]; if (base_addr_size != NULL && base_addr_size[FAST_MEMORY_BASE_ADDR_INDEX] > drv->fast_memory_size) { LOG_ERR("Fast memory area too small. fast_memory_size=%u, base_addr_size=%u\n", drv->fast_memory_size, base_addr_size[FAST_MEMORY_BASE_ADDR_INDEX]); return -1; } *fast_memory = drv->fast_memory; } if (!drv->dev_power_always_on) { // Only soft reset if security state or privilege level needs changing if (ethosu_dev_prot_has_changed(&drv->dev)) { if (ETHOSU_SUCCESS != ethosu_dev_soft_reset(&drv->dev)) { return -1; } } drv->status_error = false; set_clock_and_power_request(drv, ETHOSU_INFERENCE_REQUEST, ETHOSU_CLOCK_Q_ENABLE, ETHOSU_POWER_Q_DISABLE); ethosu_dev_restore_pmu_config(&drv->dev); npu_axi_init(drv); } drv->status_error = false; ethosu_inference_begin(drv, custom_data_ptr); while (data_ptr < data_end) { int ret = 0; switch (data_ptr->driver_action_command) { case OPTIMIZER_CONFIG: LOG_DEBUG("OPTIMIZER_CONFIG\n"); struct opt_cfg_s *opt_cfg_p = (struct opt_cfg_s *)data_ptr; ret = handle_optimizer_config(drv, opt_cfg_p); data_ptr += DRIVER_ACTION_LENGTH_32_BIT_WORD + OPTIMIZER_CONFIG_LENGTH_32_BIT_WORD; break; case COMMAND_STREAM: LOG_DEBUG("COMMAND_STREAM\n"); void *command_stream = (uint8_t *)(data_ptr) + sizeof(struct custom_data_s); int cms_length = (data_ptr->reserved << 16) | data_ptr->length; drv->abort_inference = false; // It is safe to clear this flag without atomic, because npu is not running. drv->irq_triggered = false; ret = handle_command_stream(drv, command_stream, cms_length, base_addr, base_addr_size, num_base_addr); if (return_code == -1 && drv->abort_inference) { LOG_ERR("NPU timeout. qread=%" PRIu32 "\n", ethosu_dev_get_qread(&drv->dev)); dump_shram(drv); } data_ptr += DRIVER_ACTION_LENGTH_32_BIT_WORD + cms_length; break; case READ_APB_REG: LOG_DEBUG("READ_APB_REG\n"); ret = read_apb_reg(drv, data_ptr->driver_action_data); data_ptr += DRIVER_ACTION_LENGTH_32_BIT_WORD; break; case DUMP_SHRAM: LOG_DEBUG("DUMP_SHRAM\n"); ret = dump_shram(drv); data_ptr += DRIVER_ACTION_LENGTH_32_BIT_WORD; break; case NOP: LOG_DEBUG("NOP\n"); data_ptr += DRIVER_ACTION_LENGTH_32_BIT_WORD; break; default: LOG_ERR("UNSUPPORTED driver_action_command: %d \n", data_ptr->driver_action_command); ret = -1; break; } if (ret != 0) { return_code = -1; break; } } ethosu_inference_end(drv, custom_data_ptr); if (!drv->status_error && !drv->dev_power_always_on) { ethosu_dev_save_pmu_counters(&drv->dev); set_clock_and_power_request(drv, ETHOSU_INFERENCE_REQUEST, ETHOSU_CLOCK_Q_ENABLE, ETHOSU_POWER_Q_ENABLE); } return return_code; } void ethosu_abort(struct ethosu_driver *drv) { drv->abort_inference = true; } void ethosu_set_power_mode(struct ethosu_driver *drv, bool always_on) { drv->dev_power_always_on = always_on; if (always_on) { npu_axi_init(drv); } } struct ethosu_driver *ethosu_reserve_driver(void) { struct ethosu_driver *drv = NULL; do { ethosu_mutex_lock(ethosu_mutex); drv = ethosu_find_and_reserve_driver(); ethosu_mutex_unlock(ethosu_mutex); if (drv != NULL) { break; } LOG_INFO("Waiting for NPU driver handle to become available...\n"); ethosu_semaphore_take(ethosu_semaphore); } while (1); return drv; } void ethosu_release_driver(struct ethosu_driver *drv) { ethosu_mutex_lock(ethosu_mutex); if (drv != NULL && drv->reserved) { drv->reserved = false; LOG_DEBUG("NPU driver handle %p released\n", drv); ethosu_semaphore_give(ethosu_semaphore); } ethosu_mutex_unlock(ethosu_mutex); } enum ethosu_error_codes set_clock_and_power_request(struct ethosu_driver *drv, enum ethosu_request_clients client, enum ethosu_clock_q_request clock_request, enum ethosu_power_q_request power_request) { // Set clock request bit for client if (clock_request == ETHOSU_CLOCK_Q_DISABLE) { drv->clock_request |= (1 << client); } else { drv->clock_request &= ~(1 << client); } // Get current clock request (ENABLE if both PMU and INFERENCE asks for clock request, else DISABLE) clock_request = drv->clock_request == 0 ? ETHOSU_CLOCK_Q_ENABLE : ETHOSU_CLOCK_Q_DISABLE; // Set power request bit for client if (power_request == ETHOSU_POWER_Q_DISABLE) { drv->power_request |= (1 << client); } else { drv->power_request &= ~(1 << client); } // Get current power request (ENABLE if both PMU and INFERENCE asks for power request, else DISABLE) power_request = drv->power_request == 0 ? ETHOSU_POWER_Q_ENABLE : ETHOSU_POWER_Q_DISABLE; // Set clock and power enum ethosu_error_codes ret = ethosu_dev_set_clock_and_power(&drv->dev, clock_request, power_request); return ret; }