From 1c772e43434bd39aad1cb2e0036dcdf67b038633 Mon Sep 17 00:00:00 2001
From: Henrik G Olsson
Date: Fri, 9 Apr 2021 10:51:33 +0200
Subject: MLBEDSW-4073 Handle elementwise ops with same tensor for both inputs

Signed-off-by: Henrik G Olsson
Change-Id: I0e6bb46b7b91ed10f5bda34fba66d8b714560f47
---
 ethosu/vela/high_level_command_stream_generator.py | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/ethosu/vela/high_level_command_stream_generator.py b/ethosu/vela/high_level_command_stream_generator.py
index aad3783d..c01790a4 100644
--- a/ethosu/vela/high_level_command_stream_generator.py
+++ b/ethosu/vela/high_level_command_stream_generator.py
@@ -46,7 +46,12 @@ def generate_high_level_command_stream_for_pass(strat, passes, block_configs, id
     npu_block_type = ps.npu_block_type
     split_offsets = list(ps.primary_op.read_offsets) # offset for [ifm, ifm2]
 
-    if ps.ifm_tensor is not None and ps.ifm2_tensor is not None and npu_block_type == NpuBlockType.ElementWise:
+    if (
+        len(ps.inputs) == 2
+        and ps.ifm_tensor is not None
+        and ps.ifm2_tensor is not None
+        and npu_block_type == NpuBlockType.ElementWise
+    ):
         # Ensure correct ifm and ifm2 order
         if ps.inputs[0] == ps.primary_op.inputs[1] and ps.inputs[1] == ps.primary_op.inputs[0]:
             ps.ifm_tensor, ps.ifm2_tensor = ps.ifm2_tensor, ps.ifm_tensor
-- 
cgit v1.2.1