aboutsummaryrefslogtreecommitdiff
path: root/ethosu/vela/high_level_command_stream_generator.py
diff options
context:
space:
mode:
author: Fredrik Svedberg <fredrik.svedberg@arm.com> 2022-06-30 10:44:12 +0200
committer: Fredrik Svedberg <fredrik.svedberg@arm.com> 2022-07-13 15:29:38 +0000
commit: d03dc504452dbb32db383121f3dad81f4280bb3c (patch)
tree: a491e706d5d18a099116b30b8d924667ff0f7245 /ethosu/vela/high_level_command_stream_generator.py
parent: a04f2f7322e7b83d93e875313d2e5b4d0dca94fb (diff)
download: ethos-u-vela-d03dc504452dbb32db383121f3dad81f4280bb3c.tar.gz
MLBEDSW-6496 mlperf_deeplabv3_mnv2_ade20k_int8 fails at verify_output for u65
Added a check to see if additional stripe data is needed from the producer op when cascading, to make sure the stripes are not overwriting data that is still being used. Also changed the scheduler to make sure ResizeBilinear always runs with an even stripe height.

Signed-off-by: Fredrik Svedberg <fredrik.svedberg@arm.com>
Change-Id: If7d723e6be29575c2b55c400eebbe8275a1aa328
Diffstat (limited to 'ethosu/vela/high_level_command_stream_generator.py')
-rw-r--r-- ethosu/vela/high_level_command_stream_generator.py | 15
1 file changed, 8 insertions, 7 deletions
diff --git a/ethosu/vela/high_level_command_stream_generator.py b/ethosu/vela/high_level_command_stream_generator.py
index 95068081..a52bdc37 100644
--- a/ethosu/vela/high_level_command_stream_generator.py
+++ b/ethosu/vela/high_level_command_stream_generator.py
@@ -185,13 +185,14 @@ def generate_high_level_commands_for_sched_op(sched_op, schedule):
if producer_op:
assert op_info.cascade != 0
assert op_info.cascade == schedule.cost_map[producer_op].cascade
- for prev_cmd in prev_cmd_gen:
- yield prev_cmd
- if prev_cmd.is_npu_pass_command() and prev_cmd.ps == producer_op.parent_ps:
- ifm_present.end_coord = prev_cmd.ofm_box.end_coord
- if ifm_required.is_subbox_of(ifm_present):
- # There is enough IFM data - exit loop
- break
+ if not ifm_required.is_subbox_of(ifm_present):
+ for prev_cmd in prev_cmd_gen:
+ yield prev_cmd
+ if prev_cmd.is_npu_pass_command() and prev_cmd.ps == producer_op.parent_ps:
+ ifm_present.end_coord = prev_cmd.ofm_box.end_coord
+ if ifm_required.is_subbox_of(ifm_present):
+ # There is enough IFM data - exit loop
+ break
# Information about the current stripe's location in the cascade
is_first_h_stripe = ofm_box_start.height == ofm_start.height