about summary refs log tree commit diff
path: root/ethosu/vela
diff options
context:
space:
mode:
Diffstat (limited to 'ethosu/vela')
-rw-r--r-- ethosu/vela/npu_performance.py 6
1 files changed, 6 insertions, 0 deletions
diff --git a/ethosu/vela/npu_performance.py b/ethosu/vela/npu_performance.py
index b1dae4e0..5c61c7db 100644
--- a/ethosu/vela/npu_performance.py
+++ b/ethosu/vela/npu_performance.py
@@ -708,11 +708,17 @@ def estimate_full_op_performance(
bw = access.const_read[0] * bandwidth_compression_scale_approx
bws[query.const_memory_area][TensorPurpose.Weights][BandwidthDirection.Read] += bw
+ if not cost.buffered_weight_tensor:
+ scaled_bws[query.const_memory_area][TensorPurpose.Weights][BandwidthDirection.Read] += bw
+
if access.const_read[1] > 0:
# Scales & biases
bw = access.const_read[1] * op.parent_op.bias.element_size()
bws[query.const_memory_area][TensorPurpose.FSBias][BandwidthDirection.Read] += bw
+ if not cost.buffered_weight_tensor:
+ scaled_bws[query.const_memory_area][TensorPurpose.FSBias][BandwidthDirection.Read] += bw
+
update_summary_cycles(arch, scaled_bws, cycles_a)
return bws, macs, cycles_a