aboutsummaryrefslogtreecommitdiff
path: root/ethosu/vela/tensor_allocation.py
diff options
context:
space:
mode:
authorLouis Verhaard <louis.verhaard@arm.com>2020-09-15 14:05:38 +0200
committerLouis Verhaard <louis.verhaard@arm.com>2020-09-25 08:32:55 +0200
commit0b9c9a3873da3d368e184308f4f9a4c202e3fb67 (patch)
treef057bfeacd6c6323cd0e7f33cd7ec33f941b4f8d /ethosu/vela/tensor_allocation.py
parent8854dc9088586e1bb0bf2640b2289903dfa3c822 (diff)
downloadethos-u-vela-0b9c9a3873da3d368e184308f4f9a4c202e3fb67.tar.gz
MLBEDSW-2337: Intermediate feature maps in fast storage
Attempts to use fast storage for feature maps used in between cascaded passes. This is only relevant for system configurations where feature maps are by default not placed in SRAM, but there is SRAM for fast storage. Change-Id: I207b7cf32cfcb5bea3e6b93c2da1161c4af5221d Signed-off-by: Louis Verhaard <louis.verhaard@arm.com>
Diffstat (limited to 'ethosu/vela/tensor_allocation.py')
-rw-r--r--ethosu/vela/tensor_allocation.py10
1 file changed, 10 insertions, 0 deletions
diff --git a/ethosu/vela/tensor_allocation.py b/ethosu/vela/tensor_allocation.py
index d53babc3..1efcd686 100644
--- a/ethosu/vela/tensor_allocation.py
+++ b/ethosu/vela/tensor_allocation.py
@@ -128,7 +128,10 @@ def allocate_tensors(
show_minimum_possible_allocation=False,
lr_graph=None,
allocation_alignment=Tensor.AllocationQuantum,
+ max_size=None,
+ dry_test=False,
):
+ # Allocates addresses to tensors, returns False if tensors could not be fit within max_size
ignore_subgraph_input_output_tensors = False
lrs = live_range.extract_live_ranges_from_cascaded_passes(
sg,
@@ -149,6 +152,12 @@ def allocate_tensors(
total_sz = linear_allocate_live_ranges(lrs, allocation_alignment)
else:
assert 0
+ alloc_ok = max_size is None or total_sz <= max_size
+ if dry_test or not alloc_ok:
+ # Dry test or allocation failed; undo allocation
+ for lr in lrs.ranges.values():
+ lr.set_address(None)
+ return alloc_ok
if sg.memory_used.get(mem_area, 0) == 0:
sg.memory_used[mem_area] = total_sz
@@ -179,3 +188,4 @@ def allocate_tensors(
nng.bits_per_element[mem_area] = nng.total_size[mem_area] * 8 / nng.total_elements[mem_area]
except ZeroDivisionError:
nng.bits_per_element[mem_area] = 0.0
+ return True