aboutsummaryrefslogtreecommitdiff
path: root/ethosu/vela/test/extapi/test_extapi_find_block_configs.py
diff options
context:
space:
mode:
Diffstat (limited to 'ethosu/vela/test/extapi/test_extapi_find_block_configs.py')
-rw-r--r--ethosu/vela/test/extapi/test_extapi_find_block_configs.py36
1 files changed, 36 insertions, 0 deletions
diff --git a/ethosu/vela/test/extapi/test_extapi_find_block_configs.py b/ethosu/vela/test/extapi/test_extapi_find_block_configs.py
index 07cb9cb4..a768f18d 100644
--- a/ethosu/vela/test/extapi/test_extapi_find_block_configs.py
+++ b/ethosu/vela/test/extapi/test_extapi_find_block_configs.py
@@ -61,3 +61,39 @@ def test_find_block_configs():
check_cmd0(cmds, cmd0.NPU_SET_OFM_BLK_HEIGHT_M1, op.block_config.height - 1)
check_cmd0(cmds, cmd0.NPU_SET_OFM_BLK_WIDTH_M1, op.block_config.width - 1)
check_cmd0(cmds, cmd0.NPU_SET_OFM_BLK_DEPTH_M1, op.block_config.depth - 1)
+
+
+def test_conv2d_block_height_1():
+ """Test npu_find_block_configs returns valid config in the special case of reduced ublock height (H256)."""
+ # Create a Conv2D operation
+ op = NpuConv2DOperation()
+ op.ifm = create_feature_map(
+ NpuShape3D(height=1, width=1, depth=1024),
+ 1,
+ 512,
+ quant=NpuQuantization(scale_f32=0.023528477177023888, zero_point=0),
+ )
+ op.ofm = create_feature_map(
+ NpuShape3D(height=1, width=1, depth=1001),
+ 1,
+ 0x14E40,
+ quant=NpuQuantization(scale_f32=0.16609922051429749, zero_point=66),
+ )
+ op.kernel = NpuKernel(1, 1, 1, 1, 1, 1)
+ op.padding = NpuPadding(top=0, left=0, right=0, bottom=0)
+ op.block_traversal = NpuBlockTraversal.PART_KERNEL_FIRST
+
+ # Find valid block configs
+ accelerator = NpuAccelerator.Ethos_U55_256
+ block_configs = npu_find_block_configs(op, accelerator)
+ # Select the last one
+ op.block_config = block_configs[-1]
+ # Note: the weights should be encoded with op.block_config.depth (not shown here)
+ op.weights = [NpuAddressRange(region=0, address=0, length=7696)]
+
+ # Check that generating register commands succeeds
+ cmds = npu_generate_register_command_stream([op], accelerator)
+ # Check that the selected block config was used
+ check_cmd0(cmds, cmd0.NPU_SET_OFM_BLK_HEIGHT_M1, op.block_config.height - 1)
+ check_cmd0(cmds, cmd0.NPU_SET_OFM_BLK_WIDTH_M1, op.block_config.width - 1)
+ check_cmd0(cmds, cmd0.NPU_SET_OFM_BLK_DEPTH_M1, op.block_config.depth - 1)