about | summary | refs | log | tree | commit | diff
path: root/ethosu/vela/test
diff options
context:
space:
mode:
author: Louis Verhaard <louis.verhaard@arm.com> 2020-11-25 14:10:30 +0100
committer: Louis Verhaard <louis.verhaard@arm.com> 2020-11-26 08:13:50 +0100
commit: 933f55ea6f686d0cf390f4767e87a391686c3df8 (patch)
tree: 370321021ef2553df76e6e46b127cac07ec9d8be /ethosu/vela/test
parent: 34b9dc15b27219bd6485eb5104506d647e1f6d29 (diff)
download: ethos-u-vela-933f55ea6f686d0cf390f4767e87a391686c3df8.tar.gz
MLBEDSW-3599: Added API for finding block configs
Added public API function npu_find_block_configs.
Change-Id: Ib0925a62d7c5d19a9b9fbd8d808943c2ea2df02f
Signed-off-by: Louis Verhaard <louis.verhaard@arm.com>
Diffstat (limited to 'ethosu/vela/test')
-rw-r--r-- ethosu/vela/test/extapi/test_extapi_find_block_configs.py | 63
-rw-r--r-- ethosu/vela/test/extapi/test_extapi_generate_commands.py | 33
2 files changed, 73 insertions, 23 deletions
diff --git a/ethosu/vela/test/extapi/test_extapi_find_block_configs.py b/ethosu/vela/test/extapi/test_extapi_find_block_configs.py
new file mode 100644
index 00000000..07cb9cb4
--- /dev/null
+++ b/ethosu/vela/test/extapi/test_extapi_find_block_configs.py
@@ -0,0 +1,63 @@
+# Copyright (C) 2020 Arm Limited or its affiliates. All rights reserved.
+#
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the License); you may
+# not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an AS IS BASIS, WITHOUT
+# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+# Description:
+# Contains unit tests for npu_find_block_configs API for an external consumer
+from ethosu.vela.api import npu_find_block_configs
+from ethosu.vela.api import npu_generate_register_command_stream
+from ethosu.vela.api import NpuAccelerator
+from ethosu.vela.api import NpuAddressRange
+from ethosu.vela.api import NpuBlockTraversal
+from ethosu.vela.api import NpuConv2DOperation
+from ethosu.vela.api import NpuKernel
+from ethosu.vela.api import NpuPadding
+from ethosu.vela.api import NpuQuantization
+from ethosu.vela.api import NpuShape3D
+from ethosu.vela.ethos_u55_regs.ethos_u55_regs import cmd0
+from ethosu.vela.test.extapi.test_extapi_generate_commands import check_cmd0
+from ethosu.vela.test.extapi.test_extapi_generate_commands import create_feature_map
+
+
+def test_find_block_configs():
+ """Tests npu_find_block_configs"""
+ # Create a Conv2D operation (30x62x46 IFM, 30x31x46 OFM) to query block configs for
+ op = NpuConv2DOperation()
+ op.ifm = create_feature_map(
+ NpuShape3D(height=30, width=62, depth=46), 1, 512, quant=NpuQuantization(scale_f32=0.007843138, zero_point=128)
+ )
+ op.ofm = create_feature_map(
+ NpuShape3D(height=30, width=31, depth=46),
+ 1,
+ 0x14E40,
+ quant=NpuQuantization(scale_f32=0.20392157, zero_point=128),
+ )
+ op.kernel = NpuKernel(3, 2, 2, 1)
+ op.biases = [NpuAddressRange(region=0, address=32000, length=464)]
+ op.padding = NpuPadding(top=0, left=0, right=1, bottom=1)
+ op.block_traversal = NpuBlockTraversal.PART_KERNEL_FIRST
+ # Find valid block configs for this operation on the Ethos-U55-256 accelerator
+ accelerator = NpuAccelerator.Ethos_U55_256
+ block_configs = npu_find_block_configs(op, accelerator)
+ # Select the last entry of the returned list as the block config to use
+ op.block_config = block_configs[-1]
+ # Note: the weights should be encoded with op.block_config.depth (not shown here); a fixed address range stands in
+ op.weights = [NpuAddressRange(region=0, address=0, length=7696)]
+ # Generate register commands with the selected block config; an exception raised here fails the test
+ cmds = npu_generate_register_command_stream([op], accelerator)
+ # Check that the selected block config was used: each *_M1 register is compared against the dimension minus one
+ check_cmd0(cmds, cmd0.NPU_SET_OFM_BLK_HEIGHT_M1, op.block_config.height - 1)
+ check_cmd0(cmds, cmd0.NPU_SET_OFM_BLK_WIDTH_M1, op.block_config.width - 1)
+ check_cmd0(cmds, cmd0.NPU_SET_OFM_BLK_DEPTH_M1, op.block_config.depth - 1)
diff --git a/ethosu/vela/test/extapi/test_extapi_generate_commands.py b/ethosu/vela/test/extapi/test_extapi_generate_commands.py
index 86ef804a..812991a9 100644
--- a/ethosu/vela/test/extapi/test_extapi_generate_commands.py
+++ b/ethosu/vela/test/extapi/test_extapi_generate_commands.py
@@ -16,6 +16,7 @@
#
# Description:
# Contains unit tests for npu_generate_register_command_stream API for an external consumer
+from ethosu.vela.api import npu_find_block_configs
from ethosu.vela.api import npu_generate_register_command_stream
from ethosu.vela.api import NpuAccelerator
from ethosu.vela.api import NpuActivation
@@ -106,9 +107,7 @@ def test_conv2d():
op.biases = [NpuAddressRange(region=0, address=32000, length=464)]
op.padding = NpuPadding(top=0, left=0, right=1, bottom=1)
op.block_traversal = NpuBlockTraversal.PART_KERNEL_FIRST
- # In this example we assume that the weights were compressed with ofm depth 16;
- # let vela choose suitable block width and height by setting these to -1
- op.block_config = NpuShape3D(height=-1, width=-1, depth=16)
+ op.block_config = NpuShape3D(height=16, width=4, depth=16)
cmds = npu_generate_register_command_stream([op], NpuAccelerator.Ethos_U55_128)
check_cmd0(cmds, cmd0.NPU_SET_IFM_REGION, 1)
check_cmd1(cmds, cmd1.NPU_SET_IFM_BASE0, 512)
@@ -165,12 +164,6 @@ def test_conv2d():
check_cmd0(cmds, cmd0.NPU_SET_ACC_FORMAT, 0)
check_cmd0(cmds, cmd0.NPU_SET_BLOCKDEP, 0)
check_cmd0(cmds, cmd0.NPU_OP_CONV, 0)
- # Check that block width/height were generated that fit
- blk_height = find_cmd0(cmds, cmd0.NPU_SET_OFM_BLK_HEIGHT_M1)
- blk_width = find_cmd0(cmds, cmd0.NPU_SET_OFM_BLK_WIDTH_M1)
- assert blk_height > 0
- assert blk_width > 0
- assert (blk_height + 1) * (blk_width + 1) <= 64
def create_fully_connected_op() -> NpuConv2DOperation:
@@ -194,9 +187,7 @@ def create_fully_connected_op() -> NpuConv2DOperation:
op.biases = [NpuAddressRange(region=0, address=0x19BC0, length=960)]
op.padding = NpuPadding(top=0, left=0, right=0, bottom=0)
op.block_traversal = NpuBlockTraversal.DEPTH_FIRST
- # In this example we assume that the weights were compressed with ofm depth 96;
- # let vela choose suitable block width and height by setting these to -1
- op.block_config = NpuShape3D(height=-1, width=-1, depth=96)
+ op.block_config = NpuShape3D(height=2, width=4, depth=96)
return op
@@ -222,7 +213,7 @@ def test_depthwise():
op.padding = NpuPadding(top=1, left=1, right=1, bottom=1)
op.weights = [weights_dest]
op.biases = [NpuAddressRange(region=0, address=0, length=80)]
- op.block_config = NpuShape3D(height=-1, width=-1, depth=8)
+ op.block_config = NpuShape3D(height=8, width=12, depth=8)
cmds = npu_generate_register_command_stream([dma_op, op], NpuAccelerator.Ethos_U55_128)
check_cmd0(cmds, cmd0.NPU_SET_DMA0_SRC_REGION, 0)
check_cmd1(cmds, cmd1.NPU_SET_DMA0_SRC, 0x40)
@@ -233,10 +224,6 @@ def test_depthwise():
# A DMA WAIT should have been inserted
check_cmd0(cmds, cmd0.NPU_OP_DMA_WAIT, 0)
check_cmd0(cmds, cmd0.NPU_OP_DEPTHWISE, 0)
- blk_height = find_cmd0(cmds, cmd0.NPU_SET_OFM_BLK_HEIGHT_M1)
- blk_width = find_cmd0(cmds, cmd0.NPU_SET_OFM_BLK_WIDTH_M1)
- assert blk_height > 0
- assert blk_width > 0
def test_mul_with_broadcast_and_relu():
@@ -247,8 +234,10 @@ def test_mul_with_broadcast_and_relu():
op.ofm = create_feature_map(NpuShape3D(height=31, width=22, depth=31), 1, 0x52C0)
op.activation = NpuActivation(NpuActivationOp.NONE_OR_RELU)
op.activation.min = 0 # RELU
- # Do not set a block config, let vela choose one
- cmds = npu_generate_register_command_stream([op], NpuAccelerator.Ethos_U55_32)
+ accelerator = NpuAccelerator.Ethos_U55_32
+ # Select a block config using npu_find_block_configs
+ op.block_config = npu_find_block_configs(op, accelerator)[0]
+ cmds = npu_generate_register_command_stream([op], accelerator)
check_cmd1(cmds, cmd1.NPU_SET_OFM_SCALE, 1073741824, 30)
check_cmd0(cmds, cmd0.NPU_SET_IFM_REGION, 1)
check_cmd1(cmds, cmd1.NPU_SET_IFM_BASE0, 32)
@@ -298,9 +287,6 @@ def test_mul_with_broadcast_and_relu():
check_cmd0(cmds, cmd0.NPU_SET_IFM2_ZERO_POINT, 0)
check_cmd0(cmds, cmd0.NPU_SET_IFM2_PRECISION, 0)
check_cmd0(cmds, cmd0.NPU_SET_IFM2_BROADCAST, 5)
- check_cmd0(cmds, cmd0.NPU_SET_OFM_BLK_HEIGHT_M1, 23)
- check_cmd0(cmds, cmd0.NPU_SET_OFM_BLK_WIDTH_M1, 3)
- check_cmd0(cmds, cmd0.NPU_SET_OFM_BLK_DEPTH_M1, 31)
check_cmd0(cmds, cmd0.NPU_SET_IFM_IB_END, 16)
check_cmd0(cmds, cmd0.NPU_SET_AB_START, 16)
check_cmd0(cmds, cmd0.NPU_SET_IFM2_IB_START, 9)
@@ -330,7 +316,8 @@ def create_avg_pool_op() -> NpuPoolingOperation:
)
op.kernel = NpuKernel(8, 2, 3, 3)
op.padding = NpuPadding(top=0, left=2, right=3, bottom=0)
- # Do not set a block config, let vela choose one
+ # Select a block config
+ op.block_config = NpuShape3D(height=4, width=4, depth=16)
return op