/* * Copyright (c) 2019-2023 Arm Limited. * * SPDX-License-Identifier: MIT * * Permission is hereby granted, free of charge, to any person obtaining a copy * of this software and associated documentation files (the "Software"), to * deal in the Software without restriction, including without limitation the * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or * sell copies of the Software, and to permit persons to whom the Software is * furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice shall be included in all * copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE * SOFTWARE. */ #include "arm_compute/core/KernelDescriptors.h" #include "arm_compute/core/Types.h" #include "arm_compute/core/utils/misc/ShapeCalculator.h" #include "arm_compute/runtime/CL/CLTensor.h" #include "arm_compute/runtime/CL/CLTensorAllocator.h" #include "src/core/CL/kernels/CLDepthwiseConvolutionLayerNativeKernel.h" #include "tests/CL/CLAccessor.h" #include "tests/CL/Helper.h" #include "tests/PaddingCalculator.h" #include "tests/framework/Asserts.h" #include "tests/framework/Macros.h" #include "tests/framework/datasets/Datasets.h" #include "tests/validation/Validation.h" #include "tests/validation/fixtures/DepthwiseConvolutionLayerFixture.h" namespace arm_compute { namespace test { namespace validation { using framework::dataset::make; using namespace arm_compute::misc::shape_calculator; // Create function for CLDepthwiseConvolutionLayerNativeKernel using CLDepthwiseConvolutionLayerNative = CLSynthetizeFunction; // Fixture for CLDepthwiseConvolutionLayerNative template using CLDepthwiseConvolutionLayerNativeFixture = DepthwiseConvolutionLayerNativeConfigurableValidationFixture; namespace { // *INDENT-OFF* // clang-format off RelativeTolerance rel_tolerance_f32(0.001f); constexpr float abs_tolerance_f32(0.0001f); RelativeTolerance rel_tolerance_f16(half_float::half(0.01f)); constexpr float abs_tolerance_f16(0.03f); /** Width values to test - Precommit */ const auto width_values_precommit = make("width", { 1U, 33U } ); /** Width values to test - Nightly */ const auto width_values_nightly = make("width", { 53U, 47U } ); /** Height values to test - Precommit */ const auto height_values_precommit = make("height", { 19U } ); /** Height values to test - Nightly */ const auto height_values_nightly = make("height", { 39U, 43U } ); /** Channel values to test - Precommit */ const auto channel_values_precommit = make("channels", { 15U }); /** Channel values to test - Nightly */ const auto channel_values_nightly = make("channels", { 33U, 19U }); /** Channel values to test with cl_image support - Precommit */ const auto channel_values_export_to_cl_image_precommit = make("channels", { 16U }); /** Channel values to test with cl_image support - Nightly */ const auto channel_values_export_to_cl_image_nightly = make("channels", { 32U }); /** Batch values to test - Precommit */ const auto batch_values_precommit = make("batch", { 1U, 2U }); /** Batch values to test - Nightly */ const auto batch_values_nightly = make("batch", { 3U }); /** Kernel size values to test - Precommit */ const auto kernel_sz_values_precommit = make("kernel_size", { Size2D(1U, 1U), Size2D(1U, 3U), Size2D(5U, 5U) }); /** Kernel size values to test - Nightly */ const auto kernel_sz_values_nightly = make("kernel_size", { Size2D(3U, 5U), Size2D(5U, 1U), Size2D(1U, 7U), Size2D(9U, 7U) }); /** Depth multiplier values to test - All */ const auto depth_multiplier_values = make("depth_multiplier", {3U}); /** Dilation values to test - All */ const auto dilation_values = make("dilation", { Size2D(1U, 1U), Size2D(3U, 3U) }); /** Stride values to test - All */ const auto stride_values = make("stride", { Size2D(1U, 1U), Size2D(3U, 2U) }); /** Padding values to test - Precommit */ const auto padding_valid_values = make("padding_valid", { true, false }); /** Padding values to test - Nightly */ const auto padding_valid_values_nightly = make("padding_valid", { false }); /** Data layout values to test - All */ const auto data_layout_values = make("data_layout", { DataLayout::NHWC }); /** N0 values to test - Precommit */ const auto n0_values_precommit = make("N0", {2, 4}); /** N0 values to test - Nightly */ const auto n0_values_nightly = make("N0", {3, 8}); /** N0 values to test with cl_image support - Precommit */ const auto n0_values_export_to_cl_image_precommit = make("N0", {4}); /** N0 values to test with cl_image support - Nightly */ const auto n0_values_export_to_cl_image_nightly = make("N0", {8}); /** Activation values to test in precommit */ const auto act_values = make("Activation", { ActivationLayerInfo() }); const auto activations_rest = make("Activation", { ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU), ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::BOUNDED_RELU, 6.f, 0.5f), ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::LU_BOUNDED_RELU, 0.8f, -0.5f), ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::LEAKY_RELU, 0.1f), ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::SOFT_RELU), ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::ELU), ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::ABS), ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::LOGISTIC), ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::TANH), ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::SQUARE), ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::HARD_SWISH), ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::LINEAR, 2.f, 1.f), ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::GELU) }); } // namespace TEST_SUITE(CL) TEST_SUITE(DepthwiseConvolutionLayerNative) TEST_SUITE(Float) TEST_SUITE(FP32) FIXTURE_DATA_TEST_CASE_NEW(RunSmall, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::ALL, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine( width_values_precommit, height_values_precommit), channel_values_precommit), batch_values_precommit), kernel_sz_values_precommit), make("depth_multiplier", 1)), dilation_values), stride_values), padding_valid_values), make("DataType", DataType::F32)), data_layout_values), act_values), n0_values_precommit), make("ExportToCLImage", false))) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32); } FIXTURE_DATA_TEST_CASE_NEW(RunLarge, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::NIGHTLY, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine( width_values_nightly, height_values_nightly), channel_values_nightly), batch_values_nightly), kernel_sz_values_nightly), make("depth_multiplier", 1)), dilation_values), stride_values), padding_valid_values_nightly), make("DataType", DataType::F32)), data_layout_values), make("Activation", { ActivationLayerInfo() })), n0_values_nightly), make("ExportToCLImage", false))) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32); } FIXTURE_DATA_TEST_CASE_NEW(RunActivations, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::ALL, combine( make("width", { 33U } ), height_values_precommit, channel_values_precommit, make("batch", { 2U } ), make("kernel_size", { Size2D(5U, 5U) }), make("depth_multiplier", 1), make("dilation", Size2D(3U, 3U)), make("stride", Size2D(3U, 2U)), padding_valid_values_nightly, make("DataType", DataType::F32), data_layout_values, activations_rest, n0_values_precommit, make("ExportToCLImage", false))) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32); } TEST_SUITE(ExportWeightsToCLImage) FIXTURE_DATA_TEST_CASE_NEW(RunSmall, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::ALL, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine( width_values_precommit, height_values_precommit), channel_values_export_to_cl_image_precommit), batch_values_precommit), kernel_sz_values_precommit), make("depth_multiplier", 1)), dilation_values), stride_values), padding_valid_values), make("DataType", DataType::F32)), data_layout_values), act_values), n0_values_export_to_cl_image_precommit), make("ExportToCLImage", true))) { // Validate output if(_validate_output) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32); } else { ARM_COMPUTE_TEST_INFO("cl_khr_image2d_from_buffer not supported. TEST skipped"); framework::ARM_COMPUTE_PRINT_INFO(); } } FIXTURE_DATA_TEST_CASE_NEW(RunLarge, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::NIGHTLY, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine( width_values_nightly, height_values_nightly), channel_values_export_to_cl_image_nightly), batch_values_nightly), kernel_sz_values_nightly), make("depth_multiplier", 1)), dilation_values), stride_values), padding_valid_values_nightly), make("DataType", DataType::F32)), data_layout_values), make("Activation", { ActivationLayerInfo() })), n0_values_export_to_cl_image_nightly), make("ExportToCLImage", true))) { // Validate output if(_validate_output) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32); } else { ARM_COMPUTE_TEST_INFO("cl_khr_image2d_from_buffer not supported. TEST skipped"); framework::ARM_COMPUTE_PRINT_INFO(); } } TEST_SUITE_END() // ExportWeightsToCLImage TEST_SUITE_END() // FP32 TEST_SUITE(FP16) FIXTURE_DATA_TEST_CASE_NEW(RunSmall, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::ALL, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine( width_values_precommit, height_values_precommit), channel_values_precommit), batch_values_precommit), kernel_sz_values_precommit), make("depth_multiplier", 1)), dilation_values), stride_values), padding_valid_values), make("DataType", DataType::F16)), data_layout_values), act_values), n0_values_precommit), make("ExportToCLImage", false))) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f16); } FIXTURE_DATA_TEST_CASE_NEW(RunLarge, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::NIGHTLY, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine( make("width", { 47U } ), make("height", { 39U } )), make("channels", { 19U } )), batch_values_nightly), make("kernel_size", { Size2D(5U, 5U) })), make("depth_multiplier", 1)), make("dilation", { Size2D(3U, 3U) })), make("stride", { Size2D(3U, 2U) })), padding_valid_values_nightly), make("DataType", DataType::F16)), data_layout_values), make("Activation", { ActivationLayerInfo() })), n0_values_nightly), make("ExportToCLImage", false))) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f16, 0.f, abs_tolerance_f16); } FIXTURE_DATA_TEST_CASE_NEW(RunActivations, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::ALL, combine( make("width", { 33U } ), height_values_precommit, channel_values_precommit, make("batch", { 2U } ), make("kernel_size", { Size2D(5U, 5U) }), make("depth_multiplier", 4), make("dilation", Size2D(3U, 3U)), make("stride", Size2D(3U, 2U)), padding_valid_values_nightly, make("DataType", DataType::F16), data_layout_values, activations_rest, n0_values_precommit, make("ExportToCLImage", false))) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f16, 0.f, abs_tolerance_f16); } TEST_SUITE(ExportWeightsToCLImage) FIXTURE_DATA_TEST_CASE_NEW(RunSmall, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::ALL, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine( width_values_precommit, height_values_precommit), channel_values_export_to_cl_image_precommit), batch_values_precommit), kernel_sz_values_precommit), make("depth_multiplier", 1)), dilation_values), stride_values), padding_valid_values), make("DataType", DataType::F16)), data_layout_values), act_values), n0_values_export_to_cl_image_precommit), make("ExportToCLImage", true))) { // Validate output if(_validate_output) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f16, 0.f, abs_tolerance_f16); } else { ARM_COMPUTE_TEST_INFO("cl_khr_image2d_from_buffer not supported. TEST skipped"); framework::ARM_COMPUTE_PRINT_INFO(); } } FIXTURE_DATA_TEST_CASE_NEW(RunLarge, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::NIGHTLY, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine( make("width", { 47U } ), make("height", { 39U } )), channel_values_export_to_cl_image_nightly), batch_values_nightly), make("kernel_size", { Size2D(5U, 5U) })), make("depth_multiplier", 1)), make("dilation", { Size2D(3U, 3U) })), make("stride", { Size2D(3U, 2U) })), padding_valid_values_nightly), make("DataType", DataType::F16)), data_layout_values), make("Activation", { ActivationLayerInfo() })), n0_values_export_to_cl_image_nightly), make("ExportToCLImage", true))) { // Validate output if(_validate_output) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f16, 0.f, abs_tolerance_f16); } else { ARM_COMPUTE_TEST_INFO("cl_khr_image2d_from_buffer not supported. TEST skipped"); framework::ARM_COMPUTE_PRINT_INFO(); } } TEST_SUITE_END() // ExportWeightsToCLImage TEST_SUITE_END() // FP16 TEST_SUITE_END() // Float TEST_SUITE(DepthMultiplier) TEST_SUITE(Float) TEST_SUITE(FP32) FIXTURE_DATA_TEST_CASE_NEW(RunSmall, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::ALL, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine( make("width", { 33U } ), height_values_precommit), channel_values_precommit), batch_values_precommit), kernel_sz_values_precommit), depth_multiplier_values), dilation_values), stride_values), padding_valid_values), make("DataType", DataType::F32)), data_layout_values), act_values), make("N0", 1)), make("ExportToCLImage", false))) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32); } FIXTURE_DATA_TEST_CASE_NEW(RunLarge, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::NIGHTLY, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine( make("width", { 53U } ), height_values_nightly), channel_values_nightly), batch_values_nightly), kernel_sz_values_nightly), depth_multiplier_values), dilation_values), stride_values), padding_valid_values_nightly), make("DataType", DataType::F32)), data_layout_values), make("Activation", { ActivationLayerInfo() })), make("N0", 1)), make("ExportToCLImage", false))) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32); } TEST_SUITE(DepthMultiplierMultipleOfOutputChannels) FIXTURE_DATA_TEST_CASE_NEW(RunSmall, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::ALL, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine( make("width", { 33U } ), height_values_precommit), channel_values_precommit), batch_values_precommit), kernel_sz_values_precommit), make("depth_multiplier", 2)), dilation_values), stride_values), padding_valid_values), make("DataType", DataType::F32)), data_layout_values), act_values), make("N0", {2})), make("ExportToCLImage", false))) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32); } TEST_SUITE(ExportWeightsToCLImage) FIXTURE_DATA_TEST_CASE_NEW(RunSmall, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::ALL, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine( make("width", { 33U } ), height_values_precommit), channel_values_precommit), batch_values_precommit), kernel_sz_values_precommit), make("depth_multiplier", 4)), dilation_values), stride_values), padding_valid_values), make("DataType", DataType::F32)), data_layout_values), act_values), make("N0", {4})), make("ExportToCLImage", true))) { // Validate output if(_validate_output) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32); } else { ARM_COMPUTE_TEST_INFO("cl_khr_image2d_from_buffer not supported. TEST skipped"); framework::ARM_COMPUTE_PRINT_INFO(); } } TEST_SUITE_END() // ExportWeightsToCLImage TEST_SUITE_END() // DepthMultiplierMultipleOfOutputChannels TEST_SUITE_END() // FP32 TEST_SUITE(FP16) FIXTURE_DATA_TEST_CASE_NEW(RunSmall, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::ALL, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine( make("width", { 33U } ), height_values_precommit), channel_values_precommit), batch_values_precommit), kernel_sz_values_precommit), depth_multiplier_values), dilation_values), stride_values), padding_valid_values), make("DataType", DataType::F16)), data_layout_values), act_values), make("N0", 1)), make("ExportToCLImage", false))) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f16); } FIXTURE_DATA_TEST_CASE_NEW(RunLarge, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::NIGHTLY, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine( make("width", { 53U } ), height_values_nightly), channel_values_nightly), batch_values_nightly), kernel_sz_values_nightly), depth_multiplier_values), dilation_values), stride_values), padding_valid_values_nightly), make("DataType", DataType::F16)), data_layout_values), make("Activation", { ActivationLayerInfo() })), make("N0", 1)), make("ExportToCLImage", false))) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f16, 0.f, abs_tolerance_f16); } TEST_SUITE(DepthMultiplierMultipleOfOutputChannels) FIXTURE_DATA_TEST_CASE_NEW(RunSmall, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::ALL, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine( make("width", { 33U } ), height_values_precommit), channel_values_precommit), batch_values_precommit), kernel_sz_values_precommit), make("depth_multiplier", 2)), dilation_values), stride_values), padding_valid_values), make("DataType", DataType::F16)), data_layout_values), act_values), make("N0", {2})), make("ExportToCLImage", false))) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f16, 0.f, abs_tolerance_f16); } TEST_SUITE(ExportWeightsToCLImage) FIXTURE_DATA_TEST_CASE_NEW(RunSmall, CLDepthwiseConvolutionLayerNativeFixture, framework::DatasetMode::ALL, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine( make("width", { 33U } ), height_values_precommit), channel_values_precommit), batch_values_precommit), kernel_sz_values_precommit), make("depth_multiplier", 4)), dilation_values), stride_values), padding_valid_values), make("DataType", DataType::F16)), data_layout_values), act_values), make("N0", {4})), make("ExportToCLImage", true))) { // Validate output if(_validate_output) { // Validate output validate(CLAccessor(_target), _reference, rel_tolerance_f16, 0.f, abs_tolerance_f16); } else { ARM_COMPUTE_TEST_INFO("cl_khr_image2d_from_buffer not supported. TEST skipped"); framework::ARM_COMPUTE_PRINT_INFO(); } } TEST_SUITE_END() // ExportWeightsToCLImage TEST_SUITE_END() // DepthMultiplierMultipleOfOutputChannels TEST_SUITE_END() // FP16 TEST_SUITE_END() // Float TEST_SUITE_END() // DepthMultiplier TEST_SUITE_END() // DepthwiseConvolutionLayerNative TEST_SUITE_END() // CL } // namespace validation } // namespace test } // namespace arm_compute