From 6b6a16faa9375365d444b2a3998381b22cd6cd5b Mon Sep 17 00:00:00 2001 From: SiCong Li Date: Thu, 28 May 2020 08:55:51 +0100 Subject: COMPMID-3501 Modify heuristics for f16+fastmath NEON Winograd Conv * Disable winograd on certain layers of squeezenet v1.1 * Fix winograd validate_kernel_3x3 Signed-off-by: SiCong Li Change-Id: I380c6e4a0f8338056839df3c8810f726227f210f Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/3348 Tested-by: Arm Jenkins Reviewed-by: Georgios Pinitas Comments-Addressed: Arm Jenkins --- src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) (limited to 'src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp') diff --git a/src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp b/src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp index a74e710c62..88d8a7573f 100644 --- a/src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp +++ b/src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp @@ -62,7 +62,7 @@ inline Status validate_kernel_3x3(const Size2D input_dims, const ITensorInfo *in } } #ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC - else if(input->data_type() == DataType::F32) + else if(input->data_type() == DataType::F16) { ARM_COMPUTE_RETURN_ON_ERROR((NEWinogradLayerTransformInputKernel<__fp16, 4, 4, 3, 3>::validate(input, input0, winograd_info))); ARM_COMPUTE_RETURN_ON_ERROR((NEWinogradLayerTransformWeightsKernel<__fp16, 4, 4, 3, 3>::validate(weights, input1, winograd_info))); -- cgit v1.2.1