aboutsummaryrefslogtreecommitdiff
path: root/src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp
diff options
context:
space:
mode:
author SiCong Li <sicong.li@arm.com> 2020-05-28 08:55:51 +0100
committer SiCong Li <sicong.li@arm.com> 2020-07-02 10:30:40 +0000
commit 6b6a16faa9375365d444b2a3998381b22cd6cd5b (patch)
tree 2ba7ed6275ff900b15a90690d1f2265a3dbd84ce /src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp
parent f3ad9513dd46fca1d6c5e4550286480fdbaba056 (diff)
download ComputeLibrary-6b6a16faa9375365d444b2a3998381b22cd6cd5b.tar.gz
COMPMID-3501 Modify heuristics for f16+fastmath NEON Winograd Conv
* Disable winograd on certain layers of squeezenet v1.1
* Fix winograd validate_kernel_3x3

Signed-off-by: SiCong Li <sicong.li@arm.com>
Change-Id: I380c6e4a0f8338056839df3c8810f726227f210f
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/3348
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Georgios Pinitas <georgios.pinitas@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp')
-rw-r--r-- src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp 2
1 files changed, 1 insertions, 1 deletions
diff --git a/src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp b/src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp
index a74e710c62..88d8a7573f 100644
--- a/src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp
+++ b/src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp
@@ -62,7 +62,7 @@ inline Status validate_kernel_3x3(const Size2D input_dims, const ITensorInfo *in
}
}
#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
- else if(input->data_type() == DataType::F32)
+ else if(input->data_type() == DataType::F16)
{
ARM_COMPUTE_RETURN_ON_ERROR((NEWinogradLayerTransformInputKernel<__fp16, 4, 4, 3, 3>::validate(input, input0, winograd_info)));
ARM_COMPUTE_RETURN_ON_ERROR((NEWinogradLayerTransformWeightsKernel<__fp16, 4, 4, 3, 3>::validate(weights, input1, winograd_info)));