about | summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
-rw-r--r-- src/runtime/CL/functions/CLDeconvolutionLayer.cpp | 6
1 file changed, 3 insertions, 3 deletions
diff --git a/src/runtime/CL/functions/CLDeconvolutionLayer.cpp b/src/runtime/CL/functions/CLDeconvolutionLayer.cpp
index e988ab0ac4..4e0d1501ba 100644
--- a/src/runtime/CL/functions/CLDeconvolutionLayer.cpp
+++ b/src/runtime/CL/functions/CLDeconvolutionLayer.cpp
@@ -178,9 +178,9 @@ DeconvolutionMethod CLDeconvolutionLayer::get_deconvolution_method(const ITensor
if (weights->dimension(idx_w) != deconv_info.stride().first ||
weights->dimension(idx_h) != deconv_info.stride().second)
{
- // We observe better performance for FP32 types only when ofm <= 16.
- // A better heuristic is required for selecting the method for FP16 data types.
- if (input->data_layout() == DataLayout::NHWC && !((input->data_type() == DataType::F32) && (ofm > 16)))
+ // We observe better performance for FP32 types only when ofm <= 16, and for FP16 only when ofm <= 32.
+ if (input->data_layout() == DataLayout::NHWC && !((input->data_type() == DataType::F32) && (ofm > 16)) &&
+ !((input->data_type() == DataType::F16) && (ofm > 32)))
{
return DeconvolutionMethod::DIRECT;
}