about summary refs log tree commit diff
path: root/src/core/gpu/cl/kernels/ClPoolingKernel.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'src/core/gpu/cl/kernels/ClPoolingKernel.cpp')
-rw-r--r-- src/core/gpu/cl/kernels/ClPoolingKernel.cpp 4
1 files changed, 3 insertions, 1 deletions
diff --git a/src/core/gpu/cl/kernels/ClPoolingKernel.cpp b/src/core/gpu/cl/kernels/ClPoolingKernel.cpp
index 78243402bf..a432877a1d 100644
--- a/src/core/gpu/cl/kernels/ClPoolingKernel.cpp
+++ b/src/core/gpu/cl/kernels/ClPoolingKernel.cpp
@@ -173,9 +173,11 @@ std::tuple<Status, Window, ClPoolingConfig> validate_and_configure_window(ITenso
}
case DataLayout::NHWC:
{
+ const size_t vec_size = dst->data_type() == DataType::F32 ? 2 : 4;
+
// Initialize border size
border_size = BorderSize();
- num_elems_processed_per_iteration = adjust_vec_size(4, dst->dimension(0));
+ num_elems_processed_per_iteration = adjust_vec_size(vec_size, dst->dimension(0));
win = calculate_max_window(*dst, Steps(num_elems_processed_per_iteration));
break;
}