From 4406fd6cc4abded564d3791324e1f48bdfd34273 Mon Sep 17 00:00:00 2001
From: Frank Lei
Date: Thu, 1 Feb 2018 14:47:14 +0800
Subject: APPBROWSER-391: Fix GLES COMPUTE alignment issues

APPBROWSER-402: Performance optimization for squeezenet/xray model

Change-Id: If31b186b99a6d6087164019fe94d3ac9279e3204
Reviewed-on: https://eu-gerrit-1.euhpc.arm.com/119526
Tested-by: Jenkins
Reviewed-by: Georgios Pinitas
---
 .../GLES_COMPUTE/kernels/GCNormalizePlanarYUVLayerKernel.cpp | 12 +++++++++---
 1 file changed, 9 insertions(+), 3 deletions(-)

(limited to 'src/core/GLES_COMPUTE/kernels/GCNormalizePlanarYUVLayerKernel.cpp')

diff --git a/src/core/GLES_COMPUTE/kernels/GCNormalizePlanarYUVLayerKernel.cpp b/src/core/GLES_COMPUTE/kernels/GCNormalizePlanarYUVLayerKernel.cpp
index bc9c7eb55a..fac29024e3 100644
--- a/src/core/GLES_COMPUTE/kernels/GCNormalizePlanarYUVLayerKernel.cpp
+++ b/src/core/GLES_COMPUTE/kernels/GCNormalizePlanarYUVLayerKernel.cpp
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2017 ARM Limited.
+ * Copyright (c) 2017-2018 ARM Limited.
  *
  * SPDX-License-Identifier: MIT
  *
@@ -89,6 +89,8 @@ void GCNormalizePlanarYUVLayerKernel::run(const Window &window)
 
     _kernel.use();
 
+    _output->set_needs_shifting(true);
+
     Window slice = window.first_slice_window_3D();
 
     Window slice_in;
@@ -100,15 +102,19 @@ void GCNormalizePlanarYUVLayerKernel::run(const Window &window)
     add_1D_tensor_argument(idx, _mean, 3, slice_in);
     add_1D_tensor_argument(idx, _sd, 4, slice_in);
 
+    slice_in = window.first_slice_window_3D();
+
+    slice.shift(Window::DimX, -(_output->info()->padding()).left);
+
     do
     {
         idx = 0;
-        add_3D_tensor_argument(idx, _input, 1, slice);
+        add_3D_tensor_argument(idx, _input, 1, slice_in);
         add_3D_tensor_argument(idx, _output, 2, slice);
 
         _kernel.update_shader_params();
 
         enqueue(*this, slice);
     }
-    while(window.slide_window_slice_3D(slice));
+    while(window.slide_window_slice_3D(slice) && window.slide_window_slice_3D(slice_in));
 }
-- 
cgit v1.2.1