From 409ee0a69799364797263d13dd95936c851bfe80 Mon Sep 17 00:00:00 2001
From: Georgios Pinitas
Date: Fri, 18 Aug 2017 10:16:09 +0100
Subject: COMPMID-417: Add in-place support for batch-normalization.

Change-Id: I4b0c9348f3bc2addc198a76fadd1b583abf42b60
Reviewed-on: http://mpd-gerrit.cambridge.arm.com/84434
Tested-by: Kaizen
Reviewed-by: Michalis Spyrou
Reviewed-by: Gian Marco Iodice
---
 src/core/CL/cl_kernels/batchnormalization_layer.cl | 18 ++++++++++++------
 1 file changed, 12 insertions(+), 6 deletions(-)

(limited to 'src/core/CL/cl_kernels/batchnormalization_layer.cl')

diff --git a/src/core/CL/cl_kernels/batchnormalization_layer.cl b/src/core/CL/cl_kernels/batchnormalization_layer.cl
index cb4d0c8947..904d5b3045 100644
--- a/src/core/CL/cl_kernels/batchnormalization_layer.cl
+++ b/src/core/CL/cl_kernels/batchnormalization_layer.cl
@@ -80,19 +80,25 @@
  * @param[in] epsilon Epsilon parameter in the batch normalization equation
  */
 __kernel void batchnormalization_layer(TENSOR3D_DECLARATION(input),
+#ifndef IN_PLACE
                                        TENSOR3D_DECLARATION(output),
+#endif /* not IN_PLACE */
                                        VECTOR_DECLARATION(mean),
                                        VECTOR_DECLARATION(var),
                                        VECTOR_DECLARATION(beta),
                                        VECTOR_DECLARATION(gamma),
                                        float epsilon)
 {
-    Tensor3D in = CONVERT_TO_TENSOR3D_STRUCT(input);
-    Tensor3D out = CONVERT_TO_TENSOR3D_STRUCT(output);
-    Vector mean = CONVERT_TO_VECTOR_STRUCT(mean);
-    Vector var = CONVERT_TO_VECTOR_STRUCT(var);
-    Vector beta = CONVERT_TO_VECTOR_STRUCT(beta);
-    Vector gamma = CONVERT_TO_VECTOR_STRUCT(gamma);
+    Tensor3D in = CONVERT_TO_TENSOR3D_STRUCT(input);
+#ifdef IN_PLACE
+    Tensor3D out = in;
+#else /* IN_PLACE */
+    Tensor3D out = CONVERT_TO_TENSOR3D_STRUCT(output);
+#endif /* IN_PLACE */
+    Vector mean = CONVERT_TO_VECTOR_STRUCT(mean);
+    Vector var = CONVERT_TO_VECTOR_STRUCT(var);
+    Vector beta = CONVERT_TO_VECTOR_STRUCT(beta);
+    Vector gamma = CONVERT_TO_VECTOR_STRUCT(gamma);
 
     VEC_DATA_TYPE(DATA_TYPE, VEC_SIZE)
     _in = 0;
--
cgit v1.2.1