about | summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Gian Marco Iodice <gianmarco.iodice@arm.com> 2019-06-27 16:55:51 +0100
committer: Gian Marco Iodice <gianmarco.iodice@arm.com> 2019-06-28 08:08:54 +0000
commit: 96aa6b136cbe38ff5ba924c0109d35ba85546a8d (patch)
tree: 7f766af6768738c81a72a92191ac51961d539d00
parent: fffbdbcc52ae2f30b9c51637d82e5e1f5d604e71 (diff)
download: ComputeLibrary-96aa6b136cbe38ff5ba924c0109d35ba85546a8d.tar.gz
COMPMID-2431: Add a comment to max_offset in CLDepthwiseConvolutionLayer3x3NHWCKernel
Change-Id: I4097cc3aec858beb0630254fe7a6790dfcb3d90f
Signed-off-by: Gian Marco Iodice <gianmarco.iodice@arm.com>
Reviewed-on: https://review.mlplatform.org/c/1431
Reviewed-by: Giuseppe Rossini <giuseppe.rossini@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
-rw-r--r-- src/core/CL/kernels/CLDepthwiseConvolutionLayer3x3NHWCKernel.cpp | 35
1 files changed, 35 insertions, 0 deletions
diff --git a/src/core/CL/kernels/CLDepthwiseConvolutionLayer3x3NHWCKernel.cpp b/src/core/CL/kernels/CLDepthwiseConvolutionLayer3x3NHWCKernel.cpp
index 779cf25fdf..c78ad1a5b5 100644
--- a/src/core/CL/kernels/CLDepthwiseConvolutionLayer3x3NHWCKernel.cpp
+++ b/src/core/CL/kernels/CLDepthwiseConvolutionLayer3x3NHWCKernel.cpp
@@ -343,6 +343,41 @@ void CLDepthwiseConvolutionLayer3x3NHWCKernel::run(const Window &window, cl::Com
add_1D_tensor_argument(idx, _biases, win_biases);
}
+ // Calculate the max_offset.
+ // max_offset is the offset for the last NOT valid value in the Z dimension (spatial dimension Y for NHWC)
+ // |******************|
+ // | pad_top |
+ // |******************|
+ // | |
+ // | plane0 |
+ // | batch0 |
+ // |__________________|
+ // |******************| Batch 0
+ // | pad_bottom |
+ // | pad_top |
+ // |******************|
+ // | |
+ // | plane1 |
+ // | batch0 |
+ // |__________________|-----> max_offset
+ // |******************|
+ // | pad_bottom |
+ // | pad_top |
+ // |******************|
+ // | |
+ // | plane0 |
+ // | batch1 |
+ // |__________________|
+ // |******************| Batch 1
+ // | pad_bottom |
+ // | pad_top |
+ // |******************|
+ // | |
+ // | plane1 |
+ // | batch1 |
+ // |__________________|
+ // | pad_bottom |
+ // |******************|
const int max_offset = _input->info()->strides_in_bytes().z() * _input->info()->dimension(2) - (_input->info()->padding().bottom + _input->info()->padding().top) *
_input->info()->strides_in_bytes().y();
_kernel.setArg(idx, max_offset);