about | summary | refs | log | tree | commit | diff
path: root/arm_compute/runtime/NEON/functions/NEGEMMConvolutionLayer.h
diff options
context:
space:
mode:
author: Giorgio Arena <giorgio.arena@arm.com> 2019-11-13 17:07:13 +0000
committer: Michele Di Giorgio <michele.digiorgio@arm.com> 2019-11-13 18:05:19 +0000
commit: 7a669a87ef04ecb4c9b51ea4a10d9a16aebf3227 (patch)
tree: a1f1cd35578386b141dff519ee85496819a64921 /arm_compute/runtime/NEON/functions/NEGEMMConvolutionLayer.h
parent: 2dab2e936a41053cf260a235ac808577ae923f3e (diff)
download: ComputeLibrary-7a669a87ef04ecb4c9b51ea4a10d9a16aebf3227.tar.gz
COMPMID-2921 Performance regression on NEON Int8
Change-Id: I60ede3e8aeec678a9fb0d8d0f05a8048ab1ced7c
Signed-off-by: Giorgio Arena <giorgio.arena@arm.com>
Reviewed-on: https://review.mlplatform.org/c/2285
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Michele Di Giorgio <michele.digiorgio@arm.com>
Diffstat (limited to 'arm_compute/runtime/NEON/functions/NEGEMMConvolutionLayer.h')
-rw-r--r-- arm_compute/runtime/NEON/functions/NEGEMMConvolutionLayer.h 3
1 files changed, 2 insertions, 1 deletions
diff --git a/arm_compute/runtime/NEON/functions/NEGEMMConvolutionLayer.h b/arm_compute/runtime/NEON/functions/NEGEMMConvolutionLayer.h
index 2d4aaa495f..6452fc9249 100644
--- a/arm_compute/runtime/NEON/functions/NEGEMMConvolutionLayer.h
+++ b/arm_compute/runtime/NEON/functions/NEGEMMConvolutionLayer.h
@@ -231,13 +231,14 @@ private:
/** Static function to check if GEMM3D is supported in @ref NEGEMM or in @ref NEGEMMLowpMatrixMultiplyCore
*
* @param[in] input_info Input tensor info. Data types supported: QASYMM8/F16/F32.
+ * @param[in] weights_info Weights tensor info. Data types supported: QASYMM8/F16/F32.
* @param[in] act_info Activation layer information in case of a fused activation. Only RELU, BOUNDED_RELU and LU_BOUNDED_RELU supported.
* @param[in] gemm_3d_depth Depth of GEMM 3D
* @param[in] skip_im2col Flag which specifies if im2col has to be skipped. i.e. 1x1 convolution with NHWC data layout
*
* @return a status
*/
- static Status validate_gemm3d(const ITensorInfo *input_info, const ActivationLayerInfo &act_info, int gemm_3d_depth, bool skip_im2col);
+ static Status validate_gemm3d(const ITensorInfo *input_info, const ITensorInfo *weights_info, const ActivationLayerInfo &act_info, int gemm_3d_depth, bool skip_im2col);
private:
MemoryGroup _memory_group;