From cfa2bba98169cb5ab1945462514be1b6badf7d98 Mon Sep 17 00:00:00 2001 From: Georgios Pinitas Date: Thu, 27 Jun 2019 17:00:52 +0100 Subject: COMPMID-2178: Update GEMM assembly code. Perform offset reduction and requantization within the assembly wrapper. Change-Id: I5d5b3e1f6f9ef4c71805362c57f88ff199c027a3 Signed-off-by: Georgios Pinitas Reviewed-on: https://review.mlplatform.org/c/1541 Comments-Addressed: Pablo Marquez Reviewed-by: Gian Marco Iodice Comments-Addressed: Arm Jenkins Tested-by: Arm Jenkins --- src/core/NEON/kernels/arm_gemm/transform.hpp | 7 +++++++ 1 file changed, 7 insertions(+) (limited to 'src/core/NEON/kernels/arm_gemm/transform.hpp') diff --git a/src/core/NEON/kernels/arm_gemm/transform.hpp b/src/core/NEON/kernels/arm_gemm/transform.hpp index 0330783a0b..d790d566b6 100644 --- a/src/core/NEON/kernels/arm_gemm/transform.hpp +++ b/src/core/NEON/kernels/arm_gemm/transform.hpp @@ -23,6 +23,10 @@ */ #pragma once +#include "utils.hpp" + +namespace arm_gemm { + /* * Generic transform. * @@ -80,6 +84,7 @@ struct TransformImpl { *out++ = static_cast<TOut>(0); } } + // "row" tail - row is out of range so fill with zeros always. TOut zeroval = static_cast<TOut>(0); int pads = blank_rows * (fill_cols + blank_cols); @@ -114,3 +119,5 @@ void Transform( /*****************************************************************************/ #include "transforms/list.hpp" + +} // namespace arm_gemm -- cgit v1.2.1