about summary refs log tree commit diff
path: root/arm_compute
diff options
context:
space:
mode:
Diffstat (limited to 'arm_compute')
-rw-r--r-- arm_compute/runtime/NEON/functions/NEWinogradLayer.h 7
1 files changed, 5 insertions, 2 deletions
diff --git a/arm_compute/runtime/NEON/functions/NEWinogradLayer.h b/arm_compute/runtime/NEON/functions/NEWinogradLayer.h
index 27b1e84201..8010810253 100644
--- a/arm_compute/runtime/NEON/functions/NEWinogradLayer.h
+++ b/arm_compute/runtime/NEON/functions/NEWinogradLayer.h
@@ -27,6 +27,7 @@
#include "arm_compute/runtime/IFunction.h"
#include "arm_compute/core/NEON/INEKernel.h"
+#include "arm_compute/core/NEON/kernels/assembly/arm_gemm.hpp"
#include "arm_compute/core/Types.h"
#include "arm_compute/runtime/CPP/functions/CPPPermute.h"
#include "arm_compute/runtime/MemoryGroup.h"
@@ -93,8 +94,9 @@ public:
NEWinogradLayer &operator=(const NEWinogradLayer &) = delete;
private:
- MemoryGroup _memory_group;
- std::unique_ptr<INEKernel> _batched_gemm_kernel;
+ MemoryGroup _memory_group;
+ std::unique_ptr<arm_gemm::GemmCommon<float, float>> _arm_gemm;
+ std::unique_ptr<INEKernel> _gemm_kernel;
std::unique_ptr<INEKernel> _transform_input_kernel;
std::unique_ptr<INEKernel> _transform_output_kernel;
std::unique_ptr<INEKernel> _transform_weights_kernel;
@@ -109,6 +111,7 @@ private:
Tensor _input_nhwc;
Tensor _output_nhwc;
Tensor _weights_hwio;
+ Tensor _workspace;
const ITensor *_input;
const ITensor *_weights;
ITensor *_output;