aboutsummaryrefslogtreecommitdiff
path: root/src/core/NEON/kernels/arm_gemm/gemm_interleaved_pretransposed_2d.hpp
diff options
context:
space:
mode:
Diffstat (limited to 'src/core/NEON/kernels/arm_gemm/gemm_interleaved_pretransposed_2d.hpp')
-rw-r--r--src/core/NEON/kernels/arm_gemm/gemm_interleaved_pretransposed_2d.hpp14
1 files changed, 3 insertions, 11 deletions
diff --git a/src/core/NEON/kernels/arm_gemm/gemm_interleaved_pretransposed_2d.hpp b/src/core/NEON/kernels/arm_gemm/gemm_interleaved_pretransposed_2d.hpp
index 38fb26370c..97e16a61c1 100644
--- a/src/core/NEON/kernels/arm_gemm/gemm_interleaved_pretransposed_2d.hpp
+++ b/src/core/NEON/kernels/arm_gemm/gemm_interleaved_pretransposed_2d.hpp
@@ -62,9 +62,6 @@ class GemmInterleavedPretransposed2d : public GemmCommon<To, Tr> {
const unsigned int _nbatches;
const unsigned int _nmulti;
- const bool _trA;
- const bool _trB;
-
const Activation _act;
const int _maxthreads;
@@ -252,8 +249,7 @@ class GemmInterleavedPretransposed2d : public GemmCommon<To, Tr> {
first_m,
last_m,
current.k0(),
- current.kmax(),
- _trA);
+ current.kmax());
}
}
@@ -317,8 +313,6 @@ public:
, _Ksize(args._Ksize)
, _nbatches(args._nbatches)
, _nmulti(args._nmulti)
- , _trA(args._trA)
- , _trB(args._trB)
, _act(args._act)
, _maxthreads(args._maxthreads)
, _nthreads(args._maxthreads)
@@ -330,8 +324,6 @@ public:
, _Nround_div ( iceildiv(_Nsize, strategy::out_width()) )
, _Nround ( _Nround_div * strategy::out_width() )
{
-
- assert(args._pretransposed_hint);
assert(_maxthreads > 0);
const unsigned int L1_size = _ci->get_L1_cache_size();
@@ -411,7 +403,7 @@ public:
execute_pretranspose(m_start, m_end, n_start, n_end, threadid, m_threadid, n_threadid);
}
- std::size_t get_working_size()const override {
+ std::size_t get_working_size() const override {
/* Because we do not know how schedular will break up
* the task, we need to ensure that alloc enough
* space to be able to handle the case where every thread
@@ -493,7 +485,7 @@ public:
k_size *= strategy::k_unroll();
strat.transforms.PrepareB(buffer, B + (current.multi() * B_multi_stride), ldb,
- current.x0(), current.xmax(), current.k0(), current.kmax(), _trB);
+ current.x0(), current.xmax(), current.k0(), current.kmax());
buffer += (x_size * k_size);
} while (current.advance());