aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--src/core/CL/ICLKernel.cpp3
-rw-r--r--src/runtime/CL/functions/CLGEMM.cpp1
2 files changed, 2 insertions, 2 deletions
diff --git a/src/core/CL/ICLKernel.cpp b/src/core/CL/ICLKernel.cpp
index 7ac0fe3bbb..5bd7142176 100644
--- a/src/core/CL/ICLKernel.cpp
+++ b/src/core/CL/ICLKernel.cpp
@@ -31,7 +31,6 @@
#include "arm_compute/core/Utils.h"
#include "arm_compute/core/Validate.h"
#include "arm_compute/core/Window.h"
-#include "arm_compute/runtime/CL/CLScheduler.h"
#include <cstddef>
@@ -61,7 +60,7 @@ void arm_compute::enqueue(cl::CommandQueue &queue, ICLKernel &kernel, const Wind
}
ICLKernel::ICLKernel()
- : _kernel(nullptr), _lws_hint(cl::Range_128_1), _target(CLScheduler::get().target())
+ : _kernel(nullptr), _lws_hint(cl::Range_128_1), _target(GPUTarget::MIDGARD)
{
}
diff --git a/src/runtime/CL/functions/CLGEMM.cpp b/src/runtime/CL/functions/CLGEMM.cpp
index 7408054127..07b19421d6 100644
--- a/src/runtime/CL/functions/CLGEMM.cpp
+++ b/src/runtime/CL/functions/CLGEMM.cpp
@@ -101,6 +101,7 @@ void CLGEMM::configure(const ICLTensor *a, const ICLTensor *b, const ICLTensor *
_transpose_kernel.configure(b, &_tmp_b);
// Configure matrix multiply kernel
+ _mm_kernel.set_target(CLScheduler::get().target());
_mm_kernel.configure(&_tmp_a, &_tmp_b, output, alpha);
// Allocate intermediate tensors