aboutsummaryrefslogtreecommitdiff
path: root/src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp
diff options
context:
space:
mode:
author: Georgios Pinitas <georgios.pinitas@arm.com>, 2018-11-22 19:38:27 +0000
committer: Georgios Pinitas <georgios.pinitas@arm.com>, 2018-11-23 14:04:27 +0000
commit: ca1250d548961f43ecf8499a78b5cc0c9609a37a (patch)
tree: 14a5ad99569819091e861595a1dc0dd592ed98be /src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp
parent: fea8ec3da3afd0aee3b9c228f46e7dbd52e7de2b (diff)
download: ComputeLibrary-ca1250d548961f43ecf8499a78b5cc0c9609a37a.tar.gz
COMPMID-1451: Fix MemoryManager usage.
- Fixes NEWinogradConvolution memory manager usage.
- Moves allocations to the prepare stage for GEMMDispatchWrapper.

Change-Id: Ic1c709ee473eb4968f5a081f2bc26960f882f8db
Diffstat (limited to 'src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp')
-rw-r--r-- src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp | 13
1 files changed, 8 insertions, 5 deletions
diff --git a/src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp b/src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp
index c8e3b3b38c..e37f8abfaf 100644
--- a/src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp
+++ b/src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp
@@ -464,6 +464,7 @@ void NEWinogradConvolutionLayer::configure(const ITensor *input, const ITensor *
transform_weights_kernel->configure(&_weights_hwio, &_kernel_storage, kernel_matrix_stride, out_channels, in_channels);
//The biases tensor has not been allocated at this point in time, the output transform will add the biases to the final result in the run() method
+ _memory_group.manage(&_output_nhwc);
transform_output_kernel->configure(biases, &_output_workspace,
output_matrix_stride, &_output_nhwc,
in_shape.n_batches, output_shape.n_rows, output_shape.n_cols, out_channels);
@@ -483,16 +484,16 @@ void NEWinogradConvolutionLayer::configure(const ITensor *input, const ITensor *
in_shape.n_batches, output_shape.n_rows, output_shape.n_cols, out_channels);
}
- _weights_hwio.allocator()->allocate();
_gemm_function.configure(&_input_workspace, &_kernel_storage, nullptr, &_output_workspace, 1.0f, 0.f);
_input_workspace.allocator()->allocate();
- _kernel_storage.allocator()->allocate();
_output_workspace.allocator()->allocate();
// Reorder the convoluted output to ACL's ordering NCHW
- _permute_output.configure(&_output_nhwc, _output, PermutationVector(1U, 2U, 0U));
-
- _output_nhwc.allocator()->allocate();
+ if(data_layout == DataLayout::NCHW)
+ {
+ _permute_output.configure(&_output_nhwc, _output, PermutationVector(1U, 2U, 0U));
+ _output_nhwc.allocator()->allocate();
+ }
_transform_input_kernel = std::move(transform_input_kernel);
_transform_weights_kernel = std::move(transform_weights_kernel);
@@ -656,10 +657,12 @@ void NEWinogradConvolutionLayer::prepare()
if(!_is_prepared)
{
// Permute weights
+ _weights_hwio.allocator()->allocate();
_permute_weights.run();
_weights->mark_as_unused();
// Transform weights
+ _kernel_storage.allocator()->allocate();
NEScheduler::get().schedule(_transform_weights_kernel.get(), Window::DimX);
_weights_hwio.allocator()->free();