From 917959c88361e8148696c156453f69c6ae0c95c0 Mon Sep 17 00:00:00 2001
From: John Kesapides
Date: Mon, 4 Feb 2019 12:37:29 +0000
Subject: COMPMID-1281 Investigate concatenation for RNN/LSTM NEON

Change-Id: I7f099348a361a6f2d4efb30618f58bd44dd41e6c
Signed-off-by: John Kesapides
Reviewed-on: https://review.mlplatform.org/c/712
Reviewed-by: Giuseppe Rossini
Tested-by: Arm Jenkins
---
 arm_compute/runtime/NEON/functions/NELSTMLayer.h | 11 ++++++++---
 1 file changed, 8 insertions(+), 3 deletions(-)

(limited to 'arm_compute/runtime/NEON/functions/NELSTMLayer.h')

diff --git a/arm_compute/runtime/NEON/functions/NELSTMLayer.h b/arm_compute/runtime/NEON/functions/NELSTMLayer.h
index b98e74d969..f3a1aa7c75 100644
--- a/arm_compute/runtime/NEON/functions/NELSTMLayer.h
+++ b/arm_compute/runtime/NEON/functions/NELSTMLayer.h
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2018 ARM Limited.
+ * Copyright (c) 2018-2019 ARM Limited.
  *
  * SPDX-License-Identifier: MIT
  *
@@ -132,6 +132,7 @@ public:
 
     // Inherited methods overridden:
     void run() override;
+    void prepare() override;
 
 private:
     MemoryGroup _memory_group;
@@ -176,16 +177,20 @@ private:
     NECopyKernel _copy_cell_state;
     NECopyKernel _copy_output;
     NEWidthConcatenateLayer _concat_scratch_buffer;
+    NEWidthConcatenateLayer _concat_inputs_forget_gate;
+    NEWidthConcatenateLayer _concat_weights_forget_gate;
+    NEWidthConcatenateLayer _concat_weights_input_gate;
+    NEWidthConcatenateLayer _concat_weights_output;
     Tensor _input_gate_out1;
     Tensor _input_gate_out2;
     Tensor _input_gate_out3;
     Tensor _input_gate_out4;
-    Tensor _input_gate_out5;
     Tensor _forget_gate_out1;
     Tensor _forget_gate_out2;
     Tensor _forget_gate_out3;
     Tensor _forget_gate_out4;
     Tensor _forget_gate_out5;
+    Tensor _forget_gate_out6;
     Tensor _cell_state_out1;
     Tensor _cell_state_out2;
     Tensor _cell_state_out3;
@@ -195,7 +200,6 @@ private:
     Tensor _output2;
     Tensor _output3;
     Tensor _output4;
-    Tensor _output5;
     Tensor _cell_state_activation;
     Tensor _output_state1;
     Tensor _ones;
@@ -204,6 +208,7 @@ private:
     bool _perform_cell_clipping;
     bool _has_projection_weights;
     bool _perform_projection_clipping;
+    bool _is_prepared;
 };
 } // namespace arm_compute
 #endif /* __ARM_COMPUTE_NELSTMLAYER_H__ */
--
cgit v1.2.1