COMPMID-784: Added support for biases in WinogradLayer.

1) Updated to the latest code from the RSH repo. 2) Moved winograd transforms into kernels. 3) Added support for biases Change-Id: I7f39f34a599b49d7d9b549cc10a4f4d4a8007ab8 Reviewed-on: https://eu-gerrit-1.euhpc.arm.com/117474 Tested-by: Jenkins <bsgcomp@arm.com> Reviewed-by: Anthony Barbier <anthony.barbier@arm.com>
author: Pablo Tello <pablo.tello@arm.com> 2018-01-23 09:36:04 +0000
committer: Anthony Barbier <anthony.barbier@arm.com> 2018-11-02 16:45:00 +0000
commit: d6ca478a7e410f8f529c2e505305b46d9fe21a9b (patch)
tree: 5c50c06e07f812890f127b1c4933996987f74f17 /src/core/NEON/kernels/winograd/winograd_gemm.cpp
parent: d05dce46a14a7b67f322328ecd95bf96bdd30bae (diff)
download: ComputeLibrary-d6ca478a7e410f8f529c2e505305b46d9fe21a9b.tar.gz
1 files changed, 11 insertions, 2 deletions
diff --git a/src/core/NEON/kernels/winograd/winograd_gemm.cpp b/src/core/NEON/kernels/winograd/winograd_gemm.cpp
index b44a45367f..fcfa635232 100644
--- a/src/core/NEON/kernels/winograd/winograd_gemm.cpp
+++ b/src/core/NEON/kernels/winograd/winograd_gemm.cpp
@@ -372,6 +372,7 @@ void WinogradGEMM<output_tile_rows, output_tile_cols, kernel_rows, kernel_cols>:
 Convolution<TOut, TIn>::execute(
   TOut* const output,
   const TIn* const input,
+  const TOut* const biases,
   void *working_space,
   const int n_threads
 )
@@ -479,7 +480,11 @@ Convolution<TOut, TIn>::execute(
     kernel_matrices[0],
     output_matrices[0]
   );
-  gemms.run(0, gemms.get_window());
+  for (unsigned int i = 0; i < gemms.get_window(); i++)
+  {
+    auto run_gemm = [&] () { gemms.run(i, i+1); };
+    prof("GEMM", run_gemm, 0, 0, 0);
+  }
 
   // If the output tensor needs to be in NCHW form then store the NHWC output
   // tensor in temporary storage and then reorder. If the output tensor needs
@@ -498,6 +503,7 @@ Convolution<TOut, TIn>::execute(
     output_matrices[0],
     out_matrix_stride_bytes / sizeof(TOut),
     out_matrix_row_stride,
+    biases,
     output_nhwc,
     output_shape.n_batches,
     output_shape.n_rows,
@@ -548,13 +554,16 @@ void WinogradGEMM<output_tile_rows, output_tile_cols, kernel_rows, kernel_cols>:
 Convolution<TOut, TIn>::execute(
   TOut* const output,
   const TIn* const input,
+  const TOut* const biases,
   const int n_threads
 )
 {
-  execute(output, input, NULL, n_threads);
+  execute(output, input, biases, NULL, n_threads);
 }
 
 
 // Instantiate required implementations
 template class WinogradGEMM<2, 2, 3, 3>::Convolution<float, float>;
 template class WinogradGEMM<4, 4, 3, 3>::Convolution<float, float>;
+
+template class WinogradGEMM<2, 2, 5, 5>::Convolution<float, float>;
author	Pablo Tello <pablo.tello@arm.com>	2018-01-23 09:36:04 +0000
committer	Anthony Barbier <anthony.barbier@arm.com>	2018-11-02 16:45:00 +0000
commit	d6ca478a7e410f8f529c2e505305b46d9fe21a9b (patch)
tree	5c50c06e07f812890f127b1c4933996987f74f17 /src/core/NEON/kernels/winograd/winograd_gemm.cpp
parent	d05dce46a14a7b67f322328ecd95bf96bdd30bae (diff)
download	ComputeLibrary-d6ca478a7e410f8f529c2e505305b46d9fe21a9b.tar.gz