aboutsummaryrefslogtreecommitdiff
path: root/src/cpu/kernels/softmax/generic/sme2/fp32.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'src/cpu/kernels/softmax/generic/sme2/fp32.cpp')
-rw-r--r-- src/cpu/kernels/softmax/generic/sme2/fp32.cpp 8
1 file changed, 4 insertions, 4 deletions
diff --git a/src/cpu/kernels/softmax/generic/sme2/fp32.cpp b/src/cpu/kernels/softmax/generic/sme2/fp32.cpp
index e80041c812..159039a320 100644
--- a/src/cpu/kernels/softmax/generic/sme2/fp32.cpp
+++ b/src/cpu/kernels/softmax/generic/sme2/fp32.cpp
@@ -191,16 +191,16 @@ loop_1_start%=:
// Step 1: Find max
// ==================================================
+ // Loop for processing 4 vectors per iteration.
+ mov x9, #0 // x9: index
+ dup z11.s, w10 // z11: max_value = -inf
+
// ---------------------------------------------------------------- z16-z19: max_value = -inf
mov z16.d, z11.d
mov z17.d, z11.d
mov z18.d, z11.d
mov z19.d, z11.d
- // Loop for processing 4 vectors per iteration.
- mov x9, #0 // x9: index
- dup z11.s, w10 // z11: max_value = -inf
-
find_max_body_start%=:
cmp x9, x13
b.eq find_max_body_end%=