Skip to content

Commit 2470882

Browse files
aniraj01 authored and EmilOhlssonARM committed
Update the register backup for kai_kernel_matmul_clamp_f32_qai8dxp1x4_qsi8cxp4vlx4_1x4vl_sme2_dot
- Following the procedure call standard, back up the callee-saved registers d8-d15 in the kai_kernel_matmul_clamp_f32_qai8dxp1x4_qsi8cxp4vlx4_1x4vl_sme2_dot asm micro-kernel.
Signed-off-by: Anitha Raj <anitha.raj@arm.com>
Approved-by: Emil Ohlsson <emil.ohlsson@arm.com>
1 parent a15b672 commit 2470882

1 file changed

Lines changed: 11 additions & 6 deletions

File tree

kai/ukernels/matmul/matmul_clamp_f32_qai8dxp_qsi8cxp/kai_matmul_clamp_f32_qai8dxp1x4_qsi8cxp4vlx4_1x4vl_sme2_dot_asm.S

Lines changed: 11 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -42,13 +42,16 @@
4242

4343
KAI_ASM_FUNCTION_TYPE(kai_kernel_matmul_clamp_f32_qai8dxp1x4_qsi8cxp4vlx4_1x4vl_sme2_dot)
4444
KAI_ASM_FUNCTION_LABEL(kai_kernel_matmul_clamp_f32_qai8dxp1x4_qsi8cxp4vlx4_1x4vl_sme2_dot)
45-
stp x19, x20, [sp, -112]!
45+
stp x19, x20, [sp, -144]!
4646
stp x21, x22, [sp, 16]
4747
stp x23, x24, [sp, 32]
4848
stp x25, x26, [sp, 48]
4949
stp x27, x28, [sp, 64]
50-
stp d12, d13, [sp, 80]
51-
stp d14, d15, [sp, 96]
50+
stp d8, d9, [sp, 80]
51+
stp d10, d11, [sp, 96]
52+
stp d12, d13, [sp, 112]
53+
stp d14, d15, [sp, 128]
54+
5255
KAI_ASM_INST(0xd503477f) // smstart
5356
ldr x16, [x0] // dst
5457
mov x11, #0x0 // =0
@@ -137,13 +140,15 @@ KAI_ASM_LABEL(label_3) // Block Loop
137140
cmp x21, x20
138141
b.lt label_1
139142
KAI_ASM_INST(0xd503467f) // smstop
140-
ldp d14, d15, [sp, 96]
141-
ldp d12, d13, [sp, 80]
143+
ldp d14, d15, [sp, 128]
144+
ldp d12, d13, [sp, 112]
145+
ldp d10, d11, [sp, 96]
146+
ldp d8, d9, [sp, 80]
142147
ldp x27, x28, [sp, 64]
143148
ldp x25, x26, [sp, 48]
144149
ldp x23, x24, [sp, 32]
145150
ldp x21, x22, [sp, 16]
146-
ldp x19, x20, [sp], 112
151+
ldp x19, x20, [sp], 144
147152
ret
148153
KAI_ASM_FUNCTION_END(kai_kernel_matmul_clamp_f32_qai8dxp1x4_qsi8cxp4vlx4_1x4vl_sme2_dot)
149154

0 commit comments

Comments
 (0)