diff --git a/sm4/asm_arm64.s b/sm4/asm_arm64.s index f601f7d..baaae1b 100644 --- a/sm4/asm_arm64.s +++ b/sm4/asm_arm64.s @@ -202,6 +202,10 @@ loop: MOVW.P R2, 4(R10) MOVW.P R2, -4(R11) + ADD $16, R0 + CMP $128, R0 + BNE loop + expand_end: RET @@ -299,7 +303,7 @@ loop: VEOR x.B16, t3.B16, t3.B16 ADD $16, R0 - CMP $4*32, R0 + CMP $128, R0 BNE loop VTBL FLIP_MASK.B16, [t0.B16], t0.B16 @@ -404,7 +408,7 @@ loop: VEOR x.B16, t3.B16, t3.B16 ADD $16, R0 - CMP $4*32, R0 + CMP $128, R0 BNE loop VTBL FLIP_MASK.B16, [t0.B16], t0.B16