diff options
author | polwex <polwex@sortug.com> | 2025-10-05 21:56:51 +0700 |
---|---|---|
committer | polwex <polwex@sortug.com> | 2025-10-05 21:56:51 +0700 |
commit | fcedfddf00b3f994e4f4e40332ac7fc192c63244 (patch) | |
tree | 51d38e62c7bdfcc5f9a5e9435fe820c93cfc9a3d /vere/ext/gmp/gen/aarch64-macos/mpn/sublsh1_n.s |
claude is gud
Diffstat (limited to 'vere/ext/gmp/gen/aarch64-macos/mpn/sublsh1_n.s')
-rw-r--r-- | vere/ext/gmp/gen/aarch64-macos/mpn/sublsh1_n.s | 161 |
1 files changed, 161 insertions, 0 deletions
diff --git a/vere/ext/gmp/gen/aarch64-macos/mpn/sublsh1_n.s b/vere/ext/gmp/gen/aarch64-macos/mpn/sublsh1_n.s new file mode 100644 index 0000000..e3e924f --- /dev/null +++ b/vere/ext/gmp/gen/aarch64-macos/mpn/sublsh1_n.s @@ -0,0 +1,161 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + .text + .align 3 + .globl ___gmpn_sublsh1_n + +___gmpn_sublsh1_n: + lsr x6, x3, #2 + tbz x3, #0, Lbx0 + +Lbx1: ldr x5, [x1] + tbnz x3, #1, Lb11 + +Lb01: ldr x11, [x2] + cbz x6, L1 + ldp x8, x9, [x2,#8] + lsl x13, x11, #1 + subs x15, x5, x13 + str x15, [x0],#8 + sub x1, x1, #24 + sub x2, x2, #8 + b Lmid + +L1: lsl x13, x11, #1 + subs x15, x5, x13 + str x15, [x0] + lsr x0, x11, 63 + cinc x0, x0, cc + ret + +Lb11: ldr x9, [x2] + ldp x10, x11, [x2,#8]! + lsl x13, x9, #1 + subs x17, x5, x13 + str x17, [x0],#8 + sub x1, x1, #8 + cbz x6, Lend + b Ltop + +Lbx0: tbnz x3, #1, Lb10 + +Lb00: subs x11, xzr, xzr + ldp x8, x9, [x2],#-16 + sub x1, x1, #32 + b Lmid + +Lb10: subs x9, xzr, xzr + ldp x10, x11, [x2] + sub x1, x1, #16 + cbz x6, Lend + + .align 4 +Ltop: ldp x4, x5, [x1,#16] + extr x12, x10, x9, #63 + ldp x8, x9, [x2,#16] + extr x13, x11, x10, #63 + sbcs x14, x4, x12 + sbcs x15, x5, x13 + stp x14, x15, [x0],#16 +Lmid: ldp x4, x5, [x1,#32]! + extr x12, x8, x11, #63 + ldp x10, x11, [x2,#32]! + extr x13, x9, x8, #63 + sbcs x16, x4, x12 + sbcs x17, x5, x13 + stp x16, x17, [x0],#16 + sub x6, x6, #1 + cbnz x6, Ltop + +Lend: ldp x4, x5, [x1,#16] + extr x12, x10, x9, #63 + extr x13, x11, x10, #63 + sbcs x14, x4, x12 + sbcs x15, x5, x13 + stp x14, x15, [x0] + lsr x0, x11, 63 + cinc x0, x0, cc + ret + + |