summaryrefslogtreecommitdiff
path: root/vere/ext/gmp/gen/x86_64-windows/mpn/addmul_1.s
diff options
context:
space:
mode:
authorpolwex <polwex@sortug.com>2025-10-05 21:56:51 +0700
committerpolwex <polwex@sortug.com>2025-10-05 21:56:51 +0700
commitfcedfddf00b3f994e4f4e40332ac7fc192c63244 (patch)
tree51d38e62c7bdfcc5f9a5e9435fe820c93cfc9a3d /vere/ext/gmp/gen/x86_64-windows/mpn/addmul_1.s
claude is gud
Diffstat (limited to 'vere/ext/gmp/gen/x86_64-windows/mpn/addmul_1.s')
-rw-r--r--vere/ext/gmp/gen/x86_64-windows/mpn/addmul_1.s199
1 files changed, 199 insertions, 0 deletions
diff --git a/vere/ext/gmp/gen/x86_64-windows/mpn/addmul_1.s b/vere/ext/gmp/gen/x86_64-windows/mpn/addmul_1.s
new file mode 100644
index 0000000..3a2880c
--- /dev/null
+++ b/vere/ext/gmp/gen/x86_64-windows/mpn/addmul_1.s
@@ -0,0 +1,199 @@
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ .text
+ .align 16, 0x90
+ .globl __gmpn_addmul_1
+
+ .def __gmpn_addmul_1
+ .scl 2
+ .type 32
+ .endef
+__gmpn_addmul_1:
+
+
+push %rsi
+push %rdi
+mov %rdx, %rsi
+
+ mov (%rsi), %rax
+ push %rbx
+
+ mov %r8, %rbx
+ mul %r9
+
+
+ and $3, %ebx
+ jz Lb0
+ cmp $2, %ebx
+ jz Lb2
+ jg Lb3
+
+Lb1: dec %r8
+ jne Lgt1
+ add %rax, (%rcx)
+ jmp Lret
+Lgt1: lea 8(%rsi,%r8,8), %rsi
+ lea -8(%rcx,%r8,8), %rcx
+ neg %r8
+ xor %r10, %r10
+ xor %ebx, %ebx
+ mov %rax, %rdi
+ mov (%rsi,%r8,8), %rax
+ mov %rdx, %r11
+ jmp LL1
+
+Lb0: lea (%rsi,%r8,8), %rsi
+ lea -16(%rcx,%r8,8), %rcx
+ neg %r8
+ xor %r10, %r10
+ mov %rax, %r11
+ mov %rdx, %rbx
+ jmp LL0
+
+Lb3: lea -8(%rsi,%r8,8), %rsi
+ lea -24(%rcx,%r8,8), %rcx
+ neg %r8
+ mov %rax, %rbx
+ mov %rdx, %r10
+ jmp LL3
+
+Lb2: lea -16(%rsi,%r8,8), %rsi
+ lea -32(%rcx,%r8,8), %rcx
+ neg %r8
+ xor %r11, %r11
+ xor %ebx, %ebx
+ mov %rax, %r10
+ mov 24(%rsi,%r8,8), %rax
+ mov %rdx, %rdi
+ jmp LL2
+
+ .align 16, 0x90
+Ltop: add %r10, (%rcx,%r8,8)
+ adc %rax, %rdi
+ mov (%rsi,%r8,8), %rax
+ adc %rdx, %r11
+ mov $0, %r10d
+LL1: mul %r9
+ add %rdi, 8(%rcx,%r8,8)
+ adc %rax, %r11
+ adc %rdx, %rbx
+LL0: mov 8(%rsi,%r8,8), %rax
+ mul %r9
+ add %r11, 16(%rcx,%r8,8)
+ adc %rax, %rbx
+ adc %rdx, %r10
+LL3: mov 16(%rsi,%r8,8), %rax
+ mul %r9
+ add %rbx, 24(%rcx,%r8,8)
+ mov $0, %r11d
+ mov %r11, %rbx
+ adc %rax, %r10
+ mov 24(%rsi,%r8,8), %rax
+ mov %r11, %rdi
+ adc %rdx, %rdi
+LL2: mul %r9
+ add $4, %r8
+ js Ltop
+
+ add %r10, (%rcx,%r8,8)
+ adc %rax, %rdi
+ adc %r11, %rdx
+ add %rdi, 8(%rcx,%r8,8)
+Lret: adc $0, %rdx
+ mov %rdx, %rax
+
+ pop %rbx
+pop %rdi
+pop %rsi
+ ret
+