1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
|
.text
.align 4, 0x90
.globl ___gmpn_sub_nc
# ___gmpn_sub_nc -- multi-limb subtraction with a borrow-in.
# Computes dst[i] = a[i] - b[i] - borrow over n 64-bit limbs, lowest limb
# first, and returns the final borrow.
#
# Registers, as used by the code reachable from this entry:
#   rdi = dst  (results are stored through it)
#   rsi = a    (minuend limbs are loaded from it)
#   rdx = b    (subtrahend limbs, read by sbb)
#   rcx = n    (limb count)
#   r8  = borrow-in; any nonzero value acts as a borrow of 1
#   eax = returned borrow-out, 0 or 1
# These are the first five System V AMD64 integer argument registers.
# NOTE(review): the symbol name suggests GMP mpn_sub_nc built with a Mach-O
# style leading underscore -- confirm against the build that produced this.
#
# Written registers: rax, rcx, rdx, rsi, rdi, r8-r11 and the flags.
# No stack space is used.
# n = 0 is not handled: index 0 selects L0, which always processes a full
# group of eight limbs.
___gmpn_sub_nc:
mov %ecx, %eax			# eax = low bits of n (only bits 0-2 are kept)
shr $3, %rcx			# rcx = n / 8 = number of full 8-limb groups
and $7, %eax			# rax = n mod 8, the index into Ltab
lea Ltab(%rip), %r9		# r9 = address of the offset table
neg %r8				# CF = (r8 != 0); placed after shr/and, which rewrite CF
movslq (%r9,%rax,4), %rax	# rax = sign-extended 32-bit offset from Ltab
lea (%r9,%rax), %rax		# target = Ltab + offset; lea, unlike add, keeps CF
jmp *%rax			# enter L0..L7 with CF holding the borrow-in
.align 4, 0x90
.globl ___gmpn_sub_n
# ___gmpn_sub_n -- multi-limb subtraction without a borrow-in.
# Computes dst[i] = a[i] - b[i] - borrow over n 64-bit limbs, lowest limb
# first, starting with borrow = 0, and returns the final borrow.
#
# Registers, as used by the code reachable from this entry:
#   rdi = dst  (results are stored through it)
#   rsi = a    (minuend limbs are loaded from it)
#   rdx = b    (subtrahend limbs, read by sbb)
#   rcx = n    (limb count)
#   eax = returned borrow-out, 0 or 1
# These are the first four System V AMD64 integer argument registers.
# NOTE(review): the symbol name suggests GMP mpn_sub_n built with a Mach-O
# style leading underscore -- confirm against the build that produced this.
#
# Written registers: rax, rcx, rdx, rsi, rdi, r8-r11 and the flags.
# No stack space is used.
# n = 0 is not handled: index 0 selects L0, which always processes a full
# group of eight limbs.
___gmpn_sub_n:
mov %ecx, %eax			# eax = low bits of n (only bits 0-2 are kept)
shr $3, %rcx			# rcx = n / 8 = number of full 8-limb groups
and $7, %eax			# rax = n mod 8; and also clears CF, giving borrow-in = 0
lea Ltab(%rip), %r9		# r9 = address of the offset table
movslq (%r9,%rax,4), %rax	# rax = sign-extended 32-bit offset from Ltab
lea (%r9,%rax), %rax		# target = Ltab + offset; lea, unlike add, keeps CF
jmp *%rax			# enter L0..L7 with CF = 0
# Entry stubs for n mod 8 = 0, 4, 5, 6, 7, reached through Ltab.
# On arrival: rdi = dst, rsi = a, rdx = b, rcx = n / 8, CF = borrow-in.
# Each stub performs the loads and sbb steps that the loop body would have
# done before the matching Le label, then jumps into the middle of the loop.
# Stubs L4..L7 first move all three pointers back so that the fixed
# displacements used from that Le label onward address limb 0 upward, and
# add 1 to rcx because the partial first pass ends with the loop dec.
# Between sbb steps only mov, lea, inc and jmp appear, none of which
# changes CF, so the borrow chain is unbroken.

# n mod 8 = 0: no bias needed, the first pass is a full group.
L0: mov (%rsi), %r8		# r8 = a[0]
mov 8(%rsi), %r9		# r9 = a[1], subtracted later at Le0
sbb (%rdx), %r8			# r8 = a[0] - b[0] - CF
jmp Le0
# n mod 8 = 4: bias by 4 limbs (32 bytes); Le4 stores r8 to 32(%rdi) = dst[0].
L4: mov (%rsi), %r8		# r8 = a[0]
mov 8(%rsi), %r9		# r9 = a[1], subtracted after Le4
sbb (%rdx), %r8			# r8 = a[0] - b[0] - CF
lea -32(%rsi), %rsi
lea -32(%rdx), %rdx
lea -32(%rdi), %rdi
inc %rcx			# count the partial pass; inc leaves CF alone
jmp Le4
# n mod 8 = 5: bias by 3 limbs (24 bytes); Le5 stores r11 to 24(%rdi) = dst[0].
L5: mov (%rsi), %r11		# r11 = a[0]
mov 8(%rsi), %r8		# r8 = a[1], subtracted at Le5
mov 16(%rsi), %r9		# r9 = a[2], subtracted after Le4
sbb (%rdx), %r11		# r11 = a[0] - b[0] - CF
lea -24(%rsi), %rsi
lea -24(%rdx), %rdx
lea -24(%rdi), %rdi
inc %rcx			# count the partial pass; inc leaves CF alone
jmp Le5
# n mod 8 = 6: bias by 2 limbs (16 bytes); after Le6, r10 goes to 16(%rdi) = dst[0].
L6: mov (%rsi), %r10		# r10 = a[0]
sbb (%rdx), %r10		# r10 = a[0] - b[0] - CF
mov 8(%rsi), %r11		# r11 = a[1], subtracted after Le6
lea -16(%rsi), %rsi
lea -16(%rdx), %rdx
lea -16(%rdi), %rdi
inc %rcx			# count the partial pass; inc leaves CF alone
jmp Le6
# n mod 8 = 7: bias by 1 limb (8 bytes); after Le7, r9 goes to 8(%rdi) = dst[0].
L7: mov (%rsi), %r9		# r9 = a[0]
mov 8(%rsi), %r10		# r10 = a[1]
sbb (%rdx), %r9			# r9 = a[0] - b[0] - CF
sbb 8(%rdx), %r10		# r10 = a[1] - b[1] - CF
lea -8(%rsi), %rsi
lea -8(%rdx), %rdx
lea -8(%rdi), %rdi
inc %rcx			# count the partial pass; inc leaves CF alone
jmp Le7
.align 4, 0x90
# Main loop: eight limbs per iteration, rcx = iterations still to run.
# Labels Le0..Le7 are entry points used by the stubs L0..L7.
# In the comments below a[k], b[k], dst[k] mean limb k of the current group.
# The last three results of a group (r9, r10, r11) are not stored inside
# the pass that computes them; they are written at the top of the next
# iteration (through the not yet advanced rdi) or at Lend.  When entered
# from L1, L2 or L3 those pending values are the leading n mod 8 limbs and
# rdi has been biased so the same three stores land on dst[0] upward.
# CF carries the borrow between sbb steps; every other instruction in the
# loop (mov, lea, dec, jnz) leaves CF unchanged.
Ltop:
Le3: mov %r9, 40(%rdi)		# pending result, slot 5 of the previous group
Le2: mov %r10, 48(%rdi)		# pending result, slot 6 of the previous group
Le1: mov (%rsi), %r8		# r8 = a[0]
mov 8(%rsi), %r9		# r9 = a[1]
sbb (%rdx), %r8			# r8 = a[0] - b[0] - CF
mov %r11, 56(%rdi)		# pending result, slot 7 of the previous group
lea 64(%rdi), %rdi		# rdi now addresses the current group
Le0: mov 16(%rsi), %r10		# r10 = a[2]
sbb 8(%rdx), %r9		# r9 = a[1] - b[1] - CF
sbb 16(%rdx), %r10		# r10 = a[2] - b[2] - CF
mov %r8, (%rdi)			# dst[0]
Le7: mov 24(%rsi), %r11		# r11 = a[3]
mov %r9, 8(%rdi)		# dst[1]
Le6: mov 32(%rsi), %r8		# r8 = a[4]
mov 40(%rsi), %r9		# r9 = a[5]
sbb 24(%rdx), %r11		# r11 = a[3] - b[3] - CF
mov %r10, 16(%rdi)		# dst[2]
Le5: sbb 32(%rdx), %r8		# r8 = a[4] - b[4] - CF
mov %r11, 24(%rdi)		# dst[3]
Le4: mov 48(%rsi), %r10		# r10 = a[6]
mov 56(%rsi), %r11		# r11 = a[7]
mov %r8, 32(%rdi)		# dst[4]
lea 64(%rsi), %rsi		# a advances to the next group
sbb 40(%rdx), %r9		# r9 = a[5] - b[5] - CF, stored later
sbb 48(%rdx), %r10		# r10 = a[6] - b[6] - CF, stored later
sbb 56(%rdx), %r11		# r11 = a[7] - b[7] - CF, stored later
lea 64(%rdx), %rdx		# b advances to the next group
dec %rcx			# sets ZF for jnz but does not modify CF
jnz Ltop
# Loop finished: flush the three pending results and return the borrow.
Lend: mov %r9, 40(%rdi)		# dst[5]
mov %r10, 48(%rdi)		# dst[6]
mov %r11, 56(%rdi)		# dst[7]
mov %ecx, %eax			# rcx is 0 here, so eax = 0 without touching CF
adc %ecx, %eax			# eax = 0 + 0 + CF = borrow-out
ret
.align 4, 0x90
# Entry stubs for n mod 8 = 3, 1, 2, reached through Ltab.
# On arrival: rdi = dst, rsi = a, rdx = b, rcx = n / 8, CF = borrow-in.
# Each stub subtracts the leading n mod 8 limbs into r9/r10/r11.  When no
# full group follows (rcx = 0, tested by jrcxz, which reads no flags and
# writes none) the results are stored and the borrow is returned at once.
# Otherwise a and b are advanced past the leading limbs, rdi is biased so
# that the stores at Le3/Le2/Le1 (offsets 40, 48, 56) hit dst[0] upward,
# and the loop is entered with those results still pending in registers.

# n mod 8 = 3
L3: mov (%rsi), %r9		# r9 = a[0]
mov 8(%rsi), %r10		# r10 = a[1]
mov 16(%rsi), %r11		# r11 = a[2]
sbb (%rdx), %r9			# r9 = a[0] - b[0] - CF
sbb 8(%rdx), %r10		# r10 = a[1] - b[1] - CF
sbb 16(%rdx), %r11		# r11 = a[2] - b[2] - CF
jrcxz Lx3			# n = 3 exactly: finish here
lea 24(%rsi), %rsi		# skip the three limbs just consumed
lea 24(%rdx), %rdx
lea -40(%rdi), %rdi		# 40(%rdi) = dst[0]; the loop adds 64 afterwards
jmp Le3
Lx3: mov %r9, (%rdi)		# dst[0]
mov %r10, 8(%rdi)		# dst[1]
mov %r11, 16(%rdi)		# dst[2]
mov %ecx, %eax			# rcx is 0 here, so eax = 0 without touching CF
adc %ecx, %eax			# eax = 0 + 0 + CF = borrow-out
ret
.align 4, 0x90
# n mod 8 = 1
L1: mov (%rsi), %r11		# r11 = a[0]
sbb (%rdx), %r11		# r11 = a[0] - b[0] - CF
jrcxz Lx1			# n = 1 exactly: finish here
lea 8(%rsi), %rsi		# skip the limb just consumed
lea 8(%rdx), %rdx
lea -56(%rdi), %rdi		# 56(%rdi) = dst[0]; the loop adds 64 afterwards
jmp Le1
Lx1: mov %r11, (%rdi)		# dst[0]
mov %ecx, %eax			# rcx is 0 here, so eax = 0 without touching CF
adc %ecx, %eax			# eax = 0 + 0 + CF = borrow-out
ret
.align 4, 0x90
# n mod 8 = 2
L2: mov (%rsi), %r10		# r10 = a[0]
mov 8(%rsi), %r11		# r11 = a[1]
sbb (%rdx), %r10		# r10 = a[0] - b[0] - CF
sbb 8(%rdx), %r11		# r11 = a[1] - b[1] - CF
jrcxz Lx2			# n = 2 exactly: finish here
lea 16(%rsi), %rsi		# skip the two limbs just consumed
lea 16(%rdx), %rdx
lea -48(%rdi), %rdi		# 48(%rdi) = dst[0]; the loop adds 64 afterwards
jmp Le2
Lx2: mov %r10, (%rdi)		# dst[0]
mov %r11, 8(%rdi)		# dst[1]
mov %ecx, %eax			# rcx is 0 here, so eax = 0 without touching CF
adc %ecx, %eax			# eax = 0 + 0 + CF = borrow-out
ret
.text
.align 3, 0x90
# Ltab: dispatch table used by ___gmpn_sub_n and ___gmpn_sub_nc.
# Entry k (k = n mod 8) is a 32-bit offset from Ltab to entry stub Lk.
# The dispatch code loads it with movslq (sign-extending, so stubs placed
# before the table work) and adds the address of Ltab back, which keeps
# the table free of absolute addresses.
# Entries must stay 4 bytes wide and in index order 0..7 to match the
# (%r9,%rax,4) addressing used by the dispatch code.
# NOTE(review): the .set indirection presumably exists so the label
# difference is evaluated by the assembler rather than emitted as a
# relocation -- confirm before simplifying to a direct .long Lk-Ltab.
# NOTE(review): with the power-of-two .align semantics of Mach-O
# assemblers this requests 8-byte alignment -- confirm for the target.
Ltab: .set L0_tmp, L0-Ltab
.long L0_tmp			# n mod 8 = 0
.set L1_tmp, L1-Ltab
.long L1_tmp			# n mod 8 = 1
.set L2_tmp, L2-Ltab
.long L2_tmp			# n mod 8 = 2
.set L3_tmp, L3-Ltab
.long L3_tmp			# n mod 8 = 3
.set L4_tmp, L4-Ltab
.long L4_tmp			# n mod 8 = 4
.set L5_tmp, L5-Ltab
.long L5_tmp			# n mod 8 = 5
.set L6_tmp, L6-Ltab
.long L6_tmp			# n mod 8 = 6
.set L7_tmp, L7-Ltab
.long L7_tmp			# n mod 8 = 7
|