1 | (in-package "CCL") |
---|
2 | |
---|
3 | ;;; %BIGNUM-REF needs to access bignums as obviously as possible, and it needs |
---|
4 | ;;; to be able to return 32 bits somewhere no one looks for real objects. |
---|
5 | ;;; |
---|
6 | ;;; The easiest thing to do is to store the 32 raw bits in two fixnums |
---|
7 | ;;; and return multiple values. |
---|
8 | ;;; |
---|
9 | ;;; XXX -- figure out how we're going to handle multiple-values... |
---|
;;; Return the 32-bit digit at byte offset I of BIGNUM as two values:
;;; the upper 16 bits and the lower 16 bits, each boxed as a fixnum.
;;; I is used directly as the index register (no scaling is applied here).
(defx8632lapfunction %bignum-ref ((bignum arg_y) (i arg_z))
  (let ((values-base temp0)
        (half imm0)
        (boxed temp1))
    ;; Remember the stack pointer as it was before any value is pushed.
    (movl (% esp) (% values-base))
    ;; Upper halfword lives 2 bytes past the start of the digit.
    (movzwl (@ (+ 2 x8632::misc-data-offset) (% bignum) (% i)) (% half))
    (box-fixnum half boxed)
    (push (% boxed))                    ;first value: high half
    (movzwl (@ x8632::misc-data-offset (% bignum) (% i)) (% half))
    (box-fixnum half boxed)
    (push (% boxed))                    ;second value: low half
    (set-nargs 2)
    (jmp-subprim .SPvalues)))
---|
20 | |
---|
21 | ;;; BIGNUM[I] := DIGIT[0] |
---|
;;; BIGNUM arrives on the stack; I (arg_y) is used directly as the byte
;;; offset of the digit to overwrite; DIGIT (arg_z) is a vector-like
;;; object whose element 0 is fetched with SVREF and stored raw.
(defx8632lapfunction %set-digit ((bignum 4) #|(ra 0)|# (i arg_y) (digit arg_z))
  (let ((target temp0)
        (raw imm0))
    (svref digit 0 raw)                 ;raw = DIGIT[0]
    (movl (@ bignum (% esp)) (% target))
    (movl (% raw) (@ x8632::misc-data-offset (% target) (% i)))
    (single-value-return 3)))
---|
27 | |
---|
28 | ;;; Return the sign of bignum (0 or -1) as a fixnum |
---|
;;; The sign is taken from the most significant (last) digit only:
;;; an arithmetic shift by 31 turns it into all zeros or all ones,
;;; which is then boxed, giving the fixnum 0 or -1.
(defx8632lapfunction %bignum-sign ((bignum arg_z))
  (let ((word imm0))
    (vector-length bignum word)
    ;; WORD indexes one past the last digit, hence the -4.
    (movl (@ (- x8632::misc-data-offset 4) (% bignum) (% word)) (% word))
    (sarl ($ 31) (% word))              ;smear the sign bit across the word
    (box-fixnum word arg_z)
    (single-value-return)))
---|
35 | |
---|
36 | ;;; Count the sign bits in the most significant digit of bignum; |
---|
37 | ;;; return fixnum count. |
---|
;;; Works on the last digit of BIGNUM.  A negative digit is complemented
;;; so that in both cases the redundant sign bits become leading zeros;
;;; BSR then locates the highest set bit and (31 xor index) converts that
;;; to a count.  When the adjusted digit is zero BSR sets ZF; SETE turns
;;; that into a +1 correction that is added to the low byte of the count.
(defx8632lapfunction %bignum-sign-bits ((bignum arg_z))
  (mark-as-imm temp0)                   ;temp0 will hold raw bits below
  (vector-length bignum imm0)
  (movl (@ (- x8632::misc-data-offset 4) (% bignum) (% imm0)) (% imm0))
  (movl (% imm0) (% temp0))             ;keep the original digit for the sign test
  (notl (% imm0))                       ;speculatively complement
  (testl (% temp0) (% temp0))
  (js @complemented)                    ;negative: the complement is what we want
  (notl (% imm0))                       ;non-negative: undo the complement
  @complemented
  (bsrl (% imm0) (% imm0))              ;index of highest set bit; ZF if none
  (sete (% temp0.b))                    ;1 if the adjusted digit was zero
  (xorl ($ 31) (% imm0))                ;31 - index
  (addb (% temp0.b) (% imm0.b))
  (box-fixnum imm0 arg_z)
  (mark-as-node temp0)
  (single-value-return))
---|
55 | |
---|
;;; Return T when the digit at byte offset IDX of BIGNUM, read as a signed
;;; 32-bit value, is zero or positive; return NIL when it is negative.
(defx8632lapfunction %digit-0-or-plusp ((bignum arg_y) (idx arg_z))
  (let ((digit imm0)
        (false temp0))
    (movl ($ x8632::nil-value) (% false))
    (movl (@ x8632::misc-data-offset (% bignum) (% idx)) (% digit))
    ;; Assume T (formed as NIL + t-offset), then fall back to NIL.
    (leal (@ x8632::t-offset (% false)) (% arg_z))
    (testl (% digit) (% digit))
    (cmovll (% false) (% arg_z))        ;signed "less than zero" => NIL
    (single-value-return)))
---|
63 | |
---|
64 | ;;; For oddp, evenp |
---|
;;; Only bit 0 of the first (least significant) digit is examined:
;;; T when it is set, NIL otherwise.
(defx8632lapfunction %bignum-oddp ((bignum arg_z))
  (let ((false temp0))
    (movl ($ x8632::nil-value) (% false))
    (movl (@ x8632::misc-data-offset (% bignum)) (% imm0)) ;digit 0
    (leal (@ x8632::t-offset (% false)) (% arg_z))         ;assume T
    (testb ($ 1) (% imm0.b))
    (cmovzl (% false) (% arg_z))        ;low bit clear => NIL
    (single-value-return)))
---|
72 | |
---|
;;; Return T if BIGNUM is positive, NIL if it is negative.
;;;
;;; The decision is made purely on the sign bit of the most significant
;;; digit, exactly as %BIGNUM-SIGN does.  The previous code used a signed
;;; "less or equal" test against zero, which answered NIL for positive
;;; bignums whose top digit is 0 (e.g. 2^31, stored as #x80000000 followed
;;; by a zero sign digit).
(defx8632lapfunction bignum-plusp ((bignum arg_z))
  (vector-length bignum imm0)
  ;; imm0 indexes one past the last digit, hence the -4.
  (movl (@ (- x8632::misc-data-offset 4) (% bignum) (% imm0)) (% imm0))
  (movl ($ x8632::nil-value) (% temp0))
  (lea (@ x8632::t-offset (% temp0)) (% arg_z)) ;assume T
  (testl (% imm0) (% imm0))             ;OF = 0, so "less" == sign bit set
  (cmovll (% temp0) (% arg_z))          ;negative => NIL
  (single-value-return))
---|
81 | |
---|
;;; Return T if BIGNUM is negative, NIL otherwise.
;;;
;;; Only the sign bit of the most significant digit matters (compare
;;; %BIGNUM-SIGN).  The previous code answered T whenever the top digit was
;;; "not greater than zero", so a positive bignum with a zero top digit
;;; (e.g. 2^31) was reported as negative.
(defx8632lapfunction bignum-minusp ((bignum arg_z))
  (vector-length bignum imm0)
  ;; imm0 indexes one past the last digit, hence the -4.
  (movl (@ (- x8632::misc-data-offset 4) (% bignum) (% imm0)) (% imm0))
  (movl ($ x8632::nil-value) (% arg_z)) ;assume NIL
  (lea (@ x8632::t-offset (% arg_z)) (% temp0)) ;temp0 = T
  (testl (% imm0) (% imm0))             ;OF = 0, so "less" == sign bit set
  (cmovll (% temp0) (% arg_z))          ;negative => T
  (single-value-return))
---|
90 | |
---|
91 | ;;; Add the digits A[I] and B[J], and the incoming carry C (a fixnum, |
---|
92 | ;;; either 0 or 1). Store the result in R[K], and return the outgoing |
---|
93 | ;;; carry. If I is NIL, A is a fixnum. If J is NIL, B is a fixnum. |
---|
;;; Integer-register version.  R, K, C, A and I arrive on the stack; B and J
;;; arrive in arg_y and arg_z.  The value returned in arg_z is the fixnum 1
;;; when the addition carried out of bit 31 and the fixnum 0 otherwise.
;;;
;;; The outgoing carry is now selected immediately after the ADC.
;;; Previously the CMOVNC came after MARK-AS-NODE and several other
;;; instructions; MARK-AS-NODE is a macro that is not guaranteed to
;;; preserve the carry flag, so the result could always read as "no carry".
;;; NOTE(review): confirm against the MARK-AS-NODE definition in the LAP
;;; macros; the reordering is harmless either way.
(defx8632lapfunction %add-with-carry ((r 20) (k 16) (c 12) (a 8) (i 4) #|(ra 0)|# (b arg_y) (j arg_z))
  (mark-as-imm temp0)                   ;temp0 holds a raw digit below
  (unbox-fixnum b imm0)                 ;assume j is nil: b is a fixnum
  (cmpl ($ x8632::nil-value) (% j))
  ;; if j not nil, get b[j]
  (cmovnel (@ x8632::misc-data-offset (% b) (% j)) (% imm0))
  (movl (@ a (% esp)) (% arg_y))
  (unbox-fixnum arg_y temp0)            ;assume i is nil: a is a fixnum
  (movl (@ i (% esp)) (% arg_z))
  (cmpl ($ x8632::nil-value) (% arg_z))
  ;; if i not nil, get a[i]
  (cmovnel (@ x8632::misc-data-offset (% arg_y) (% arg_z)) (% temp0))
  (movl ($ '1) (% arg_z))               ;for outgoing carry
  (xorl (% arg_y) (% arg_y))            ;fixnum 0, the "no carry" answer
  ;; I can't think of a better way to set CF at the moment.
  ;; NEG would be ideal, but we don't have a free imm reg.
  (btl ($ x8632::fixnumshift) (@ c (% esp))) ;CF = lsb of carry fixnum
  (adc (% temp0) (% imm0))              ;imm0 = a + b + CF
  (cmovnc (% arg_y) (% arg_z))          ;zero outgoing carry if CF = 0
  (mark-as-node temp0)
  (movl (@ r (% esp)) (% temp0))
  (movl (@ k (% esp)) (% temp1))
  (movl (% imm0) (@ x8632::misc-data-offset (% temp0) (% temp1))) ;r[k] = sum
  (single-value-return 7))
---|
118 | |
---|
119 | ;;; Add the digits A[I] and B[J], and the incoming carry C (a fixnum). |
---|
120 | ;;; Store the result in R[K], and return the outgoing carry. If I is |
---|
121 | ;;; NIL, A is a fixnum. If J is NIL, B is a fixnum. |
---|
#+sse2
;;; SSE2/MMX version: the two digits and the incoming carry are each moved
;;; into a 64-bit MMX register and added with PADDQ, so the carry out of
;;; bit 31 shows up in the upper 32 bits of the sum.
;;;
;;; The additions previously named registers XX and YY, which are not bound
;;; in this function (the LET binds AA, BB and CC); they now use AA and BB,
;;; accumulating the 64-bit sum in BB.
(defx8632lapfunction %add-with-carry ((r 20) (k 16) (c 12) (a 8) (i 4) #|(ra 0)|# (b arg_y) (j arg_z))
  (let ((aa mm2)
        (bb mm3)
        (cc mm4))
    (unbox-fixnum b imm0)               ;assume j will be nil
    (cmpl ($ x8632::nil-value) (% j))
    ;; if j not nil, get b[j]
    (cmovnel (@ x8632::misc-data-offset (% b) (% j)) (% imm0))
    (movd (% imm0) (% bb))
    (movl (@ a (% esp)) (% arg_y))
    (movl (@ i (% esp)) (% arg_z))
    (movl (@ c (% esp)) (% temp0))
    (unbox-fixnum arg_y imm0)           ;assume i will be nil
    (cmpl ($ x8632::nil-value) (% arg_z))
    ;; if i not nil, get a[i]
    (cmovnel (@ x8632::misc-data-offset (% arg_y) (% arg_z)) (% imm0))
    (movd (% imm0) (% aa))
    (unbox-fixnum temp0 imm0)
    (movd (% imm0) (% cc))
    (paddq (% aa) (% bb))               ;bb = a + b
    (paddq (% cc) (% bb))               ;bb = a + b + c (64-bit)
    (movl (@ r (% esp)) (% temp0))
    (movl (@ k (% esp)) (% temp1))
    (movd (% bb) (@ x8632::misc-data-offset (% temp0) (% temp1))) ;r[k] = low word
    (psrlq ($ 32) (% bb))               ;carry bit
    (movd (% bb) (% imm0))
    (box-fixnum imm0 arg_z)
    (single-value-return 7)))
---|
151 | |
---|
152 | ;;; Store the result of A[I] - B[J] - borrow into R[K], returning the borrow. |
---|
153 | ;;; If I is NIL, A is a fixnum; likewise for J and B. |
---|
154 | ;;; |
---|
155 | ;;; (a - b) - (1 - borrow), or equivalently, (a - b) + borrow - 1 |
---|
156 | ;;; |
---|
157 | ;;; Note: borrow is 1 for no borrow and 0 for a borrow. |
---|
;;; Integer-register version.  CF is primed from BORROW (CF = 1 exactly when
;;; the incoming borrow fixnum is 0), one SBB produces the difference and a
;;; second SBB against the constant 1 produces the outgoing borrow in the
;;; same "1 = no borrow, 0 = borrow" convention.
(defx8632lapfunction %subtract-with-borrow ((r 20) (k 16) (borrow 12) (a 8) (i 4) #|(ra 0)|# (b arg_y) (j arg_z))
  (mark-as-imm temp0)
  (let ((subtrahend imm0)
        (minuend temp0)
        (result-vector temp0)
        (result-index temp1))
    ;; subtrahend: b itself when j is nil, otherwise b[j]
    (unbox-fixnum b subtrahend)
    (cmpl ($ x8632::nil-value) (% j))
    (cmovnel (@ x8632::misc-data-offset (% b) (% j)) (% subtrahend))
    ;; minuend: a itself when i is nil, otherwise a[i]
    (movl (@ a (% esp)) (% arg_y))
    (unbox-fixnum arg_y minuend)
    (movl (@ i (% esp)) (% arg_z))
    (cmpl ($ x8632::nil-value) (% arg_z))
    (cmovnel (@ x8632::misc-data-offset (% arg_y) (% arg_z)) (% minuend))
    (cmpl ($ '1) (@ borrow (% esp)))    ;CF = 1 if borrow is 0 else CF = 0
    (sbb (% subtrahend) (% minuend))    ;minuend = a - b - CF
    (movl ($ 1) (% imm0))
    (sbb ($ 0) (% imm0))                ;1 - CF: outgoing borrow indicator
    (box-fixnum imm0 arg_z)
    (movl (% minuend) (% imm0))         ;park the difference in imm0
    (mark-as-node temp0)
    (movl (@ r (% esp)) (% result-vector))
    (movl (@ k (% esp)) (% result-index))
    (movl (% imm0) (@ x8632::misc-data-offset (% result-vector) (% result-index)))
    (single-value-return 7)))
---|
180 | |
---|
#+sse2
;;; SSE2/MMX version.  Computes (a - b) - (1 - borrow) in 64 bits, stores
;;; the low word in R[K] and returns the fixnum 1 when no borrow occurred,
;;; 0 when one did.  BORROW is assumed to be the fixnum 0 or 1, as stated in
;;; the comment preceding these definitions.
;;;
;;; Two defects are fixed here:
;;;  * The old code added (borrow - 1) with PADDQ.  MOVD zero-extends, so
;;;    -1 became #xFFFFFFFF rather than a 64-bit -1; the low word was right
;;;    but the upper word (and therefore the returned borrow) was inverted
;;;    whenever the incoming borrow was 0.  We now subtract (1 - borrow),
;;;    which is 0 or 1 and survives zero-extension.
;;;  * CMOVcc has no immediate-operand form, so the fixnum 1 is first
;;;    loaded into a register.
(defx8632lapfunction %subtract-with-borrow ((r 20) (k 16) (borrow 12) (a 8) (i 4) #|(ra 0)|# (b arg_y) (j arg_z))
  (let ((aa mm2)
        (bb mm3)
        (ww mm4))
    (unbox-fixnum b imm0)               ;assume j will be nil
    (cmpl ($ x8632::nil-value) (% j))
    ;; if j not nil, get b[j]
    (cmovnel (@ x8632::misc-data-offset (% b) (% j)) (% imm0))
    (movd (% imm0) (% bb))
    (movl (@ a (% esp)) (% arg_y))
    (movl (@ i (% esp)) (% arg_z))
    (movl (@ borrow (% esp)) (% temp0))
    (unbox-fixnum arg_y imm0)           ;assume i will be nil
    (cmpl ($ x8632::nil-value) (% arg_z))
    ;; if i not nil, get a[i]
    (cmovnel (@ x8632::misc-data-offset (% arg_y) (% arg_z)) (% imm0))
    (movd (% imm0) (% aa))
    (unbox-fixnum temp0 imm0)
    (xorl ($ 1) (% imm0))               ;1 - borrow, for borrow in {0,1}
    (movd (% imm0) (% ww))
    (psubq (% bb) (% aa))               ;aa = a - b
    (psubq (% ww) (% aa))               ;aa = a - b - (1 - borrow)
    (movl (@ r (% esp)) (% temp0))
    (movl (@ k (% esp)) (% temp1))
    (movd (% aa) (@ x8632::misc-data-offset (% temp0) (% temp1))) ;r[k] = low word
    (psrlq ($ 32) (% aa))               ;upper word: 0, or all ones on borrow
    (movd (% aa) (% imm0))
    (movl ($ '1) (% temp0))             ;r is no longer needed in temp0
    (xorl (% arg_z) (% arg_z))          ;assume a borrow occurred (fixnum 0)
    (test ($ 1) (% imm0))
    (cmovzl (% temp0) (% arg_z))        ;upper word clear => no borrow => 1
    (single-value-return 7)))
---|
213 | |
---|
;;; HIGH and LOW are fixnums holding the two 16-bit halves of a 32-bit
;;; digit.  Subtract 1 from the composed digit and return the new halves as
;;; two values, high half first.
;;;
;;; Changes from the previous version, both made to agree with %BIGNUM-REF,
;;; the other register-only multiple-value return in this file:
;;;  * the value count is now set with (SET-NARGS 2) before entering
;;;    .SPvalues (it was never set);
;;;  * temp0 is loaded with the stack pointer BEFORE the values are pushed
;;;    rather than after.
(defx8632lapfunction %subtract-one ((high arg_y) (low arg_z))
  (mark-as-imm temp0)
  (unbox-fixnum low imm0)
  (movl (% high) (% temp0))
  (shll ($ (- 16 x8632::fixnumshift)) (% temp0)) ;boxed high -> bits 16..31
  (orl (% imm0) (% temp0))              ;temp0 = composed 32-bit digit
  (subl ($ 1) (% temp0))
  (movzwl (% temp0.w) (% imm0))
  (box-fixnum imm0 low)                 ;new low half
  (sarl ($ 16) (% temp0))
  (box-fixnum temp0 high)               ;new high half
  (mark-as-node temp0)
  (movl (% esp) (% temp0))              ;stack pointer before the values
  (push (% high))
  (push (% low))
  (set-nargs 2)
  (jmp-subprim .SPvalues))
---|
230 | |
---|
231 | ;;; %SUBTRACT-WITH-BORROW -- Internal. |
---|
232 | ;;; |
---|
233 | ;;; This should be in assembler, and should not cons intermediate results. It |
---|
234 | ;;; returns a 32bit digit and a borrow resulting from subtracting b from a, and |
---|
235 | ;;; subtracting a possible incoming borrow. |
---|
236 | ;;; |
---|
237 | ;;; We really do: a - b - 1 + borrow, where borrow is either 0 or 1. |
---|
238 | ;;; |
---|
239 | |
---|
;;; A and B are each passed as two fixnum halves (high, low).  Compose both
;;; 32-bit digits, compute a - b - 1 + borrow, and push three values: the
;;; high half of the difference, its low half, and the outgoing borrow
;;; (1 = no borrow, 0 = borrow).
;;;
;;; Fixes relative to the previous version:
;;;  * BORROW is a register argument (arg_z); it was being addressed as if
;;;    it were a stack offset.
;;;  * The outgoing borrow is derived with SBBL, matching
;;;    %SUBTRACT-WITH-BORROW; a byte-sized SUBB of 0 ignored the carry flag.
;;;  * The halves are pushed high first, then low, as the comments say and
;;;    as %BIGNUM-REF, %SUBTRACT-ONE and %ADD-THE-CARRY do; the code
;;;    previously pushed the low halfword under the ";high" label.
;;;
;;; NOTE(review): the stack clean-up before .SPvalues is unchanged and looks
;;; unfinished.  After three pushes the word on top of the stack is the
;;; borrow value, not the return address, so the POPL below does not
;;; "relocate the return address"; temp0 is also loaded after the pushes,
;;; unlike %BIGNUM-REF.  Confirm the intended multiple-value protocol for
;;; functions with stack arguments before relying on this function.
(defx8632lapfunction %subtract-with-borrow-1 ((a-h 12) (a-l 8) (b-h 4) #|(ra 0)|# (b-l arg_y) (borrow arg_z))
  (mark-as-imm temp0)
  (mark-as-imm temp1)
  ;; temp0 = b
  (unbox-fixnum b-l temp0)
  (movl (@ b-h (% esp)) (% imm0))
  (unbox-fixnum imm0 imm0)
  (shll ($ 16) (% imm0))
  (orl (% imm0) (% temp0))
  ;; temp1 = a
  (movl (@ a-l (% esp)) (% temp1))
  (unbox-fixnum temp1 temp1)
  (movl (@ a-h (% esp)) (% imm0))
  (unbox-fixnum imm0 imm0)
  (shll ($ 16) (% imm0))
  (orl (% imm0) (% temp1))
  (cmpl ($ '1) (% borrow))              ;CF = 1 if borrow is 0 else CF = 0
  (sbbl (% temp0) (% temp1))            ;temp1 = a - b - CF
  (movl ($ 1) (% imm0))
  (sbbl ($ 0) (% imm0))                 ;1 - CF: outgoing borrow indicator
  (box-fixnum imm0 arg_z)
  (movl (% temp1) (% imm0))
  (sarl ($ 16) (% imm0))
  (box-fixnum imm0 imm0)
  (push (% imm0))                       ;high
  (movzwl (% temp1.w) (% imm0))
  (box-fixnum imm0 imm0)
  (push (% imm0))                       ;low
  (mark-as-node temp0)
  (mark-as-node temp1)
  (push (% arg_z))                      ;borrow
  (set-nargs 3)
  (popl (@ 16 (% esp)))                 ;relocate return addr (see NOTE above)
  (addl ($ '4) (% esp))                 ;discard args, part of saved frame
  (movl (% esp) (% temp0))
  (jmp-subprim .SPvalues))
---|
273 | |
---|
274 | |
---|
275 | ;;; To normalize a bignum is to drop "trailing" digits which are |
---|
276 | ;;; redundant sign information. When return-fixnum-p is non-nil, make |
---|
277 | ;;; the resultant bignum into a fixnum if it fits. |
---|
;;; Walk down from the most significant digit, zeroing and dropping every
;;; digit that merely repeats the sign of the digit below it, then rewrite
;;; the header with the new length.  If RETURN-FIXNUM-P is non-nil and the
;;; result is a one-digit bignum whose digit survives a box/unbox round
;;; trip, return that fixnum instead of the bignum.
;;;
;;; Fix: the one-digit test compared the header constant with the bignum
;;; POINTER in arg_z, which can never be the intended comparison; it now
;;; compares against the header word stored at misc-header-offset, the same
;;; location the new header is written to just above.
(defx8632lapfunction %normalize-bignum-2 ((return-fixnum-p arg_y) (bignum arg_z))
  (push (% return-fixnum-p))            ;arg_y is reused as LEN below
  (mark-as-imm temp0)
  (mark-as-imm temp1)
  (let ((len arg_y)
        (sign temp0)
        (next temp1))
    (vector-length bignum len)
    (cmpl ($ '1) (% len))
    (jle @maybe-return-fixnum)
    ;; Zero trailing sign digits.
    (push (% len))                      ;remember the original length
    ;; next-to-last digit
    (movl (@ (- x8632::misc-data-offset 8) (% bignum) (% len)) (% next))
    ;; last digit
    (movl (@ (- x8632::misc-data-offset 4) (% bignum) (% len)) (% sign))
    (jmp @test)
    @loop
    (subl ($ '1) (% len))
    (movl ($ 0) (@ x8632::misc-data-offset (% bignum) (% len)))
    (cmpl ($ '1) (% len))               ;any more digits?
    (je @adjust-length)
    (movl (% next) (% sign))
    ;; (bignum-ref bignum (- len 2))
    (movl (@ (- x8632::misc-data-offset 8) (% bignum) (% len)) (% next))
    @test
    (movl (% next) (% imm0))
    (sarl ($ 31) (% imm0))              ;propagate sign bit
    (xorl (% sign) (% imm0))            ;whole digit only sign?
    (jz @loop)
    ;; New length now in len.
    @adjust-length
    (pop (% imm0))                      ;original length
    (cmpl (% len) (% imm0))
    ;; If the new length is the same as the original length, we know
    ;; that the bignum is at least two digits long (because if it was
    ;; shorter, we would have branched directly to
    ;; @maybe-return-fixnum), and thus won't fit in a fixnum.
    ;; Therefore, there's no need to do either of the tests at
    ;; @maybe-return-fixnum.
    (je @done)
    ;; Build and store a header word for the shortened bignum.
    (movl (% len) (% imm0))
    (shll ($ (- x8632::num-subtag-bits x8632::fixnumshift)) (% imm0))
    (movb ($ x8632::subtag-bignum) (% imm0.b))
    (movl (% imm0) (@ x8632::misc-header-offset (% bignum)))
    @maybe-return-fixnum
    ;; could use SETcc here to avoid one branch
    (cmpl ($ x8632::nil-value) (@ 0 (% esp))) ;return-fixnum-p
    (je @done)
    (cmpl ($ x8632::one-digit-bignum-header)
          (@ x8632::misc-header-offset (% bignum)))
    (jne @done)
    ;; Bignum has one digit.  If it fits in a fixnum, return a fixnum.
    (movl (@ x8632::misc-data-offset (% bignum)) (% imm0))
    (box-fixnum imm0 arg_y)
    (unbox-fixnum arg_y temp0)
    (cmpl (% temp0) (% imm0))           ;did boxing lose any bits?
    (cmovel (% arg_y) (% arg_z))
    @done
    (pop (% imm0))                      ;discard saved return-fixnum-p
    (mark-as-node temp0)
    (mark-as-node temp1)
    (single-value-return)))
---|
340 | |
---|
341 | ;;; Multiply X[I] by the unboxed value of the (non-negative) fixnum Y; |
---|
342 | ;;; add the incoming carry from CARRY[0] to the 64-bit product. Store |
---|
343 | ;;; the low word of the 64-bit sum in R[0] and the high word in |
---|
344 | ;;; CARRY[0]. |
---|
;;; R, CARRY and X arrive on the stack; I (arg_y) is used directly as the
;;; byte offset of the digit in X; Y (arg_z) is a fixnum that is unboxed
;;; before the 32x32->64 multiply.  CARRY[0] is both read (incoming carry)
;;; and written (outgoing high word).
;;;
;;; Change: the pointer to X is now held in temp0 instead of imm0.  Elsewhere
;;; in this file raw bits go in imm0 (or in temp registers explicitly
;;; marked with MARK-AS-IMM) and object pointers go in temp/arg registers;
;;; keeping a heap pointer in the immediate register breaks that discipline.
;;; NOTE(review): presumably a pointer in imm0 is invisible to the GC --
;;; confirm against the x8632 register conventions.
(defx8632lapfunction %multiply-and-add ((r 12) (carry 8) (x 4) #|(ra 0)|# (i arg_y) (y arg_z))
  (let ((xx mm2)
        (yy mm3)
        (cc mm4))
    (movl (@ x (% esp)) (% temp0))
    (movd (@ x8632::misc-data-offset (% temp0) (% i)) (% xx)) ;x[i]
    (unbox-fixnum y imm0)
    (movd (% imm0) (% yy))
    (pmuludq (% xx) (% yy))             ;64 bit product
    (movl (@ carry (% esp)) (% arg_y))
    (movd (@ x8632::misc-data-offset (% arg_y)) (% cc))
    (paddq (% cc) (% yy))               ;add in 32 bit carry digit
    (movl (@ r (% esp)) (% arg_z))
    (movd (% yy) (@ x8632::misc-data-offset (% arg_z))) ;r[0] = low word
    (psrlq ($ 32) (% yy))
    (movd (% yy) (@ x8632::misc-data-offset (% arg_y))) ;carry[0] = high word
    (single-value-return 5)))
---|
362 | |
---|
363 | ;; multiply x[i] by y and add to result starting at digit i |
---|
;;; For j from 0 below YLEN: r[i+j] := low32(x[i]*y[j] + r[i+j] + carry),
;;; with the upper 32 bits carried into the next step; the final carry is
;;; stored in the digit after the last one updated.  I and YLEN are used
;;; directly as byte-scaled counters (stepped by the fixnum '1).
;;;
;;; Fix: the existing digit r[i+j] is now added into the sum.  The previous
;;; loop overwrote it, which contradicts "add to result" above.  The sum
;;; cannot overflow 64 bits:
;;; (2^32-1)^2 + 2*(2^32-1) = 2^64 - 1.
(defx8632lapfunction %multiply-and-add-harder-loop-2
    ((x 12) (y 8) (r 4) #|(ra 0)|# (i arg_y) (ylen arg_z))
  (let ((cc mm2)
        (xx mm3)
        (yy mm4)
        (rr mm5)
        (j imm0))
    (movl (@ x (% esp)) (% temp0))
    (movd (@ x8632::misc-data-offset (% temp0) (% i)) (% xx)) ;x[i]
    (movl (@ y (% esp)) (% temp0))
    (movl (@ r (% esp)) (% temp1))
    (pxor (% cc) (% cc))                ;carry = 0
    (xorl (% j) (% j))
    @loop
    (movd (@ x8632::misc-data-offset (% temp0) (% j)) (% yy)) ;y[j]
    (pmuludq (% xx) (% yy))             ;64 bit product
    (movd (@ x8632::misc-data-offset (% temp1) (% i)) (% rr)) ;r[i]
    (paddq (% yy) (% rr))               ;add in product
    (paddq (% cc) (% rr))               ;add in carry
    (movd (% rr) (@ x8632::misc-data-offset (% temp1) (% i))) ;update r[i]
    (movq (% rr) (% cc))
    (psrlq ($ 32) (% cc))               ;carry high digit
    (addl ($ '1) (% i))
    (addl ($ '1) (% j))
    (subl ($ '1) (% ylen))
    (jg @loop)
    (movd (% cc) (@ x8632::misc-data-offset (% temp1) (% i)))
    (single-value-return 5)))
---|
389 | |
---|
390 | ;; this is silly |
---|
;;; HIGH (on the stack) and LOW (arg_y) are fixnum halves of a 32-bit digit;
;;; C (arg_z) is a fixnum.  Compose the digit, add the unboxed C, split the
;;; sum into halves again and push them as two values, high half first.
;;;
;;; NOTE(review): temp0 is loaded with the stack pointer after the values
;;; have been pushed (unlike %BIGNUM-REF), and the stack argument HIGH is
;;; not removed before the jump to .SPvalues.  Confirm the intended
;;; multiple-value return protocol for functions with stack arguments.
(defx8632lapfunction %add-the-carry ((high 4) #|(ra 0)|# (low arg_y) (c arg_z))
  (mark-as-imm temp0)
  ;; temp0 = (high << 16) | low
  (movl (@ high (% esp)) (% temp0))
  (shll ($ (- 16 x8632::fixnumshift)) (% temp0))
  (unbox-fixnum low imm0)
  (orl (% imm0) (% temp0))
  ;; temp0 += c
  (unbox-fixnum c imm0)
  (addl (% imm0) (% temp0))
  ;; split the sum into boxed halves
  (movzwl (% temp0.w) (% imm0))
  (box-fixnum imm0 temp1)               ;temp1 = low half
  (sarl ($ 16) (% temp0))
  (box-fixnum temp0 temp0)              ;temp0 = high half
  (push (% temp0))                      ;high
  (push (% temp1))                      ;low
  (set-nargs 2)
  (mark-as-node temp0)
  (movl (% esp) (% temp0))
  (jmp-subprim .SPvalues))
---|
409 | |
---|
;;; Return, as a fixnum, the number of consecutive zero bits at the least
;;; significant end of BIGNUM: 32 for every all-zero low digit plus the
;;; index of the lowest set bit in the first non-zero digit.  The loop has
;;; no length check, so BIGNUM must contain a non-zero digit.
;;;
;;; Fixes:
;;;  * BSF (lowest set bit) replaces BSR (highest set bit); BSR measured the
;;;    wrong end of the digit.
;;;  * The running count starts at -32 so that the unconditional +32 inside
;;;    the loop yields 0 for the first digit; it used to start at +32,
;;;    making every result 64 too large.
;;;  * The vector length was loaded but never used; that load is gone.
(defx8632lapfunction %bignum-count-trailing-zero-bits ((bignum arg_z))
  (let ((i arg_y)
        (zeros temp1))
    (xorl (% i) (% i))
    (movl ($ '-32) (% zeros))
    @loop
    (movl (@ x8632::misc-data-offset (% bignum) (% i)) (% imm0))
    (addl ($ '1) (% i))
    (addl ($ '32) (% zeros))
    (testl (% imm0) (% imm0))
    (jz @loop)
    ;; now count zero bits in digit
    (bsfl (% imm0) (% imm0))
    (box-fixnum imm0 imm0)
    (addl (% imm0) (% zeros))
    (movl (% zeros) (% arg_z))
    (single-value-return)))
---|
429 | |
---|
430 | ;;; dest[i] = (logand x[i] y[i]) |
---|
;;; IDX and X arrive on the stack, Y and DEST in registers.  IDX is used
;;; directly as the byte offset of the digit in all three vectors.
(defx8632lapfunction %bignum-logand ((idx 8) (x 4) #|(ra 0)|# (y arg_y) (dest arg_z))
  (let ((offset temp0)
        (xvec temp1)
        (word imm0))
    (movl (@ x (% esp)) (% xvec))
    (movl (@ idx (% esp)) (% offset))
    (movl (@ x8632::misc-data-offset (% xvec) (% offset)) (% word)) ;x[i]
    (andl (@ x8632::misc-data-offset (% y) (% offset)) (% word))    ;& y[i]
    (movl (% word) (@ x8632::misc-data-offset (% dest) (% offset)))
    (single-value-return 4)))
---|
441 | |
---|
442 | ;;; dest[i] = (logandc1 x[i] y[i]) |
---|
;;; Stores (lognot x[i]) AND y[i] into dest[i].  IDX and X arrive on the
;;; stack; IDX is used directly as the byte offset of the digit.
(defx8632lapfunction %bignum-logandc1 ((idx 8) (x 4) #|(ra 0)|# (y arg_y) (dest arg_z))
  (let ((offset temp0)
        (xvec temp1)
        (word imm0))
    (movl (@ x (% esp)) (% xvec))
    (movl (@ idx (% esp)) (% offset))
    (movl (@ x8632::misc-data-offset (% xvec) (% offset)) (% word)) ;x[i]
    (not (% word))                                                  ;~x[i]
    (andl (@ x8632::misc-data-offset (% y) (% offset)) (% word))    ;& y[i]
    (movl (% word) (@ x8632::misc-data-offset (% dest) (% offset)))
    (single-value-return 4)))
---|
454 | |
---|
455 | ;;; dest[i] = (logandc2 x[i] y[i]) |
---|
;;; Stores x[i] AND (lognot y[i]) into dest[i].  IDX and X arrive on the
;;; stack; IDX is used directly as the byte offset of the digit.
(defx8632lapfunction %bignum-logandc2 ((idx 8) (x 4) #|(ra 0)|# (y arg_y) (dest arg_z))
  (let ((offset temp0)
        (xvec temp1)
        (word imm0))
    (movl (@ x (% esp)) (% xvec))
    (movl (@ idx (% esp)) (% offset))
    (movl (@ x8632::misc-data-offset (% y) (% offset)) (% word))    ;y[i]
    (not (% word))                                                  ;~y[i]
    (andl (@ x8632::misc-data-offset (% xvec) (% offset)) (% word)) ;& x[i]
    (movl (% word) (@ x8632::misc-data-offset (% dest) (% offset)))
    (single-value-return 4)))
---|
467 | |
---|
468 | ;;; dest[i] = (logior x[i] y[i]) |
---|
;;; Stores x[i] OR y[i] into dest[i].  IDX and X arrive on the stack; IDX
;;; is used directly as the byte offset of the digit.
(defx8632lapfunction %bignum-logior ((idx 8) (x 4) #|(ra 0)|# (y arg_y) (dest arg_z))
  (let ((offset temp0)
        (xvec temp1)
        (word imm0))
    (movl (@ x (% esp)) (% xvec))
    (movl (@ idx (% esp)) (% offset))
    (movl (@ x8632::misc-data-offset (% xvec) (% offset)) (% word)) ;x[i]
    (orl (@ x8632::misc-data-offset (% y) (% offset)) (% word))     ;| y[i]
    (movl (% word) (@ x8632::misc-data-offset (% dest) (% offset)))
    (single-value-return 4)))
---|
479 | |
---|
480 | ;;; dest[i] = (lognot x[i]) |
---|
;;; Stores the bitwise complement of x[i] into dest[i].  IDX arrives on the
;;; stack and is used directly as the byte offset of the digit.
;;;
;;; Fix: this definition was named %BIGNUM-LOGIOR, so loading the file
;;; replaced the four-argument inclusive-or primitive defined just before
;;; it with this three-argument complement.  It is renamed %BIGNUM-LOGNOT
;;; to match what it computes.
;;; NOTE(review): confirm that callers refer to this primitive by that name.
(defx8632lapfunction %bignum-lognot ((idx 4) #|(ra 0)|# (x arg_y) (dest arg_z))
  (let ((i temp0))
    (movl (@ idx (% esp)) (% i))
    (movl (@ x8632::misc-data-offset (% x) (% i)) (% imm0))
    (not (% imm0))
    (movl (% imm0) (@ x8632::misc-data-offset (% dest) (% i)))
    (single-value-return 3)))
---|
488 | |
---|
489 | ;;; dest[i] = (logxor x[i] y[i]) |
---|
;;; Stores x[i] XOR y[i] into dest[i].  IDX and X arrive on the stack; IDX
;;; is used directly as the byte offset of the digit.
(defx8632lapfunction %bignum-logxor ((idx 8) (x 4) #|(ra 0)|# (y arg_y) (dest arg_z))
  (let ((offset temp0)
        (xvec temp1)
        (word imm0))
    (movl (@ x (% esp)) (% xvec))
    (movl (@ idx (% esp)) (% offset))
    (movl (@ x8632::misc-data-offset (% xvec) (% offset)) (% word)) ;x[i]
    (xorl (@ x8632::misc-data-offset (% y) (% offset)) (% word))    ;^ y[i]
    (movl (% word) (@ x8632::misc-data-offset (% dest) (% offset)))
    (single-value-return 4)))
---|
500 | |
---|
;;; Compare the digits a[i] and b[i] as unsigned 32-bit quantities and
;;; return the fixnum 0 if they are equal, 1 if a[i] is larger, -1 if a[i]
;;; is smaller.  A arrives on the stack; I is used directly as the byte
;;; offset of the digit.
;;;
;;; Fixes:
;;;  * arg_y holds B, but it was overwritten with the fixnum -1 before b[i]
;;;    was read, so the comparison used a bogus address.  The compare now
;;;    happens first; the following MOVL does not disturb the flags.
;;;  * Bignum digits are raw 32-bit words, so the ordering is decided with
;;;    the unsigned conditions (above/below) instead of the signed ones
;;;    (greater/less), which mis-ordered digits with bit 31 set.
(defx8632lapfunction %compare-digits ((a 4) #|(ra 0)|# (b arg_y) (i arg_z))
  (movl (@ a (% esp)) (% temp0))
  (movl (@ x8632::misc-data-offset (% temp0) (% i)) (% imm0)) ;a[i]
  (xorl (% temp0) (% temp0))            ;fixnum 0 (must precede the compare)
  (movl ($ '1) (% temp1))
  (cmpl (@ x8632::misc-data-offset (% b) (% i)) (% imm0)) ;a[i] - b[i]
  (movl ($ '-1) (% arg_y))              ;b is dead now; MOV keeps the flags
  (cmovzl (% temp0) (% arg_z))
  (cmoval (% temp1) (% arg_z))
  (cmovbl (% arg_y) (% arg_z))
  (single-value-return 3))
---|
512 | |
---|
513 | ;; returns number of bits in digit-hi,digit-lo that are sign bits |
---|
514 | ;; 32 - digits-sign-bits is integer-length |
---|
;;; HI and LO are fixnum halves of a 32-bit digit.  The digit is composed,
;;; complemented if negative so that its sign bits become leading zeros,
;;; and measured with BSR exactly as %BIGNUM-SIGN-BITS does, including the
;;; +1 correction (via SETE) when the adjusted digit is zero.
(defx8632lapfunction %digits-sign-bits ((hi arg_y) (lo arg_z))
  (mark-as-imm temp0)
  (unbox-fixnum lo imm0)
  (shll ($ (- 16 x8632::fixnumshift)) (% hi)) ;boxed hi -> bits 16..31
  (orl (% hi) (% imm0))                 ;imm0 = composed digit
  (movl (% imm0) (% temp0))             ;keep a copy for the sign test
  (not (% imm0))                        ;speculatively complement
  (testl (% temp0) (% temp0))
  (js @complemented)                    ;negative: keep the complement
  (not (% imm0))                        ;non-negative: undo it
  @complemented
  (bsrl (% imm0) (% imm0))              ;index of highest set bit; ZF if none
  (sete (% temp0.b))
  (xorl ($ 31) (% imm0))                ;31 - index
  (addb (% temp0.b) (% imm0.b))
  (box-fixnum imm0 arg_z)
  (mark-as-node temp0)
  (single-value-return))
---|
533 | |
---|
534 | ; if dest not nil store unboxed result in dest(0), else return a fixnum |
---|
;;; Computes (unboxed FIX) AND (lognot BIG[0]).  FIX arrives on the stack.
;;; When DEST is NIL the result is boxed and returned; otherwise the raw
;;; result is stored in DEST[0] and arg_z (DEST) is returned unchanged.
(defx8632lapfunction fix-digit-logandc2 ((fix 4) #|(ra 0)|# (big arg_y) (dest arg_z)) ; index 0
  (mark-as-imm temp0)
  (movl (@ x8632::misc-data-offset (% big)) (% imm0)) ;big[0]
  (not (% imm0))
  (movl (@ fix (% esp)) (% temp0))
  (unbox-fixnum temp0 temp0)
  (andl (% temp0) (% imm0))             ;imm0 = fix & ~big[0]
  (mark-as-node temp0)
  (cmpl ($ x8632::nil-value) (% dest))
  (je @return-fixnum)
  (movl (% imm0) (@ x8632::misc-data-offset (% dest)))
  (single-value-return 3)
  @return-fixnum
  (box-fixnum imm0 arg_z)
  (single-value-return 3))
---|
550 | |
---|
;;; dest[index] := (lognot source[index]).  INDEX arrives on the stack and
;;; is used directly as the byte offset of the digit.
(defx8632lapfunction digit-lognot-move ((index 4) #|(ra 0)|# (source arg_y) (dest arg_z))
  (let ((offset temp0)
        (word imm0))
    (movl (@ index (% esp)) (% offset))
    (movl (@ x8632::misc-data-offset (% source) (% offset)) (% word))
    (not (% word))
    (movl (% word) (@ x8632::misc-data-offset (% dest) (% offset)))
    (single-value-return 3)))
---|
557 | |
---|
558 | ;; Add b to a starting at a[i] |
---|
559 | ;; might want not to use SSE2 for this. use lea to update loop counter |
---|
560 | ;; variables so that the flags don't get set. |
---|
;;; For each of the BLEN digits of B: a[i+n] := low32(a[i+n] + b[n] + carry),
;;; keeping the upper word of the 64-bit sum as the next carry.  After the
;;; loop the remaining carry is added into the following digit of A.
;;; I, BLEN and the B index are byte-scaled (stepped by the fixnum '1).
(defx8632lapfunction bignum-add-loop-+ ((i 8) (a 4) #|(ra 0)|# (b arg_y) (blen arg_z))
  (let ((sum mm2)
        (addend mm3)
        (carry mm4)
        (avec temp0)
        (a-off temp1)
        (b-off imm0))
    (movl (@ i (% esp)) (% a-off))
    (movl (@ a (% esp)) (% avec))
    (pxor (% carry) (% carry))
    (xorl (% b-off) (% b-off))
    @next-digit
    (movd (@ x8632::misc-data-offset (% b) (% b-off)) (% addend))
    (movd (@ x8632::misc-data-offset (% avec) (% a-off)) (% sum))
    (paddq (% addend) (% sum))
    (paddq (% carry) (% sum))
    (movd (% sum) (@ x8632::misc-data-offset (% avec) (% a-off)))
    (psrlq ($ 32) (% sum))              ;upper word is the carry
    (movq (% sum) (% carry))
    (addl ($ '1) (% b-off))
    (addl ($ '1) (% a-off))
    (subl ($ '1) (% blen))
    (jg @next-digit)
    ;; add in final carry
    (movd (% carry) (% imm0))
    (addl (% imm0) (@ x8632::misc-data-offset (% avec) (% a-off)))
    (single-value-return 4)))
---|
585 | |
---|
;;; Scan digits 0 .. COUNT-1 of S1 and S2 (COUNT is a fixnum taken from the
;;; stack) and return T as soon as a pair has a bit in common; return NIL
;;; if the loop runs out first.  The first pair is always examined.
(defx8632lapfunction bignum-logtest-loop ((count 4) #|(ra 0)|# (s1 arg_y) (s2 arg_z))
  (let ((offset temp1)
        (limit temp0)
        (word imm0))
    (xorl (% offset) (% offset))
    (movl (@ count (% esp)) (% limit))
    @scan
    (movl (@ x8632::misc-data-offset (% s1) (% offset)) (% word))
    (test (@ x8632::misc-data-offset (% s2) (% offset)) (% word))
    (jnz @found)
    (addl ($ '1) (% offset))
    (cmpl (% offset) (% limit))
    (jg @scan)                          ;limit > offset: more digits to test
    (movl ($ x8632::nil-value) (% arg_z))
    (single-value-return 3)
    @found
    (movl ($ x8632::t-value) (% arg_z))
    (single-value-return 3)))
---|
603 | |
---|
604 | ;;; called from bignum-ashift-left-unaligned |
---|
;;; Shift BIGNUM left by NBITS bits into RESULT.  J enters as the byte
;;; offset of the first result digit the loop fills; the digit just below
;;; it receives bignum[0] << nbits, each loop step stores
;;; (bignum[n] >> (32 - nbits)) | (bignum[n+1] << nbits), and the digit at
;;; RES-LEN-1 receives the top bits shifted out of the last source digit.
;;;
;;; Fixes:
;;;  * All three stack arguments are now read BEFORE the temporary is
;;;    pushed.  Previously the push came first, so every (@ name (% esp))
;;;    reference was one slot off.
;;;  * The tail used (% bignum), but BIGNUM is a stack offset, not a
;;;    register; the pointer lives in B (temp1).
;;;  * The loop is skipped when J already equals RES-LEN-1.  The old
;;;    do-while form would run at least once and could then never meet its
;;;    exit condition.
;;;
;;; NOTE(review): the final digit is produced with a logical right shift, so
;;; it is zero-filled; confirm whether a sign-propagating shift is intended
;;; for negative bignums.
(defx8632lapfunction bignum-shift-left-loop ((nbits 12) (result 8) (bignum 4) #|(ra 0)|# (res-len-1 arg_y) (j arg_z))
  (let ((r temp0)
        (b temp1)
        (bb mm2)
        (bits mm3)
        (tt mm4)
        (remaining-bits mm5))
    (movl (@ nbits (% esp)) (% imm0))
    (unbox-fixnum imm0 imm0)
    (movd (% imm0) (% bits))            ;shift count
    (negl (% imm0))
    (addl ($ 32) (% imm0))
    (movd (% imm0) (% remaining-bits))  ;32 - nbits
    (movl (@ result (% esp)) (% r))
    (movl (@ bignum (% esp)) (% b))
    ;; Stack offsets are not used past this point.
    (movl (% j) (% imm0))
    (subl ($ '1) (% imm0))
    (pushl (% imm0))                    ;digits
    (xorl (% imm0) (% imm0))            ;source index
    (cmpl (% j) (% res-len-1))
    (je @done)
    @loop
    ;; bignum[i]
    (movd (@ x8632::misc-data-offset (% b) (% imm0)) (% bb))
    (psrlq (% remaining-bits) (% bb))
    ;; bignum[i+1]
    (movd (@ (+ x8632::misc-data-offset 4) (% b) (% imm0)) (% tt))
    (psllq (% bits) (% tt))
    (por (% tt) (% bb))
    (movd (% bb) (@ x8632::misc-data-offset (% r) (% j)))
    (addl ($ '1) (% imm0))
    (addl ($ '1) (% j))
    (cmpl (% j) (% res-len-1))
    (jne @loop)
    @done
    ;; lowest shifted digit
    (movd (@ x8632::misc-data-offset (% b)) (% bb)) ;bignum[0]
    (psllq (% bits) (% bb))
    (popl (% arg_y))                    ;digits
    (movd (% bb) (@ x8632::misc-data-offset (% r) (% arg_y)))
    ;; highest digit
    (movd (@ x8632::misc-data-offset (% b) (% imm0)) (% bb)) ;bignum[i]
    (psrlq (% remaining-bits) (% bb))
    (movd (% bb) (@ x8632::misc-data-offset (% r) (% j)))
    (single-value-return 5)))
---|
645 | |
---|
;;; Return, as a fixnum, the number of 1 bits in the complement of the
;;; digit at byte offset I of BIGNUM.  Each pass clears the lowest set bit
;;; (word AND word-1) and bumps the count; LEA is used for the arithmetic
;;; that must not disturb the flags set by the AND.
(defx8632lapfunction %logcount-complement ((bignum arg_y) (i arg_z))
  (mark-as-imm temp0)
  (let ((word imm0)
        (word-1 temp0))
    (movl (@ x8632::misc-data-offset (% bignum) (% i)) (% word))
    (notl (% word))
    (xorl (% arg_z) (% arg_z))          ;count = 0
    (testl (% word) (% word))
    (je @finished)                      ;no bits set at all
    @clear-lowest
    (lea (@ -1 (% word)) (% word-1))
    (and (% word-1) (% word))           ;sets flags
    (lea (@ '1 (% arg_z)) (% arg_z))    ;doesn't set flags
    (jne @clear-lowest)
    @finished
    (mark-as-node temp0)
    (single-value-return)))
---|
663 | |
---|
;;; Return, as a fixnum, the number of 1 bits in the digit at byte offset I
;;; of BIGNUM.  Each pass clears the lowest set bit (word AND word-1) and
;;; bumps the count; LEA is used for the arithmetic that must not disturb
;;; the flags set by the AND.
(defx8632lapfunction %logcount ((bignum arg_y) (i arg_z))
  (mark-as-imm temp0)
  (let ((word imm0)
        (word-1 temp0))
    (movl (@ x8632::misc-data-offset (% bignum) (% i)) (% word))
    (xorl (% arg_z) (% arg_z))          ;count = 0
    (testl (% word) (% word))
    (je @finished)                      ;no bits set at all
    @clear-lowest
    (lea (@ -1 (% word)) (% word-1))
    (and (% word-1) (% word))           ;sets flags
    (lea (@ '1 (% arg_z)) (% arg_z))    ;doesn't set flags
    (jne @clear-lowest)
    @finished
    (mark-as-node temp0)
    (single-value-return)))
---|
680 | |
---|
681 | |
---|
682 | ;;; floor: given x and y, producing q and r, q * y + r = x. |
---|
683 | |
---|
684 | ;;; Divide bignum x by single digit y (passed as two halves). |
---|
685 | ;;; The quotient is stored in q, and the remainder is returned |
---|
686 | ;;; in two halves. |
---|
;;; Declared arguments: X and Q on the stack (offsets 8 and 4), YHI in
;;; arg_y and YLO in arg_z.
;;; NOTE(review): the body is empty -- there are no instructions and no
;;; return sequence here, so this looks like an unimplemented placeholder.
;;; TODO: implement the division loop before anything calls this.
687 | (defx8632lapfunction %floor-loop-quo ((x 8) (q 4) #|(ra 0)|# (yhi arg_y) (ylo arg_z)) |
---|
688 | ) |
---|
689 | |
---|
690 | |
---|
691 | |
---|