Line data Source code
1 : #line 2 "../src/kernel/none/mp.c"
2 : /* Copyright (C) 2000-2003 The PARI group.
3 :
4 : This file is part of the PARI/GP package.
5 :
6 : PARI/GP is free software; you can redistribute it and/or modify it under the
7 : terms of the GNU General Public License as published by the Free Software
8 : Foundation; either version 2 of the License, or (at your option) any later
9 : version. It is distributed in the hope that it will be useful, but WITHOUT
10 : ANY WARRANTY WHATSOEVER.
11 :
12 : Check the License for details. You should have received a copy of it, along
13 : with the package; see the file 'COPYING'. If not, write to the Free Software
14 : Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. */
15 :
16 : /***********************************************************************/
17 : /** **/
18 : /** MULTIPRECISION KERNEL **/
19 : /** **/
20 : /***********************************************************************/
21 : #include "pari.h"
22 : #include "paripriv.h"
23 : #include "../src/kernel/none/tune-gen.h"
24 :
/* Kernel start-up hook: this kernel has nothing to set up. */
void
pari_kernel_init(void)
{
}
/* Kernel shutdown hook: this kernel has nothing to release. */
void
pari_kernel_close(void)
{
}
/* Version string of the kernel; this kernel reports an empty string. */
const char *
pari_kernel_version(void)
{
  return "";
}
31 :
32 : /* NOTE: arguments of "spec" routines (muliispec, addiispec, etc.) aren't
33 : * GENs but pairs (long *a, long na) representing a list of digits (in basis
34 : * BITS_IN_LONG) : a[0], ..., a[na-1]. [ In order to facilitate splitting: no
35 : * need to reintroduce codewords ] */
36 :
/* LIMBS(x): pointer to x+2, i.e. past the first two words of x.
 * NLIMBS(x): lgefint(x)-2, the number of words that follow those two. */
36 : #define LIMBS(x) ((x)+2)
37 : #define NLIMBS(x) (lgefint(x)-2)
39 :
40 : /* Normalize a nonnegative integer */
/* Strips leading zero words from x and returns the normalized integer.
 * known_zero_words is the number of words, starting at x[2], that the caller
 * already knows to be zero; the scan for the first nonzero word starts right
 * after them. The two codewords are rewritten i words further up, so the
 * returned pointer can differ from the x that was passed in. */
41 : GEN
42 847277238 : int_normalize(GEN x, long known_zero_words)
43 : {
44 847277238 : long i, lx = lgefint(x);
45 : GEN x0;
46 847277238 : if (lx == 2) { x[1] = evalsigne(0) | evallgefint(2); return x; } /* no digits: write the zero codeword */
47 847277238 : if (!known_zero_words && x[2]) return x; /* leading word nonzero: nothing to do */
48 3154966497 : for (i = 2+known_zero_words; i < lx; i++)
49 3088997409 : if (x[i]) break;
50 328105851 : x0 = x; i -= 2; x += i; /* i = number of leading zero words to drop */
51 328105851 : if (x0 == (GEN)avma) set_avma((pari_sp)x); /* x0 sits at avma: just move avma past the dropped words */
52 197048124 : else stackdummy((pari_sp)(x0+i), (pari_sp)x0); /* NOTE(review): presumably marks the dropped words as filler -- confirm */
53 328105851 : lx -= i;
54 328105851 : x[0] = evaltyp(t_INT) | evallg(lx);
55 328105851 : if (lx == 2) x[1] = evalsigne(0) | evallgefint(lx); /* every word was zero */
56 262136763 : else x[1] = evalsigne(1) | evallgefint(lx);
57 328105851 : return x;
58 : }
59 :
60 : /***********************************************************************/
61 : /** **/
62 : /** ADDITION / SUBTRACTION **/
63 : /** **/
64 : /***********************************************************************/
65 :
66 : GEN
67 2247009 : setloop(GEN a)
68 : {
69 2247009 : pari_sp av = avma;
70 2247009 : (void)cgetg(lgefint(a) + 3, t_VECSMALL);
71 2247009 : return icopy_avma(a, av); /* two cells of extra space before a */
72 : }
73 :
74 : /* we had a = setloop(?), then some incloops. Reset a to b */
75 : GEN
76 130656 : resetloop(GEN a, GEN b) {
77 130656 : long lb = lgefint(b);
78 130656 : a += lgefint(a) - lb;
79 130656 : a[0] = evaltyp(t_INT) | evallg(lb);
80 130656 : affii(b, a); return a;
81 : }
82 :
83 : /* assume a > 0, initialized by setloop. Do a++ */
84 : static GEN
85 31953747 : incpos(GEN a)
86 : {
87 31953747 : long i, l = lgefint(a);
88 31953750 : for (i=l-1; i>1; i--)
89 31953747 : if (++a[i]) return a;
90 3 : l++; a--; /* use extra cell */
91 3 : a[0]=evaltyp(t_INT) | _evallg(l);
92 3 : a[1]=evalsigne(1) | evallgefint(l);
93 3 : a[2]=1; return a;
94 : }
95 :
96 : /* assume a < 0, initialized by setloop. Do a++ */
/* Since a < 0, a++ decrements the absolute value by one. The last word is
 * decremented first; a borrow is propagated upward only if that word was 0.
 * When the leading word becomes 0 the integer is shortened by one word
 * (codewords rewritten one cell higher). Returns the, possibly moved, integer. */
97 : static GEN
98 49989 : incneg(GEN a)
99 : {
100 49989 : long i, l = lgefint(a)-1; /* l = index of the last word */
101 49989 : if (uel(a,l)--) /* tests the old value, then decrements */
102 : {
103 49986 : if (l == 2 && !a[2]) /* single-word integer that just became 0 */
104 : {
105 1482 : a++; /* save one cell */
106 1482 : a[0] = evaltyp(t_INT) | _evallg(2);
107 1482 : a[1] = evalsigne(0) | evallgefint(2);
108 : }
109 49986 : return a;
110 : }
/* last word was 0 and wrapped around: borrow from the words above */
111 3 : for (i = l-1;; i--) /* finishes since a[2] != 0 */
112 3 : if (uel(a,i)--) break;
113 3 : if (!a[2])
114 : {
115 3 : a++; /* save one cell */
116 3 : a[0] = evaltyp(t_INT) | _evallg(l); /* l is the old lgefint minus one */
117 3 : a[1] = evalsigne(-1) | evallgefint(l);
118 : }
119 3 : return a;
120 : }
121 :
122 : /* assume a initialized by setloop. Do a++ */
123 : GEN
124 32256207 : incloop(GEN a)
125 : {
126 32256207 : switch(signe(a))
127 : {
128 252471 : case 0: a--; /* use extra cell */
129 252471 : a[0]=evaltyp(t_INT) | _evallg(3);
130 252471 : a[1]=evalsigne(1) | evallgefint(3);
131 252471 : a[2]=1; return a;
132 49989 : case -1: return incneg(a);
133 31953747 : default: return incpos(a);
134 : }
135 : }
136 :
/* Return s + x as a new positive integer, where x is given as the nx words
 * x[0..nx-1] (the last word is the least significant one: it is the one s is
 * added to). The one-word case is delegated to adduu. The result is written
 * downward from the current avma; nx+3 words are reserved (digits, two
 * codewords and one possible carry word) and lz is decremented when the extra
 * carry word turns out not to be needed. */
137 : INLINE GEN
138 2252855481 : adduispec(ulong s, GEN x, long nx)
139 : {
140 2252855481 : GEN xd, zd = (GEN)avma;
141 : long lz;
142 :
143 2252855481 : if (nx == 1) return adduu(s, uel(x,0));
144 738687825 : lz = nx+3; (void)new_chunk(lz);
145 738687825 : xd = x + nx;
146 738687825 : *--zd = (ulong)*--xd + s;
147 738687825 : if ((ulong)*zd < s) /* unsigned sum wrapped around: carry out of the low word */
148 : for(;;)
149 : {
150 263370924 : if (xd == x) { *--zd = 1; break; } /* enlarge z */
151 259659675 : *--zd = ((ulong)*--xd) + 1;
152 259659675 : if (*zd) { lz--; break; } /* carry absorbed */
153 : }
154 482002803 : else lz--;
155 1766042865 : while (xd > x) *--zd = *--xd; /* copy the untouched high words */
156 738687825 : *--zd = evalsigne(1) | evallgefint(lz);
157 738687825 : *--zd = evaltyp(t_INT) | evallg(lz);
158 738687825 : return gc_const((pari_sp)zd, zd);
159 : }
160 :
161 : GEN
162 352286694 : adduispec_offset(ulong s, GEN x, long offset, long nx)
163 : {
164 352286694 : GEN xd = x+lgefint(x)-nx-offset;
165 460601667 : while (nx && *xd==0) {xd++; nx--;}
166 352286694 : if (!nx) return utoi(s);
167 320284554 : return adduispec(s,xd,nx);
168 : }
169 :
/* Return x + y as a new positive integer, where x and y are word arrays of
 * nx and ny words (last word least significant). The operands are swapped if
 * needed so that nx >= ny, and the case ny == 1 is delegated to adduispec.
 * xd, yd, zd point one past the end of x, y and of the result area, and i is
 * a negative index counted from those ends. The carry between words is
 * carried by `overflow` (declared by LOCAL_OVERFLOW, used by addll/addllx),
 * so the order of these calls must not be changed. */
170 : static GEN
171 4405499742 : addiispec(GEN x, GEN y, long nx, long ny)
172 : {
173 : GEN xd, yd, zd;
174 4405499742 : long lz, i = -2;
175 : LOCAL_OVERFLOW;
176 :
177 4405499742 : if (nx < ny) swapspec(x,y, nx,ny);
178 4405499742 : if (ny == 1) return adduispec(*y,x,nx);
179 2541666234 : zd = (GEN)avma;
180 2541666234 : lz = nx+3; (void)new_chunk(lz); /* digits + 2 codewords + 1 possible carry word */
181 2541666234 : xd = x + nx;
182 2541666234 : yd = y + ny;
183 2541666234 : zd[-1] = addll(xd[-1], yd[-1]);
184 : #ifdef addllx8
185 2216132303 : for ( ; i-8 > -ny; i-=8)
186 1368910225 : addllx8(xd+i, yd+i, zd+i, overflow);
187 : #endif
188 34806114868 : for ( ; i >= -ny; i--) zd[i] = addllx(xd[i], yd[i]);
189 2541666234 : if (overflow) /* carry out of the part shared with y: propagate into x alone */
190 : for(;;)
191 : {
192 509826249 : if (i < -nx) { zd[i] = 1; i--; break; } /* enlarge z */
193 336276762 : zd[i] = uel(xd,i) + 1;
194 336276762 : if (zd[i]) { i--; lz--; break; }
195 63458346 : i--;
196 : }
197 2095298331 : else lz--;
198 17992712433 : for (; i >= -nx; i--) zd[i] = xd[i]; /* copy the remaining high words of x */
199 2541666234 : zd += i+1;
200 2541666234 : *--zd = evalsigne(1) | evallgefint(lz);
201 2541666234 : *--zd = evaltyp(t_INT) | evallg(lz);
202 2541666234 : return gc_const((pari_sp)zd, zd);
203 : }
204 :
205 : /* assume x >= s */
/* Return x - s as a new integer, where x is given as the nx words
 * x[0..nx-1] (last word least significant). The one-word case returns
 * utoi(x[0] - s). Otherwise the result is written downward from avma; the
 * borrow out of the low word is reported through `overflow` (set by subll)
 * and propagated through the words above. If the borrow reached the leading
 * word, leading zero words of the result are dropped. */
206 : INLINE GEN
207 1542130266 : subiuspec(GEN x, ulong s, long nx)
208 : {
209 1542130266 : GEN xd, zd = (GEN)avma;
210 : long lz;
211 : LOCAL_OVERFLOW;
212 :
213 1542130266 : if (nx == 1) return utoi(x[0] - s);
214 :
215 350196966 : lz = nx+2; (void)new_chunk(lz);
216 350196966 : xd = x + nx;
217 350196966 : *--zd = subll(*--xd, s);
218 350196966 : if (overflow)
219 : for(;;)
220 : {
221 148035195 : *--zd = ((ulong)*--xd) - 1;
222 148035195 : if (*xd) break; /* this word was nonzero: borrow absorbed */
223 : }
224 350196966 : if (xd == x)
225 240647259 : while (*zd == 0) { zd++; lz--; } /* shorten z */
226 : else
227 4730674962 : do *--zd = *--xd; while (xd > x); /* copy the untouched high words */
228 350196966 : *--zd = evalsigne(1) | evallgefint(lz);
229 350196966 : *--zd = evaltyp(t_INT) | evallg(lz);
230 350196966 : return gc_const((pari_sp)zd, zd);
231 : }
232 :
233 : /* assume x > y */
/* Return x - y as a new positive integer, where x and y are word arrays of
 * nx and ny words (last word least significant). The case ny == 1 is
 * delegated to subiuspec. xd, yd, zd point one past the end of x, y and of
 * the result area; i is a negative index counted from those ends. The borrow
 * between words is carried by `overflow` (subll/subllx), so the order of
 * these calls must not be changed. */
234 : static GEN
235 3311380968 : subiispec(GEN x, GEN y, long nx, long ny)
236 : {
237 : GEN xd,yd,zd;
238 3311380968 : long lz, i = -2;
239 : LOCAL_OVERFLOW;
240 :
241 3311380968 : if (ny==1) return subiuspec(x,*y,nx);
242 1928711496 : zd = (GEN)avma;
243 1928711496 : lz = nx+2; (void)new_chunk(lz);
244 1928711496 : xd = x + nx;
245 1928711496 : yd = y + ny;
246 1928711496 : zd[-1] = subll(xd[-1], yd[-1]);
247 : #ifdef subllx8
248 2117096552 : for ( ; i-8 > -ny; i-=8)
249 1474192720 : subllx8(xd+i, yd+i, zd+i, overflow);
250 : #endif
251 32987399128 : for ( ; i >= -ny; i--) zd[i] = subllx(xd[i], yd[i]);
252 1928711496 : if (overflow) /* borrow out of the part shared with y: propagate into x alone */
253 : for(;;)
254 : {
255 986473311 : zd[i] = uel(xd,i) - 1;
256 986473311 : if (xd[i--]) break; /* this word was nonzero: borrow absorbed */
257 : }
258 1928711496 : if (i>=-nx)
259 4530195099 : for (; i >= -nx; i--) zd[i] = xd[i]; /* copy the remaining high words of x */
260 : else
261 2301106719 : while (zd[i+1] == 0) { i++; lz--; } /* shorten z */
262 1928711496 : zd += i+1;
263 1928711496 : *--zd = evalsigne(1) | evallgefint(lz);
264 1928711496 : *--zd = evaltyp(t_INT) | evallg(lz);
265 1928711496 : return gc_const((pari_sp)zd, zd);
266 : }
267 :
268 : static void
269 443554570 : roundr_up_ip(GEN x, long l)
270 : {
271 443554570 : long i = l;
272 : for(;;)
273 : {
274 444515776 : if (++uel(x,--i)) break;
275 1288989 : if (i == 2) { x[2] = (long)HIGHBIT; shiftr_inplace(x, 1); break; }
276 : }
277 443554570 : }
278 :
/* Assign the integer x to the existing object y, in place: y[1] receives a
 * sign and an exponent, and y[2..ly-1] the leading words of x shifted left
 * by sh = bfffo(x[2]) bits (NOTE(review): presumably the number of leading
 * zero bits of x[2], so that the top bit of y[2] is set -- confirm).
 * If x has fewer words than y, y is padded with zero words; if it has more,
 * the result is rounded up when the first discarded bit is set. */
279 : void
280 320284926 : affir(GEN x, GEN y)
281 : {
282 320284926 : const long s = signe(x), ly = lg(y);
283 : long lx, sh, i;
284 :
285 320284926 : if (!s)
286 : {
287 31123311 : y[1] = evalexpo(-bit_accuracy(ly)); /* x == 0: only the exponent word is written */
288 31123311 : return;
289 : }
290 :
291 289161615 : lx = lgefint(x); sh = bfffo(x[2]);
292 289161615 : y[1] = evalsigne(s) | evalexpo(bit_accuracy(lx)-sh-1);
293 289161615 : if (sh) {
294 284108175 : if (lx <= ly)
295 : {
296 748266834 : for (i=lx; i<ly; i++) y[i]=0;
297 203721966 : shift_left(y,x,2,lx-1, 0,sh);
298 203721966 : return;
299 : }
300 80386209 : shift_left(y,x,2,ly-1, x[ly],sh); /* x[ly] supplies the bits shifted into the last word */
301 : /* lx > ly: round properly */
302 80386209 : if ((uel(x,ly)<<sh) & HIGHBIT) roundr_up_ip(y, ly);
303 : }
304 : else {
305 5053440 : if (lx <= ly)
306 : {
307 4677705 : for (i=2; i<lx; i++) y[i]=x[i];
308 3727707 : for ( ; i<ly; i++) y[i]=0;
309 1271364 : return;
310 : }
311 9517176 : for (i=2; i<ly; i++) y[i]=x[i];
312 : /* lx > ly: round properly */
313 3782076 : if (uel(x,ly) & HIGHBIT) roundr_up_ip(y, ly);
314 : }
315 : }
316 :
/* Return, as a new positive integer, the nx-word array x shifted by n bits:
 * to the left when n > 0, to the right when n < 0; n == 0 returns
 * icopyspec(x, nx). Returns gen_0 when a right shift leaves no nonzero word.
 * NOTE(review): dvmdsBIL(n, &m) presumably returns n / BITS_IN_LONG and
 * stores n % BITS_IN_LONG in m (whole words / leftover bits) -- confirm. */
317 : INLINE GEN
318 1273628508 : shiftispec(GEN x, long nx, long n)
319 : {
320 : long ny, i, m;
321 : GEN y, yd;
322 1273628508 : if (!n) return icopyspec(x, nx);
323 :
324 1187142933 : if (n > 0)
325 : {
326 731212707 : GEN z = (GEN)avma;
327 731212707 : long d = dvmdsBIL(n, &m);
328 :
329 731212707 : ny = nx+d; y = new_chunk(ny + 2); yd = y + 2;
330 6711692991 : for ( ; d; d--) *--z = 0; /* d zero words at the low end of the result */
331 1904318616 : if (!m) for (i=0; i<nx; i++) yd[i]=x[i];
332 : else
333 : {
334 710279727 : const ulong sh = BITS_IN_LONG - m;
335 710279727 : shift_left(yd,x, 0,nx-1, 0,m);
336 710279727 : i = uel(x,0) >> sh; /* bits pushed out of the leading word */
337 : /* Extend y on the left? */
338 710279727 : if (i) { ny++; y = new_chunk(1); y[2] = i; }
339 : }
340 : }
341 : else
342 : {
343 455930226 : ny = nx - dvmdsBIL(-n, &m);
344 455930226 : if (ny<1) return gen_0;
345 454666461 : y = new_chunk(ny + 2); yd = y + 2;
346 454666461 : if (m) {
347 277049931 : shift_right(yd,x, 0,ny, 0,m);
348 277049931 : if (yd[0] == 0) /* leading word vanished: drop it */
349 : {
350 33168849 : if (ny==1) return gc_const((pari_sp)(y+3), gen_0);
351 25521672 : ny--; set_avma((pari_sp)(++y));
352 : }
353 : } else {
354 7407515709 : for (i=0; i<ny; i++) yd[i]=x[i];
355 : }
356 : }
357 1178231991 : y[1] = evalsigne(1)|evallgefint(ny + 2);
358 1178231991 : y[0] = evaltyp(t_INT)|evallg(ny + 2); return y;
359 : }
360 :
361 : GEN
362 48682809 : mantissa2nr(GEN x, long n)
363 : { /*This is a kludge since x is not an integer*/
364 48682809 : long s = signe(x);
365 : GEN y;
366 :
367 48682809 : if(s == 0) return gen_0;
368 48681888 : y = shiftispec(x + 2, lg(x) - 2, n);
369 48681888 : if (signe(y)) setsigne(y, s);
370 48681888 : return y;
371 : }
372 :
/* Return, as a new integer with the sign of x, the leading words of x
 * aligned on its exponent e = expo(x) (the fractional part is discarded).
 * Returns gen_0 when x has sign 0 or e < 0. Raises a precision error via
 * pari_err_PREC when the result would need more words than x holds. */
373 : GEN
374 2613753 : truncr(GEN x)
375 : {
376 : long d,e,i,s,m;
377 : GEN y;
378 :
379 2613753 : if ((s=signe(x)) == 0 || (e=expo(x)) < 0) return gen_0;
380 1101966 : d = nbits2lg(e+1); m = remsBIL(e); /* d: length needed for e+1 bits */
381 1101966 : if (d > lg(x)) pari_err_PREC( "truncr (precision loss in truncation)");
382 :
383 1101963 : y=cgeti(d); y[1] = evalsigne(s) | evallgefint(d);
384 1101963 : if (++m == BITS_IN_LONG) /* word-aligned: plain copy */
385 828 : for (i=2; i<d; i++) y[i]=x[i];
386 : else
387 1101612 : shift_right(y,x, 2,d,0, BITS_IN_LONG - m);
388 1101963 : return y;
389 : }
390 :
391 : /* integral part */
/* Non-negative x is delegated to truncr. For x < 0: returns gen_m1 when
 * expo(x) < 0; otherwise builds the truncated absolute value as in truncr
 * and, if any discarded bit of x is nonzero, adds one to it before giving
 * the result a negative sign. Raises a precision error via pari_err_PREC
 * when the result would need more words than x holds. */
392 : GEN
393 5229609 : floorr(GEN x)
394 : {
395 : long d,e,i,lx,m;
396 : GEN y;
397 :
398 5229609 : if (signe(x) >= 0) return truncr(x);
399 3149277 : if ((e=expo(x)) < 0) return gen_m1;
400 2634081 : d = nbits2lg(e+1); m = remsBIL(e);
401 2634081 : lx=lg(x); if (d>lx) pari_err_PREC( "floorr (precision loss in truncation)");
402 2634081 : y = new_chunk(d);
403 2634081 : if (++m == BITS_IN_LONG)
404 : {
405 501 : for (i=2; i<d; i++) y[i]=x[i];
406 210 : i=d; while (i<lx && !x[i]) i++; /* look for a nonzero discarded word */
407 174 : if (i==lx) goto END; /* none: x is already an integer */
408 : }
409 : else
410 : {
411 2633907 : shift_right(y,x, 2,d,0, BITS_IN_LONG - m);
412 2633907 : if (uel(x,d-1)<<m == 0) /* bits shifted out of the last kept word are all zero */
413 : {
414 313041 : i=d; while (i<lx && !x[i]) i++;
415 83946 : if (i==lx) goto END;
416 : }
417 : }
418 : /* set y:=y+1 */
419 2577546 : for (i=d-1; i>=2; i--) { uel(y,i)++; if (y[i]) goto END; }
420 0 : y=new_chunk(1); y[2]=1; d++; /* carry out of the leading word: one more word */
421 2634081 : END:
422 2634081 : y[1] = evalsigne(-1) | evallgefint(d);
423 2634081 : y[0] = evaltyp(t_INT) | evallg(d); return y;
424 : }
425 :
426 : INLINE int
427 4010332377 : cmpiispec(GEN x, GEN y, long lx, long ly)
428 : {
429 : long i;
430 4010332377 : if (lx < ly) return -1;
431 3744549393 : if (lx > ly) return 1;
432 3724067982 : i = 0; while (i<lx && x[i]==y[i]) i++;
433 3232019637 : if (i==lx) return 0;
434 3011843325 : return (uel(x,i) > uel(y,i))? 1: -1;
435 : }
436 :
437 : INLINE int
438 200780253 : equaliispec(GEN x, GEN y, long lx, long ly)
439 : {
440 : long i;
441 200780253 : if (lx != ly) return 0;
442 368308245 : i = ly-1; while (i>=0 && x[i]==y[i]) i--;
443 200695098 : return i < 0;
444 : }
445 :
446 : /***********************************************************************/
447 : /** **/
448 : /** MULTIPLICATION **/
449 : /** **/
450 : /***********************************************************************/
451 : /* assume ny > 0 */
/* Return x * y as a new positive integer, where y is given as the ny words
 * y[0..ny-1] (last word least significant). The product is written downward
 * from avma; the high half of each word product travels in `hiremainder`
 * (mulll/addmul), so the order of these calls must not be changed. ny+3
 * words are reserved; the extra leading word is used only if the final
 * hiremainder is nonzero. */
452 : INLINE GEN
453 4728432945 : muluispec(ulong x, GEN y, long ny)
454 : {
455 4728432945 : GEN yd, z = (GEN)avma;
456 4728432945 : long lz = ny+3;
457 : LOCAL_HIREMAINDER;
458 :
459 4728432945 : (void)new_chunk(lz);
460 4728432945 : yd = y + ny; *--z = mulll(x, *--yd);
461 15321015060 : while (yd > y) *--z = addmul(x,*--yd);
462 4728432945 : if (hiremainder) *--z = hiremainder; else lz--;
463 4728432945 : *--z = evalsigne(1) | evallgefint(lz);
464 4728432945 : *--z = evaltyp(t_INT) | evallg(lz);
465 4728432945 : return gc_const((pari_sp)z, z);
466 : }
467 :
468 : /* a + b*|Y| */
/* Returns utoi(a) when b == 0 or Y has sign 0. Otherwise proceeds like a
 * single-word multiplication of the words of Y by b, with a added into the
 * lowest word product; the result is a new positive integer written
 * downward from avma. Carries travel in `hiremainder` and `overflow`, so
 * the order of the mulll/addll/addmul calls must not be changed. */
469 : GEN
470 0 : addumului(ulong a, ulong b, GEN Y)
471 : {
472 : GEN yd,y,z;
473 : long ny,lz;
474 : LOCAL_HIREMAINDER;
475 : LOCAL_OVERFLOW;
476 :
477 0 : if (!b || !signe(Y)) return utoi(a);
478 :
479 0 : y = LIMBS(Y); z = (GEN)avma;
480 0 : ny = NLIMBS(Y);
481 0 : lz = ny+3;
482 :
483 0 : (void)new_chunk(lz);
484 0 : yd = y + ny; *--z = addll(a, mulll(b, *--yd));
485 0 : if (overflow) hiremainder++; /* can't overflow */
486 0 : while (yd > y) *--z = addmul(b,*--yd);
487 0 : if (hiremainder) *--z = hiremainder; else lz--; /* extra leading word only if needed */
488 0 : *--z = evalsigne(1) | evallgefint(lz);
489 0 : *--z = evaltyp(t_INT) | evallg(lz);
490 0 : return gc_const((pari_sp)z, z);
491 : }
492 :
493 : /***********************************************************************/
494 : /** **/
495 : /** DIVISION **/
496 : /** **/
497 : /***********************************************************************/
498 :
/* Return y mod x as an unsigned word in [0, x-1]: for y < 0 a nonzero
 * remainder r of |y| is returned as x - r. Raises pari_err_INV when x == 0.
 * The running remainder of the word-by-word division lives in
 * `hiremainder`; when the leading word of y is smaller than x it is used
 * directly as the initial remainder and skipped (ly--, y++). */
499 : ulong
500 1409721822 : umodiu(GEN y, ulong x)
501 : {
502 1409721822 : long sy=signe(y),ly,i;
503 : ulong xi;
504 : LOCAL_HIREMAINDER;
505 :
506 1409721822 : if (!x) pari_err_INV("umodiu",gen_0);
507 1409721822 : if (!sy) return 0;
508 1113077922 : ly = lgefint(y);
509 1113077922 : if (x <= uel(y,2))
510 : {
511 338098998 : hiremainder=0;
512 338098998 : if (ly==3) /* single word: use the native % operator */
513 : {
514 307825944 : hiremainder=uel(y,2)%x;
515 307825944 : if (!hiremainder) return 0;
516 259203309 : return (sy > 0)? hiremainder: x - hiremainder;
517 : }
518 : }
519 : else
520 : {
521 774978924 : if (ly==3) return (sy > 0)? uel(y,2): x - uel(y,2); /* |y| < x */
522 97711413 : hiremainder=uel(y,2); ly--; y++;
523 : }
524 127984467 : xi = get_Fl_red(x); /* NOTE(review): presumably a precomputed inverse of x for divll_pre -- confirm */
525 917650857 : for (i=2; i<ly; i++) (void)divll_pre(y[i],x,xi); /* only the remainder (hiremainder) is kept */
526 127984467 : if (!hiremainder) return 0;
527 122084166 : return (sy > 0)? hiremainder: x - hiremainder;
528 : }
529 :
530 : /* return |y| \/ x */
/* The quotient is returned as a new positive integer (gen_0 when it is
 * zero) and the remainder is stored in *rem. Raises pari_err_INV when
 * x == 0. The running remainder lives in `hiremainder`; when the leading
 * word of y is smaller than x it becomes the initial remainder and the
 * quotient has one word less (ly--, y++). */
531 : GEN
532 270713994 : absdiviu_rem(GEN y, ulong x, ulong *rem)
533 : {
534 : long ly,i;
535 : GEN z;
536 : ulong xi;
537 : LOCAL_HIREMAINDER;
538 :
539 270713994 : if (!x) pari_err_INV("absdiviu_rem",gen_0);
540 270713994 : if (!signe(y)) { *rem = 0; return gen_0; }
541 :
542 253861968 : ly = lgefint(y);
543 253861968 : if (x <= uel(y,2))
544 : {
545 226696221 : hiremainder=0;
546 226696221 : if (ly==3) /* single word: one divll is enough */
547 : {
548 203255340 : z = cgetipos(3);
549 203255340 : z[2] = divll(uel(y,2),x);
550 203255340 : *rem = hiremainder; return z;
551 : }
552 : }
553 : else
554 : {
555 27165747 : if (ly==3) { *rem = uel(y,2); return gen_0; } /* |y| < x */
556 6836649 : hiremainder = uel(y,2); ly--; y++;
557 : }
558 30277530 : xi = get_Fl_red(x);
559 30277530 : z = cgetipos(ly);
560 164447682 : for (i=2; i<ly; i++) z[i]=divll_pre(y[i],x,xi);
561 30277530 : *rem = hiremainder; return z;
562 : }
563 :
564 : GEN
565 65014488 : divis_rem(GEN y, long x, long *rem)
566 : {
567 65014488 : long sy=signe(y),ly,s,i;
568 : GEN z;
569 : ulong xi;
570 : LOCAL_HIREMAINDER;
571 :
572 65014488 : if (!x) pari_err_INV("divis_rem",gen_0);
573 65014488 : if (!sy) { *rem=0; return gen_0; }
574 45958092 : if (x<0) { s = -sy; x = -x; } else s = sy;
575 :
576 45958092 : ly = lgefint(y);
577 45958092 : if ((ulong)x <= uel(y,2))
578 : {
579 31719537 : hiremainder=0;
580 31719537 : if (ly==3)
581 : {
582 31416843 : z = cgeti(3); z[1] = evallgefint(3) | evalsigne(s);
583 31416843 : z[2] = divll(uel(y,2),x);
584 31416843 : if (sy<0) hiremainder = - ((long)hiremainder);
585 31416843 : *rem = (long)hiremainder; return z;
586 : }
587 : }
588 : else
589 : {
590 14238555 : if (ly==3) { *rem = itos(y); return gen_0; }
591 258018 : hiremainder = uel(y,2); ly--; y++;
592 : }
593 560712 : xi = get_Fl_red(x);
594 560712 : z = cgeti(ly); z[1] = evallgefint(ly) | evalsigne(s);
595 2955549 : for (i=2; i<ly; i++) z[i]=divll_pre(y[i],x,xi);
596 560712 : if (sy<0) hiremainder = - ((long)hiremainder);
597 560712 : *rem = (long)hiremainder; return z;
598 : }
599 :
600 : GEN
601 721875 : divis(GEN y, long x)
602 : {
603 721875 : long sy=signe(y),ly,s,i;
604 : ulong xi;
605 : GEN z;
606 : LOCAL_HIREMAINDER;
607 :
608 721875 : if (!x) pari_err_INV("divis",gen_0);
609 721875 : if (!sy) return gen_0;
610 721839 : if (x<0) { s = -sy; x = -x; } else s = sy;
611 :
612 721839 : ly = lgefint(y);
613 721839 : if ((ulong)x <= uel(y,2))
614 : {
615 712815 : hiremainder=0;
616 712815 : if (ly==3)
617 : {
618 643344 : z = cgeti(3); z[1] = evallgefint(3) | evalsigne(s);
619 643344 : z[2] = divll(y[2],x);
620 643344 : return z;
621 : }
622 : }
623 : else
624 : {
625 9024 : if (ly==3) return gen_0;
626 8790 : hiremainder=y[2]; ly--; y++;
627 : }
628 78261 : xi = get_Fl_red(x);
629 78261 : z = cgeti(ly); z[1] = evallgefint(ly) | evalsigne(s);
630 593268 : for (i=2; i<ly; i++) z[i]=divll_pre(y[i],x, xi);
631 78261 : return z;
632 : }
633 :
/* Return the quotient x / y of two t_REAL-style objects (sign and exponent
 * in word 1, digits from word 2 on) as a new t_REAL of length
 * min(lg(x), lg(y)). Raises pari_err_INV when y has sign 0; returns
 * real_0_bit(expo(x)-expo(y)) when x has sign 0.
 * A one-word y (ly == 3) is handled by a single two-word-by-one-word divll.
 * Otherwise a word-by-word long division is run in a scratch area r: each
 * step estimates a quotient word qp from the leading words, corrects it,
 * subtracts qp*y from the running remainder and stores qp. The carry state
 * lives in `hiremainder` / `overflow`, so the statement order matters. */
634 : GEN
635 129495234 : divrr(GEN x, GEN y)
636 : {
637 129495234 : long sx=signe(x), sy=signe(y), lx,ly,lr,e,i,j;
638 : ulong y0,y1;
639 : GEN r, r1;
640 :
641 129495234 : if (!sy) pari_err_INV("divrr",y);
642 129495234 : e = expo(x) - expo(y);
643 129495234 : if (!sx) return real_0_bit(e);
644 129137640 : if (sy<0) sx = -sx; /* sx now holds the sign of the quotient */
645 :
646 129137640 : lx=lg(x); ly=lg(y);
647 129137640 : if (ly==3)
648 : {
649 23492214 : ulong k = x[2], l = (lx>3)? x[3]: 0;
650 : LOCAL_HIREMAINDER;
651 23492214 : if (k < uel(y,2)) e--;
652 : else
653 : { /* shift the two-word numerator (k,l) right by one bit so that k < y[2] */
654 6873000 : l >>= 1; if (k&1) l |= HIGHBIT;
655 6873000 : k >>= 1;
656 : }
657 23492214 : hiremainder = k; k = divll(l,y[2]);
658 23492214 : if (hiremainder > (uel(y,2) >> 1) && !++k) { k = HIGHBIT; e++; } /* round up; wrap-around to 0 bumps the exponent */
659 23492214 : r = cgetg(3, t_REAL);
660 23492214 : r[1] = evalsigne(sx) | evalexpo(e);
661 23492214 : r[2] = k; return r;
662 : }
663 :
664 105645426 : lr = minss(lx,ly); r = new_chunk(lr);
665 105645426 : r1 = r-1;
666 748826913 : r1[1] = 0; for (i=2; i<lr; i++) r1[i]=x[i]; /* scratch copy of x with a leading zero word */
667 105645426 : r1[lr] = (lx>ly)? x[lr]: 0;
668 105645426 : y0 = y[2]; y1 = y[3]; /* two leading words of the divisor */
669 854472339 : for (i=0; i<lr-1; i++)
670 : { /* r1 = r + (i-1), OK up to r1[2] (accesses at most r[lr]) */
671 : ulong k, qp;
672 : LOCAL_HIREMAINDER;
673 : LOCAL_OVERFLOW;
674 :
675 748826913 : if (uel(r1,1) == y0) { qp = ULONG_MAX; k = addll(y0,r1[2]); }
676 : else
677 : {
678 747251595 : if (uel(r1,1) > y0) /* can't happen if i=0 */
679 : {
680 0 : GEN y1 = y+1;
681 0 : j = lr-i; r1[j] = subll(r1[j],y1[j]);
682 0 : for (j--; j>0; j--) r1[j] = subllx(r1[j],y1[j]);
683 0 : j=i; do uel(r,--j)++; while (j && !uel(r,j)); /* add one to the quotient words stored so far */
684 : }
685 747251595 : hiremainder = r1[1]; overflow = 0;
686 747251595 : qp = divll(r1[2],y0); k = hiremainder; /* trial quotient word and its remainder */
687 : }
688 748826913 : j = lr-i+1;
689 748826913 : if (!overflow)
690 : { /* lower qp while the estimate, checked against the second divisor word y1, is too large */
691 : long k3, k4;
692 747576060 : k3 = mulll(qp,y1);
693 747576060 : if (j == 3) /* i = lr - 2 maximal, r1[3] undefined -> 0 */
694 105577905 : k4 = subll(hiremainder,k);
695 : else
696 : {
697 641998155 : k3 = subll(k3, r1[3]);
698 641998155 : k4 = subllx(hiremainder,k);
699 : }
700 990517766 : while (!overflow && k4) { qp--; k3 = subll(k3,y1); k4 = subllx(k4,y0); }
701 : }
702 748826913 : if (j<ly) (void)mulll(qp,y[j]); else { hiremainder = 0 ; j = ly; }
703 4959446397 : for (j--; j>1; j--)
704 : { /* running remainder -= qp * y, word by word */
705 4210619484 : r1[j] = subll(r1[j], addmul(qp,y[j]));
706 4210619484 : hiremainder += overflow;
707 : }
708 748826913 : if (uel(r1,1) != hiremainder)
709 : {
710 596829 : if (uel(r1,1) < hiremainder)
711 : { /* qp was one too large: add y back */
712 596829 : qp--;
713 596829 : j = lr-i-(lr-i>=ly); r1[j] = addll(r1[j], y[j]);
714 3311730 : for (j--; j>1; j--) r1[j] = addllx(r1[j], y[j]);
715 : }
716 : else
717 : { /* qp was too small: keep subtracting y and increasing qp */
718 0 : r1[1] -= hiremainder;
719 0 : while (r1[1])
720 : {
721 0 : qp++; if (!qp) { j=i; do uel(r,--j)++; while (j && !r[j]); }
722 0 : j = lr-i-(lr-i>=ly); r1[j] = subll(r1[j],y[j]);
723 0 : for (j--; j>1; j--) r1[j] = subllx(r1[j],y[j]);
724 0 : r1[1] -= overflow;
725 : }
726 : }
727 : }
728 748826913 : *++r1 = qp; /* store the quotient word and advance */
729 : }
730 : /* i = lr-1 */
731 : /* round correctly */
732 105645426 : if (uel(r1,1) > (y0>>1))
733 : {
734 51897576 : j=i; do uel(r,--j)++; while (j && !r[j]);
735 : }
736 748826913 : r1 = r-1; for (j=i; j>=2; j--) r[j]=r1[j]; /* move the quotient words up by one to make room for r[1] */
737 105645426 : if (r[0] == 0) e--;
738 45957714 : else if (r[0] == 1) { shift_right(r,r, 2,lr, 1,1); }
739 : else { /* possible only when rounding up to 0x2 0x0 ... */
740 6 : r[2] = (long)HIGHBIT; e++;
741 : }
742 105645426 : r[0] = evaltyp(t_REAL)|evallg(lr);
743 105645426 : r[1] = evalsigne(sx) | evalexpo(e);
744 105645426 : return r;
745 : }
746 :
747 : GEN
748 113279049 : divri(GEN x, GEN y)
749 : {
750 113279049 : long lx, s = signe(y);
751 : pari_sp av;
752 : GEN z;
753 :
754 113279049 : if (!s) pari_err_INV("divri",y);
755 113279049 : if (!signe(x)) return real_0_bit(expo(x) - expi(y));
756 113109138 : if (!is_bigint(y)) {
757 88908852 : GEN z = divru(x, y[2]);
758 88908852 : if (s < 0) togglesign(z);
759 88908852 : return z;
760 : }
761 24200286 : lx = lg(x); z = cgetg(lx, t_REAL); av = avma;
762 24200286 : affrr(divrr(x, itor(y, lg2prec(lx+1))), z);
763 24200286 : return gc_const(av, z);
764 : }
765 :
766 : /* Integer division x / y: such that sign(r) = sign(x)
767 : * if z = ONLY_REM return remainder, otherwise return quotient
768 : * if z != NULL set *z to remainder
769 : * *z is the last object on stack (and thus can be disposed of with cgiv
770 : * instead of gerepile)
771 : * If *z is zero, we put gen_0 here and no copy.
772 : * space needed: lx + ly */
/* Outline of the code below:
 *  - x == 0 and one-word y are handled first (umodiu / absdiviu_rem);
 *  - if x has fewer words than y, or as many words but a smaller absolute
 *    value, the quotient is 0 and the remainder is a copy of x (TRIVIAL);
 *  - otherwise (DIVIDE) x and y are copied, shifted left by
 *    sh = bfffo(y[2]) bits, and divided word by word with a trial quotient
 *    qp estimated from the leading words; the quotient words overwrite the
 *    top of the scratch copy of x and the remainder is left in its bottom;
 *  - finally quotient and/or remainder are moved to the top of the stack,
 *    the remainder being shifted back right by sh bits.
 * Raises pari_err_INV when y == 0. Carry state lives in `hiremainder` /
 * `overflow`, so the statement order matters. */
773 : GEN
774 1474728540 : dvmdii(GEN x, GEN y, GEN *z)
775 : {
776 1474728540 : long sx = signe(x), sy = signe(y);
777 1474728540 : long lx, ly = lgefint(y), lz, i, j, sh, lq, lr;
778 : pari_sp av;
779 : ulong y0,y0i,y1, *xd,*rd,*qd;
780 : GEN q, r, r1;
781 :
782 1474728540 : if (!sx)
783 : {
784 52868412 : if (ly < 3) pari_err_INV("dvmdii",gen_0);
785 52868409 : if (!z || z == ONLY_REM) return gen_0;
786 32208144 : *z=gen_0; return gen_0;
787 : }
788 1421860128 : if (ly <= 3)
789 : { /* divisor fits in one word */
790 : ulong rem;
791 652614438 : if (ly < 3) pari_err_INV("dvmdii",gen_0);
792 652614438 : if (z == ONLY_REM)
793 : {
794 450910602 : rem = umodiu(x,uel(y,2));
795 450910602 : if (!rem) return gen_0;
796 408503592 : return (sx < 0)? utoineg(uel(y,2) - rem): utoipos(rem); /* umodiu returned y[2]-r for negative x: undo it */
797 : }
798 201703836 : q = absdiviu_rem(x, uel(y,2), &rem);
799 201703836 : if (sx != sy) togglesign(q);
800 201703836 : if (!z) return q;
801 198487347 : if (!rem) *z = gen_0;
802 54387069 : else *z = sx < 0? utoineg(rem): utoipos(rem);
803 198487347 : return q;
804 : }
805 769245690 : lx=lgefint(x);
806 769245690 : lz=lx-ly;
807 769245690 : if (lz <= 0)
808 : {
809 375582753 : if (lz == 0)
810 : { /* same length: compare word by word */
811 328163064 : for (i=2; i<lx; i++)
812 327539652 : if (x[i] != y[i])
813 : {
814 311384571 : if (uel(x,i) > uel(y,i)) goto DIVIDE;
815 45772695 : goto TRIVIAL;
816 : }
/* |x| == |y|: quotient is +-1, remainder 0 */
817 623412 : if (z == ONLY_REM) return gen_0;
818 66051 : if (z) *z = gen_0;
819 66051 : if (sx < 0) sy = -sy;
820 66051 : return stoi(sy);
821 : }
822 63574770 : TRIVIAL:
823 109347465 : if (z == ONLY_REM) return icopy(x);
824 2085705 : if (z) *z = icopy(x);
825 2085705 : return gen_0;
826 : }
827 393662937 : DIVIDE: /* quotient is nonzero */
828 659274813 : av=avma; if (sx<0) sy = -sy; /* sy now holds the sign of the quotient */
829 659274813 : r1 = new_chunk(lx); sh = bfffo(y[2]);
830 659274813 : if (sh)
831 : { /* normalize so that highbit(y) = 1 (shift left x and y by sh bits)*/
832 650481006 : const ulong m = BITS_IN_LONG - sh;
833 650481006 : r = new_chunk(ly);
834 650481006 : shift_left(r, y,2,ly-1, 0,sh); y = r;
835 650481006 : shift_left(r1,x,2,lx-1, 0,sh);
836 650481006 : r1[1] = uel(x,2) >> m; /* bits shifted out of the leading word of x */
837 : }
838 : else
839 : {
840 91076055 : r1[1] = 0; for (j=2; j<lx; j++) r1[j] = x[j];
841 : }
842 659274813 : x = r1;
843 659274813 : y0 = y[2]; y0i = get_Fl_red(y0);
844 659274813 : y1 = y[3];
845 2868050679 : for (i=0; i<=lz; i++)
846 : { /* r1 = x + i */
847 : ulong k, qp;
848 : LOCAL_HIREMAINDER;
849 : LOCAL_OVERFLOW;
850 :
851 2208775866 : if (uel(r1,1) == y0)
852 : {
853 48831 : qp = ULONG_MAX; k = addll(y0,r1[2]);
854 : }
855 : else
856 : {
857 2208727035 : hiremainder = r1[1]; overflow = 0;
858 2208727035 : qp = divll_pre(r1[2],y0,y0i); k = hiremainder; /* trial quotient word and its remainder */
859 : }
860 2208775866 : if (!overflow)
861 : { /* lower qp while the estimate, checked against the second divisor word y1, is too large */
862 2208726088 : long k3 = subll(mulll(qp,y1), r1[3]);
863 2208726088 : long k4 = subllx(hiremainder,k);
864 2685960012 : while (!overflow && k4) { qp--; k3 = subll(k3,y1); k4 = subllx(k4,y0); }
865 : }
866 2208775866 : hiremainder = 0; j = ly;
867 63957812088 : for (j--; j>1; j--)
868 : { /* running remainder -= qp * y, word by word */
869 61749036222 : r1[j] = subll(r1[j], addmul(qp,y[j]));
870 61749036222 : hiremainder += overflow;
871 : }
872 2208775866 : if (uel(r1,1) < hiremainder)
873 : { /* qp was one too large: add y back */
874 5912085 : qp--;
875 5912085 : j = ly-1; r1[j] = addll(r1[j],y[j]);
876 31187909 : for (j--; j>1; j--) r1[j] = addllx(r1[j],y[j]);
877 : }
878 2208775866 : *++r1 = qp; /* store the quotient word and advance */
879 : }
880 :
881 659274813 : lq = lz+2;
882 659274813 : if (!z)
883 : { /* quotient only: copy it to the top of the stack */
884 2811789 : qd = (ulong*)av;
885 2811789 : xd = (ulong*)(x + lq);
886 2811789 : if (x[1]) { lz++; lq++; } /* leading quotient word is nonzero: keep it */
887 34975101 : while (lz--) *--qd = *--xd;
888 2811789 : *--qd = evalsigne(sy) | evallgefint(lq);
889 2811789 : *--qd = evaltyp(t_INT) | evallg(lq);
890 2811789 : return gc_const((pari_sp)qd, (GEN)qd);
891 : }
892 :
893 748083432 : j=lq; while (j<lx && !x[j]) j++; /* skip leading zero words of the remainder */
894 656463024 : lz = lx-j;
895 656463024 : if (z == ONLY_REM)
896 : {
897 376953501 : if (lz==0) return gc_const(av, gen_0);
898 367708290 : rd = (ulong*)av; lr = lz+2;
899 367708290 : xd = (ulong*)(x + lx);
900 399897102 : if (!sh) while (lz--) *--rd = *--xd;
901 : else
902 : { /* shift remainder right by sh bits */
903 359685099 : const ulong shl = BITS_IN_LONG - sh;
904 : ulong l;
905 359685099 : xd--;
906 1222601472 : while (--lz) /* fill r[3..] */
907 : {
908 862916373 : l = *xd >> sh;
909 862916373 : *--rd = l | (*--xd << shl);
910 : }
911 359685099 : l = *xd >> sh;
912 359685099 : if (l) *--rd = l; else lr--; /* drop the leading word if the shift emptied it */
913 : }
914 367708290 : *--rd = evalsigne(sx) | evallgefint(lr);
915 367708290 : *--rd = evaltyp(t_INT) | evallg(lr);
916 367708290 : return gc_const((pari_sp)rd, (GEN)rd);
917 : }
918 :
/* both quotient and remainder are wanted */
919 279509523 : lr = lz+2;
920 279509523 : rd = NULL; /* gcc -Wall */
921 279509523 : if (lz)
922 : { /* non zero remainder: initialize rd */
923 274920417 : xd = (ulong*)(x + lx);
924 274920417 : if (!sh)
925 : {
926 569856 : rd = (ulong*)avma; (void)new_chunk(lr);
927 5775018 : while (lz--) *--rd = *--xd;
928 : }
929 : else
930 : { /* shift remainder right by sh bits */
931 274350561 : const ulong shl = BITS_IN_LONG - sh;
932 : ulong l;
933 274350561 : rd = (ulong*)x; /* overwrite shifted y */
934 274350561 : xd--;
935 1224382335 : while (--lz)
936 : {
937 950031774 : l = *xd >> sh;
938 950031774 : *--rd = l | (*--xd << shl);
939 : }
940 274350561 : l = *xd >> sh;
941 274350561 : if (l) *--rd = l; else lr--;
942 : }
943 274920417 : *--rd = evalsigne(sx) | evallgefint(lr);
944 274920417 : *--rd = evaltyp(t_INT) | evallg(lr);
945 274920417 : rd += lr; /* rd now points one past the end of the temporary remainder */
946 : }
947 279509523 : qd = (ulong*)av;
948 279509523 : xd = (ulong*)(x + lq);
949 279509523 : if (x[1]) lq++;
950 874662678 : j = lq-2; while (j--) *--qd = *--xd;
951 279509523 : *--qd = evalsigne(sy) | evallgefint(lq);
952 279509523 : *--qd = evaltyp(t_INT) | evallg(lq);
953 279509523 : q = (GEN)qd;
954 279509523 : if (lr==2) *z = gen_0;
955 : else
956 : { /* rd has been properly initialized: we had lz > 0 */
957 1874187177 : while (lr--) *--qd = *--rd; /* copy the remainder right below the quotient */
958 274920417 : *z = (GEN)qd;
959 : }
960 279509523 : return gc_const((pari_sp)qd, q);
961 : }
962 :
963 : /* Montgomery reduction.
964 : * N has k words, assume T >= 0 has less than 2k.
965 : * Return res := T / B^k mod N, where B = 2^BIL
966 : * such that 0 <= res < T/B^k + N and res has less than k words */
/* inv is the word multiplied with the current lowest word of T to obtain m
 * such that the lowest word of T + m*N vanishes (see the "= 0" comments
 * below). NOTE(review): this presumably requires inv = -1/N mod B --
 * confirm against the callers.
 * Returns gen_0 when N or T has no words. k == 1 is special-cased; for
 * k >= 2 the computation runs in a 2k-word scratch area at the top of the
 * stack and the result is then moved up to avma. */
967 : GEN
968 39035064 : red_montgomery(GEN T, GEN N, ulong inv)
969 : {
970 : pari_sp av;
971 : GEN Te, Td, Ne, Nd, scratch;
972 39035064 : ulong i, j, m, t, d, k = NLIMBS(N);
973 : int carry;
974 : LOCAL_HIREMAINDER;
975 : LOCAL_OVERFLOW;
976 :
977 39035064 : if (k == 0) return gen_0;
978 39035064 : d = NLIMBS(T); /* <= 2*k */
979 39035064 : if (d == 0) return gen_0;
980 : #ifdef DEBUG
981 : if (d > 2*k) pari_err_BUG("red_montgomery");
982 : #endif
983 39035055 : if (k == 1)
984 : { /* as below, special cased for efficiency */
985 163341 : ulong n = uel(N,2);
986 163341 : if (d == 1) {
987 163194 : hiremainder = uel(T,2);
988 163194 : m = hiremainder * inv;
989 163194 : (void)addmul(m, n); /* t + m*n = 0 */
990 163194 : return utoi(hiremainder);
991 : } else { /* d = 2 */
992 147 : hiremainder = uel(T,3);
993 147 : m = hiremainder * inv;
994 147 : (void)addmul(m, n); /* t + m*n = 0 */
995 147 : t = addll(hiremainder, uel(T,2));
996 147 : if (overflow) t -= n; /* t > n doesn't fit in 1 word */
997 147 : return utoi(t);
998 : }
999 : }
1000 : /* assume k >= 2 */
1001 38871714 : av = avma; scratch = new_chunk(k<<1); /* >= k + 2: result fits */
1002 :
1003 : /* copy T to scratch space (pad with zeroes to 2k words) */
1004 38871714 : Td = (GEN)av;
1005 38871714 : Te = T + (d+2);
1006 855180453 : for (i=0; i < d ; i++) *--Td = *--Te;
1007 64883187 : for ( ; i < (k<<1); i++) *--Td = 0;
1008 :
1009 38871714 : Te = (GEN)av; /* 1 beyond end of current T mantissa (in scratch) */
1010 38871714 : Ne = N + k+2; /* 1 beyond end of N mantissa */
1011 :
1012 38871714 : carry = 0;
1013 460031820 : for (i=0; i<k; i++) /* set T := T/B mod N, k times */
1014 : {
1015 421160106 : Td = Te; /* one beyond end of (new) T mantissa */
1016 421160106 : Nd = Ne;
1017 421160106 : hiremainder = *--Td;
1018 421160106 : m = hiremainder * inv; /* solve T + m N = O(B) */
1019 :
1020 : /* set T := (T + mN) / B */
1021 421160106 : Te = Td;
1022 421160106 : (void)addmul(m, *--Nd); /* = 0 */
1023 6860316678 : for (j=1; j<k; j++)
1024 : {
1025 6439156572 : t = addll(addmul(m, *--Nd), *--Td);
1026 6439156572 : *Td = t;
1027 6439156572 : hiremainder += overflow;
1028 : }
1029 421160106 : t = addll(hiremainder, *--Td); *Td = t + carry;
1030 421160106 : carry = (overflow || (carry && *Td == 0)); /* carry out of the top word, kept for the next round */
1031 : }
1032 38871714 : if (carry)
1033 : { /* Td > N overflows (k+1 words), set Td := Td - N */
1034 373056 : Td = Te;
1035 373056 : Nd = Ne;
1036 373056 : t = subll(*--Td, *--Nd); *Td = t;
1037 6971085 : while (Td > scratch) { t = subllx(*--Td, *--Nd); *Td = t; }
1038 : }
1039 :
1040 : /* copy result */
1041 38871714 : Td = (GEN)av;
1042 42614829 : while (*scratch == 0 && Te > scratch) scratch++; /* strip leading 0s */
1043 456288705 : while (Te > scratch) *--Td = *--Te;
1044 38871714 : k = (GEN)av - Td; if (!k) return gc_const(av, gen_0); /* k is reused as the word count of the result */
1045 38871714 : k += 2;
1046 38871714 : *--Td = evalsigne(1) | evallgefint(k);
1047 38871714 : *--Td = evaltyp(t_INT) | evallg(k);
1048 : #ifdef DEBUG
1049 : {
1050 : long l = NLIMBS(N), s = BITS_IN_LONG*l;
1051 : GEN R = int2n(s);
1052 : GEN res = remii(mulii(T, Fp_inv(R, N)), N);
1053 : if (k > lgefint(N)
1054 : || !equalii(remii(Td,N),res)
1055 : || cmpii(Td, addii(shifti(T, -s), N)) >= 0) pari_err_BUG("red_montgomery");
1056 : }
1057 : #endif
1058 38871714 : return gc_const((pari_sp)Td, Td);
1059 : }
1060 :
1061 : /* EXACT INTEGER DIVISION */
1062 :
1063 : /* assume xy>0, the division is exact and y is odd. Destroy x */
1064 : static GEN
1065 29475291 : diviuexact_i(GEN x, ulong y)
1066 : {
1067 : long i, lz, lx;
1068 : ulong q, yinv;
1069 : GEN z, z0, x0, x0min;
1070 :
1071 29475291 : if (y == 1) return icopy(x);
1072 23835717 : lx = lgefint(x);
1073 23835717 : if (lx == 3)
1074 : {
1075 850569 : q = uel(x,2) / y;
1076 850569 : if (!q) pari_err_OP("exact division", x, utoi(y));
1077 850569 : return utoipos(q);
1078 : }
1079 22985148 : yinv = invmod2BIL(y);
1080 22985148 : lz = (y <= uel(x,2)) ? lx : lx-1;
1081 22985148 : z = new_chunk(lz);
1082 22985148 : z0 = z + lz;
1083 22985148 : x0 = x + lx; x0min = x + lx-lz+2;
1084 :
1085 82949883 : while (x0 > x0min)
1086 : {
1087 59964735 : *--z0 = q = yinv*uel(--x0,0); /* i-th quotient */
1088 59964735 : if (!q) continue;
1089 : /* x := x - q * y */
1090 : { /* update neither lowest word (could set it to 0) nor highest ones */
1091 59437692 : GEN x1 = x0 - 1;
1092 : LOCAL_HIREMAINDER;
1093 59437692 : (void)mulll(q,y);
1094 59437692 : if (hiremainder)
1095 : {
1096 47650680 : if (uel(x1,0) < hiremainder)
1097 : {
1098 138306 : uel(x1,0) -= hiremainder;
1099 140310 : do uel(--x1,0)--; while (uel(x1,0) == ULONG_MAX);
1100 : }
1101 : else
1102 47512374 : uel(x1,0) -= hiremainder;
1103 : }
1104 : }
1105 : }
1106 22985148 : i=2; while(!z[i]) i++;
1107 22985148 : z += i-2; lz -= i-2;
1108 22985148 : z[0] = evaltyp(t_INT)|evallg(lz);
1109 22985148 : z[1] = evalsigne(1)|evallg(lz);
1110 22985148 : if (lz == 2) pari_err_OP("exact division", x, utoi(y));
1111 22985148 : return gc_const((pari_sp)z, z);
1112 : }
1113 :
1114 : /* assume y != 0 and the division is exact */
1115 : GEN
1116 22143957 : diviuexact(GEN x, ulong y)
1117 : {
1118 : pari_sp av;
1119 22143957 : long lx, vy, s = signe(x);
1120 : GEN z;
1121 :
1122 22143957 : if (!s) return gen_0;
1123 21297498 : if (y == 1) return icopy(x);
1124 18305922 : lx = lgefint(x);
1125 18305922 : if (lx == 3) {
1126 14215116 : ulong q = uel(x,2) / y;
1127 14215116 : if (!q) pari_err_OP("exact division", x, utoi(y));
1128 14215116 : return (s > 0)? utoipos(q): utoineg(q);
1129 : }
1130 4090806 : av = avma; (void)new_chunk(lx); vy = vals(y);
1131 4090806 : if (vy) {
1132 1582641 : y >>= vy;
1133 1582641 : if (y == 1) { set_avma(av); return shifti(x, -vy); }
1134 754287 : x = shifti(x, -vy);
1135 754287 : if (lx == 3) {
1136 0 : ulong q = uel(x,2) / y;
1137 0 : set_avma(av);
1138 0 : if (!q) pari_err_OP("exact division", x, utoi(y));
1139 0 : return (s > 0)? utoipos(q): utoineg(q);
1140 : }
1141 2508165 : } else x = icopy(x);
1142 3262452 : set_avma(av);
1143 3262452 : z = diviuexact_i(x, y);
1144 3262452 : setsigne(z, s); return z;
1145 : }
1146 :
1147 : /* Find z such that x=y*z, knowing that y | x (unchecked)
1148 : * Method: y0 z0 = x0 mod B = 2^BITS_IN_LONG ==> z0 = 1/y0 mod B.
1149 : * Set x := (x - z0 y) / B, updating only relevant words, and repeat */
1150 : GEN
1151 375851376 : diviiexact(GEN x, GEN y)
1152 : {
1153 375851376 : long lx, ly, lz, vy, i, ii, sx = signe(x), sy = signe(y);
1154 : pari_sp av;
1155 : ulong y0inv,q;
1156 : GEN z;
1157 :
1158 375851376 : if (!sy) pari_err_INV("diviiexact",gen_0);
1159 375851376 : if (!sx) return gen_0;
1160 309229683 : lx = lgefint(x);
1161 309229683 : if (lx == 3) {
1162 246026049 : q = uel(x,2) / uel(y,2);
1163 246026049 : if (!q) pari_err_OP("exact division", x, y);
1164 246026049 : return (sx+sy) ? utoipos(q): utoineg(q);
1165 : }
1166 63203634 : vy = vali(y); av = avma;
1167 63203634 : (void)new_chunk(lx); /* enough room for z */
1168 63203634 : if (vy)
1169 : { /* make y odd */
1170 32232819 : y = shifti(y,-vy);
1171 32232819 : x = shifti(x,-vy); lx = lgefint(x);
1172 : }
1173 30970815 : else x = icopy(x); /* necessary because we destroy x */
1174 63203634 : set_avma(av); /* will erase our x,y when exiting */
1175 : /* now y is odd */
1176 63203634 : ly = lgefint(y);
1177 63203634 : if (ly == 3)
1178 : {
1179 26212839 : z = diviuexact_i(x,uel(y,2)); /* x != 0 */
1180 26212839 : setsigne(z, (sx+sy)? 1: -1); return z;
1181 : }
1182 36990795 : y0inv = invmod2BIL(y[ly-1]);
1183 58222677 : i=2; while (i<ly && y[i]==x[i]) i++;
1184 36990795 : lz = (i==ly || uel(y,i) < uel(x,i)) ? lx-ly+3 : lx-ly+2;
1185 36990795 : z = new_chunk(lz);
1186 :
1187 36990795 : y += ly - 1; /* now y[-i] = i-th word of y */
1188 173558436 : for (ii=lx-1,i=lz-1; i>=2; i--,ii--)
1189 : {
1190 : long limj;
1191 : LOCAL_HIREMAINDER;
1192 : LOCAL_OVERFLOW;
1193 :
1194 136567641 : z[i] = q = y0inv*uel(x,ii); /* i-th quotient */
1195 136567641 : if (!q) continue;
1196 :
1197 : /* x := x - q * y */
1198 136436784 : (void)mulll(q,y[0]); limj = maxss(lx - lz, ii+3-ly);
1199 : { /* update neither lowest word (could set it to 0) nor highest ones */
1200 136436784 : GEN x0 = x + (ii - 1), y0 = y - 1, xlim = x + limj;
1201 2318052651 : for (; x0 >= xlim; x0--, y0--)
1202 : {
1203 2181615867 : *x0 = subll(*x0, addmul(q,*y0));
1204 2181615867 : hiremainder += overflow;
1205 : }
1206 136436784 : if (hiremainder && limj != lx - lz)
1207 : {
1208 72248997 : if ((ulong)*x0 < hiremainder)
1209 : {
1210 835950 : *x0 -= hiremainder;
1211 835950 : do (*--x0)--; while ((ulong)*x0 == ULONG_MAX);
1212 : }
1213 : else
1214 71413047 : *x0 -= hiremainder;
1215 : }
1216 : }
1217 : }
1218 36990795 : i=2; while(!z[i]) i++;
1219 36990795 : z += i-2; lz -= (i-2);
1220 36990795 : z[0] = evaltyp(t_INT)|evallg(lz);
1221 36990795 : z[1] = evalsigne((sx+sy)? 1: -1) | evallg(lz);
1222 36990795 : if (lz == 2) pari_err_OP("exact division", x, y);
1223 36990795 : return gc_const((pari_sp)z, z);
1224 : }
1225 :
1226 : /* assume yz != and yz | x */
1227 : GEN
1228 149130 : diviuuexact(GEN x, ulong y, ulong z)
1229 : {
1230 : long tmp[4];
1231 : ulong t;
1232 : LOCAL_HIREMAINDER;
1233 149130 : t = mulll(y, z);
1234 149130 : if (!hiremainder) return diviuexact(x, t);
1235 0 : tmp[0] = evaltyp(t_INT)|_evallg(4);
1236 0 : tmp[1] = evalsigne(1)|evallgefint(4);
1237 0 : tmp[2] = hiremainder;
1238 0 : tmp[3] = t;
1239 0 : return diviiexact(x, tmp);
1240 : }
1241 :
1242 : /********************************************************************/
1243 : /** **/
1244 : /** INTEGER MULTIPLICATION (BASECASE) **/
1245 : /** **/
1246 : /********************************************************************/
1247 : /* nx >= ny = num. of digits of x, y (not GEN, see mulii) */
1248 : INLINE GEN
1249 5077985760 : muliispec_basecase(GEN x, GEN y, long nx, long ny)
1250 : {
1251 : GEN z2e,z2d,yd,xd,ye,zd;
1252 : long p1,lz;
1253 : LOCAL_HIREMAINDER;
1254 :
1255 5077985760 : if (ny == 1) return muluispec((ulong)*y, x, nx);
1256 1082617239 : if (ny == 0) return gen_0;
1257 1081396128 : zd = (GEN)avma; lz = nx+ny+2;
1258 1081396128 : (void)new_chunk(lz);
1259 1081396128 : xd = x + nx;
1260 1081396128 : yd = y + ny;
1261 1081396128 : ye = yd; p1 = *--xd;
1262 :
1263 1081396128 : *--zd = mulll(p1, *--yd); z2e = zd;
1264 8677572906 : while (yd > y) *--zd = addmul(p1, *--yd);
1265 1081396128 : *--zd = hiremainder;
1266 :
1267 10038451926 : while (xd > x)
1268 : {
1269 : LOCAL_OVERFLOW;
1270 8957055798 : yd = ye; p1 = *--xd;
1271 :
1272 8957055798 : z2d = --z2e;
1273 8957055798 : *z2d = addll(mulll(p1, *--yd), *z2d); z2d--;
1274 >11103*10^7 : while (yd > y)
1275 : {
1276 >10208*10^7 : hiremainder += overflow;
1277 >10208*10^7 : *z2d = addll(addmul(p1, *--yd), *z2d); z2d--;
1278 : }
1279 8957055798 : *--zd = hiremainder + overflow;
1280 : }
1281 1081396128 : if (*zd == 0) { zd++; lz--; } /* normalize */
1282 1081396128 : *--zd = evalsigne(1) | evallgefint(lz);
1283 1081396128 : *--zd = evaltyp(t_INT) | evallg(lz);
1284 1081396128 : return gc_const((pari_sp)zd, zd);
1285 : }
1286 :
1287 : INLINE GEN
1288 899883450 : sqrispec_basecase(GEN x, long nx)
1289 : {
1290 : GEN z2e,z2d,yd,xd,zd,x0,z0;
1291 : long p1,lz;
1292 : LOCAL_HIREMAINDER;
1293 : LOCAL_OVERFLOW;
1294 :
1295 899883450 : if (nx == 1) return sqru((ulong)*x);
1296 602566983 : if (nx == 0) return gen_0;
1297 220558554 : zd = (GEN)avma; lz = (nx+1) << 1;
1298 220558554 : z0 = new_chunk(lz);
1299 220558554 : if (nx == 1)
1300 : {
1301 0 : *--zd = mulll(*x, *x);
1302 0 : *--zd = hiremainder; goto END;
1303 : }
1304 220558554 : xd = x + nx;
1305 :
1306 : /* compute double products --> zd */
1307 220558554 : p1 = *--xd; yd = xd; --zd;
1308 220558554 : *--zd = mulll(p1, *--yd); z2e = zd;
1309 1199552496 : while (yd > x) *--zd = addmul(p1, *--yd);
1310 220558554 : *--zd = hiremainder;
1311 :
1312 220558554 : x0 = x+1;
1313 1199552496 : while (xd > x0)
1314 : {
1315 : LOCAL_OVERFLOW;
1316 978993942 : p1 = *--xd; yd = xd;
1317 :
1318 978993942 : z2e -= 2; z2d = z2e;
1319 978993942 : *z2d = addll(mulll(p1, *--yd), *z2d); z2d--;
1320 7867791111 : while (yd > x)
1321 : {
1322 6888797169 : hiremainder += overflow;
1323 6888797169 : *z2d = addll(addmul(p1, *--yd), *z2d); z2d--;
1324 : }
1325 978993942 : *--zd = hiremainder + overflow;
1326 : }
1327 : /* multiply zd by 2 (put result in zd - 1) */
1328 220558554 : zd[-1] = ((*zd & HIGHBIT) != 0);
1329 220558554 : shift_left(zd, zd, 0, (nx<<1)-3, 0, 1);
1330 :
1331 : /* add the squares */
1332 220558554 : xd = x + nx; zd = z0 + lz;
1333 220558554 : p1 = *--xd;
1334 220558554 : zd--; *zd = mulll(p1,p1);
1335 220558554 : zd--; *zd = addll(hiremainder, *zd);
1336 1420111050 : while (xd > x)
1337 : {
1338 1199552496 : p1 = *--xd;
1339 1199552496 : zd--; *zd = addll(mulll(p1,p1)+ overflow, *zd);
1340 1199552496 : zd--; *zd = addll(hiremainder + overflow, *zd);
1341 : }
1342 :
1343 220558554 : END:
1344 220558554 : if (*zd == 0) { zd++; lz--; } /* normalize */
1345 220558554 : *--zd = evalsigne(1) | evallgefint(lz);
1346 220558554 : *--zd = evaltyp(t_INT) | evallg(lz);
1347 220558554 : return gc_const((pari_sp)zd, zd);
1348 : }
1349 :
1350 : /********************************************************************/
1351 : /** **/
1352 : /** INTEGER MULTIPLICATION (FFT) **/
1353 : /** **/
1354 : /********************************************************************/
1355 :
1356 : /*
1357 : Compute parameters for FFT:
1358 : len: result length
1359 : k: FFT depth.
1360 : n: number of blocks (2^k)
1361 : bs: block size
1362 : mod: Modulus is M=2^(BIL*mod)+1
1363 : ord: order of 2 in Z/MZ.
1364 : We must have:
1365 : bs*n >= l
1366 : 2^(BIL*mod) > nb*2^(2*BIL*bs)
1367 : 2^k | 2*BIL*mod
1368 : */
1369 : static void
1370 85068 : mulliifft_params(long len, long *k, long *mod, long *bs, long *n, ulong *ord)
1371 : {
1372 : long r;
1373 85068 : *k = expu((3*len)>>2)-3;
1374 : do {
1375 85071 : (*k)--;
1376 85071 : r = *k-(TWOPOTBITS_IN_LONG+2);
1377 85071 : *n = 1L<<*k;
1378 85071 : *bs = (len+*n-1)>>*k;
1379 85071 : *mod= 2**bs+1;
1380 85071 : if (r>0)
1381 5145 : *mod=((*mod+(1L<<r)-1)>>r)<<r;
1382 85071 : } while(*mod>=3**bs);
1383 85068 : *ord= 4**mod*BITS_IN_LONG;
1384 85068 : }
1385 :
1386 : /* Zf_: arithmetic in ring Z/MZ where M= 2^(BITS_IN_LONG*mod)+1
1387 : * for some mod.
1388 : * Do not garbage collect.
1389 : */
1390 :
1391 : static GEN
1392 186970176 : Zf_add(GEN a, GEN b, GEN M)
1393 : {
1394 186970176 : GEN y, z = addii(a,b);
1395 186970176 : long mod = lgefint(M)-3;
1396 186970176 : long l = NLIMBS(z);
1397 186970176 : if (l<=mod) return z;
1398 72435387 : y = subiu(z, 1);
1399 72435387 : if (NLIMBS(y)<=mod) return z;
1400 72435387 : return int_normalize(y,1);
1401 : }
1402 :
1403 : static GEN
1404 190355244 : Zf_sub(GEN a, GEN b, GEN M)
1405 : {
1406 190355244 : GEN z = subii(a,b);
1407 190355244 : return signe(z)>=0? z: addii(M,z);
1408 : }
1409 :
1410 : /* destroy z */
1411 : static GEN
1412 397737516 : Zf_red_destroy(GEN z, GEN M)
1413 : {
1414 397737516 : long mod = lgefint(M)-3;
1415 397737516 : long l = NLIMBS(z);
1416 : GEN y;
1417 397737516 : if (l<=mod) return z;
1418 176535555 : y = shifti(z, -mod*BITS_IN_LONG);
1419 176535555 : z = int_normalize(z, NLIMBS(y));
1420 176535555 : y = Zf_red_destroy(y, M);
1421 176535555 : z = subii(z, y);
1422 176535555 : if (signe(z)<0) z = addii(z, M);
1423 176535555 : return z;
1424 : }
1425 :
1426 : INLINE GEN
1427 205469481 : Zf_shift(GEN a, ulong s, GEN M) { return Zf_red_destroy(shifti(a, s), M); }
1428 :
1429 : /*
1430 : Multiply by sqrt(2)^s
1431 : We use the formula sqrt(2)=z_8*(1-z_4)) && z_8=2^(ord/16) [2^(ord/4)+1]
1432 : */
1433 :
1434 : static GEN
1435 186970176 : Zf_mulsqrt2(GEN a, ulong s, ulong ord, GEN M)
1436 : {
1437 186970176 : ulong hord = ord>>1;
1438 186970176 : if (!signe(a)) return gen_0;
1439 182966865 : if (odd(s)) /* Multiply by 2^(s/2) */
1440 : {
1441 3385068 : GEN az8 = Zf_shift(a, ord>>4, M);
1442 3385068 : GEN az83 = Zf_shift(az8, ord>>3, M);
1443 3385068 : a = Zf_sub(az8, az83, M);
1444 3385068 : s--;
1445 : }
1446 182966865 : if (s < hord)
1447 135920298 : return Zf_shift(a, s>>1, M);
1448 : else
1449 47046567 : return subii(M,Zf_shift(a, (s-hord)>>1, M));
1450 : }
1451 :
1452 : INLINE GEN
1453 448896 : Zf_sqr(GEN a, GEN M) { return Zf_red_destroy(sqri(a), M); }
1454 :
1455 : INLINE GEN
1456 15283584 : Zf_mul(GEN a, GEN b, GEN M) { return Zf_red_destroy(mulii(a,b), M); }
1457 :
1458 : /* In place, bit reversing FFT */
1459 : static void
1460 30847587 : muliifft_dit(ulong o, ulong ord, GEN M, GEN FFT, long d, long step)
1461 : {
1462 30847587 : pari_sp av = avma;
1463 : long i;
1464 30847587 : ulong j, no = (o<<1)%ord;
1465 30847587 : long hstep=step>>1;
1466 154836003 : for (i = d+1, j = 0; i <= d+hstep; ++i, j =(j+o)%ord)
1467 : {
1468 123988416 : GEN a = Zf_add(gel(FFT,i), gel(FFT,i+hstep), M);
1469 123988416 : GEN b = Zf_mulsqrt2(Zf_sub(gel(FFT,i), gel(FFT,i+hstep), M), j, ord, M);
1470 123988416 : affii(a,gel(FFT,i));
1471 123988416 : affii(b,gel(FFT,i+hstep));
1472 123988416 : set_avma(av);
1473 : }
1474 30847587 : if (hstep>1)
1475 : {
1476 15339555 : muliifft_dit(no, ord, M, FFT, d, hstep);
1477 15339555 : muliifft_dit(no, ord, M, FFT, d+hstep, hstep);
1478 : }
1479 30847587 : }
1480 :
1481 : /* In place, bit reversed FFT, inverse of muliifft_dit */
1482 : static void
1483 15647412 : muliifft_dis(ulong o, ulong ord, GEN M, GEN FFT, long d, long step)
1484 : {
1485 15647412 : pari_sp av = avma;
1486 : long i;
1487 15647412 : ulong j, no = (o<<1)%ord;
1488 15647412 : long hstep=step>>1;
1489 15647412 : if (hstep>1)
1490 : {
1491 7781172 : muliifft_dis(no, ord, M, FFT, d, hstep);
1492 7781172 : muliifft_dis(no, ord, M, FFT, d+hstep, hstep);
1493 : }
1494 78629172 : for (i = d+1, j = 0; i <= d+hstep; ++i, j =(j+o)%ord)
1495 : {
1496 62981760 : GEN z = Zf_mulsqrt2(gel(FFT,i+hstep), j, ord, M);
1497 62981760 : GEN a = Zf_add(gel(FFT,i), z, M);
1498 62981760 : GEN b = Zf_sub(gel(FFT,i), z, M);
1499 62981760 : affii(a,gel(FFT,i));
1500 62981760 : affii(b,gel(FFT,i+hstep));
1501 62981760 : set_avma(av);
1502 : }
1503 15647412 : }
1504 :
1505 : static GEN
1506 168477 : muliifft_spliti(GEN a, long na, long bs, long n, long mod)
1507 : {
1508 168477 : GEN ap = a+na-1;
1509 168477 : GEN c = cgetg(n+1, t_VEC);
1510 : long i,j;
1511 31184541 : for(i=1;i<=n;i++)
1512 : {
1513 31016064 : GEN z = cgeti(mod+3);
1514 31016064 : if (na)
1515 : {
1516 15272730 : long m = minss(bs, na), v=0;
1517 15272730 : GEN zp, aa=ap-m+1;
1518 83147766 : while (!*aa && v<m) {aa++; v++;}
1519 15272730 : zp = z+m-v+1;
1520 380188806 : for (j=v; j < m; j++)
1521 364916076 : *zp-- = *ap--;
1522 15272730 : ap -= v; na -= m;
1523 15272730 : z[1] = evalsigne(m!=v) | evallgefint(m-v+2);
1524 : } else
1525 15743334 : z[1] = evalsigne(0) | evallgefint(2);
1526 31016064 : gel(c, i) = z;
1527 : }
1528 168477 : return c;
1529 : }
1530 :
1531 : static GEN
1532 85068 : muliifft_unspliti(GEN V, long bs, long len)
1533 : {
1534 85068 : long s, i, j, l = lg(V);
1535 85068 : GEN a = cgeti(len);
1536 85068 : a[1] = evalsigne(1)|evallgefint(len);
1537 439674603 : for(i=2;i<len;i++)
1538 439589535 : a[i] = 0;
1539 15817548 : for(i=1, s=0; i<l; i++, s+=bs)
1540 : {
1541 15732480 : GEN u = gel(V,i);
1542 15732480 : if (signe(u))
1543 : {
1544 15158649 : GEN ap = int_W(a,s);
1545 15158649 : GEN up = int_LSW(u);
1546 15158649 : long lu = NLIMBS(u);
1547 : LOCAL_OVERFLOW;
1548 15158649 : *ap = addll(*ap, *up--); ap--;
1549 859648563 : for (j=1; j<lu; j++)
1550 844489914 : { *ap = addllx(*ap, *up--); ap--; }
1551 15161205 : while (overflow)
1552 2556 : { *ap = addll(*ap, 1); ap--; }
1553 : }
1554 : }
1555 85068 : return int_normalize(a,0);
1556 : }
1557 :
1558 : static GEN
1559 1659 : sqrispec_fft(GEN a, long na)
1560 : {
1561 1659 : pari_sp av, ltop = avma;
1562 1659 : long len = 2*na;
1563 : long k, mod, bs, n;
1564 : GEN FFT, M;
1565 : long i;
1566 : ulong o, ord;
1567 :
1568 1659 : mulliifft_params(len,&k,&mod,&bs,&n,&ord);
1569 1659 : o = ord>>k;
1570 1659 : M = int2n(mod*BITS_IN_LONG);
1571 1659 : M[2+mod] = 1;
1572 1659 : FFT = muliifft_spliti(a, na, bs, n, mod);
1573 1659 : muliifft_dit(o, ord, M, FFT, 0, n);
1574 1659 : av = avma;
1575 450555 : for(i=1; i<=n; i++)
1576 : {
1577 448896 : affii(Zf_sqr(gel(FFT,i), M), gel(FFT,i));
1578 448896 : set_avma(av);
1579 : }
1580 1659 : muliifft_dis(ord-o, ord, M, FFT, 0, n);
1581 450555 : for(i=1; i<=n; i++)
1582 : {
1583 448896 : affii(Zf_shift(gel(FFT,i), (ord>>1)-k, M), gel(FFT,i));
1584 448896 : set_avma(av);
1585 : }
1586 1659 : return gerepileuptoint(ltop, muliifft_unspliti(FFT,bs,2+len));
1587 : }
1588 :
1589 : static GEN
1590 83409 : muliispec_fft(GEN a, GEN b, long na, long nb)
1591 : {
1592 83409 : pari_sp av, av2, ltop = avma;
1593 83409 : long len = na+nb;
1594 : long k, mod, bs, n;
1595 : GEN FFT, FFTb, M;
1596 : long i;
1597 : ulong o, ord;
1598 :
1599 83409 : mulliifft_params(len,&k,&mod,&bs,&n,&ord);
1600 83409 : o = ord>>k;
1601 83409 : M = int2n(mod*BITS_IN_LONG);
1602 83409 : M[2+mod] = 1;
1603 83409 : FFT = muliifft_spliti(a, na, bs, n, mod);
1604 83409 : av=avma;
1605 83409 : muliifft_dit(o, ord, M, FFT, 0, n);
1606 83409 : FFTb = muliifft_spliti(b, nb, bs, n, mod);
1607 83409 : av2 = avma;
1608 83409 : muliifft_dit(o, ord, M, FFTb, 0, n);
1609 15366993 : for(i=1; i<=n; i++)
1610 : {
1611 15283584 : affii(Zf_mul(gel(FFT,i), gel(FFTb,i), M), gel(FFT,i));
1612 15283584 : set_avma(av2);
1613 : }
1614 83409 : set_avma(av);
1615 83409 : muliifft_dis(ord-o, ord, M, FFT, 0, n);
1616 15366993 : for(i=1; i<=n; i++)
1617 : {
1618 15283584 : affii(Zf_shift(gel(FFT,i),(ord>>1)-k,M), gel(FFT,i));
1619 15283584 : set_avma(av);
1620 : }
1621 83409 : return gerepileuptoint(ltop, muliifft_unspliti(FFT,bs,2+len));
1622 : }
1623 :
1624 : /********************************************************************/
1625 : /** **/
1626 : /** INTEGER MULTIPLICATION (KARATSUBA) **/
1627 : /** **/
1628 : /********************************************************************/
1629 :
1630 : /* return (x shifted left d words) + y. Assume d > 0, x > 0 and y >= 0 */
1631 : static GEN
1632 651793083 : addshiftw(GEN x, GEN y, long d)
1633 : {
1634 651793083 : GEN z,z0,y0,yd, zd = (GEN)avma;
1635 651793083 : long a,lz,ly = lgefint(y);
1636 :
1637 651793083 : z0 = new_chunk(d);
1638 651793083 : a = ly-2; yd = y+ly;
1639 651793083 : if (a >= d)
1640 : {
1641 11113552596 : y0 = yd-d; while (yd > y0) *--zd = *--yd; /* copy last d words of y */
1642 647196495 : a -= d;
1643 647196495 : if (a)
1644 414883269 : z = addiispec(LIMBS(x), LIMBS(y), NLIMBS(x), a);
1645 : else
1646 232313226 : z = icopy(x);
1647 : }
1648 : else
1649 : {
1650 17050149 : y0 = yd-a; while (yd > y0) *--zd = *--yd; /* copy last a words of y */
1651 69975840 : while (zd > z0) *--zd = 0; /* complete with 0s */
1652 4596588 : z = icopy(x);
1653 : }
1654 651793083 : lz = lgefint(z)+d;
1655 651793083 : z[1] = evalsigne(1) | evallgefint(lz);
1656 651793083 : z[0] = evaltyp(t_INT) | evallg(lz); return z;
1657 : }
1658 :
1659 : /* Fast product (Karatsuba) of integers. a and b are "special" GENs
1660 : * c,c0,c1,c2 are genuine GENs.
1661 : */
1662 : GEN
1663 5281303014 : muliispec(GEN a, GEN b, long na, long nb)
1664 : {
1665 : GEN a0,c,c0;
1666 : long n0, n0a, i;
1667 : pari_sp av;
1668 :
1669 5281303014 : if (na < nb) swapspec(a,b, na,nb);
1670 5281303014 : if (nb < MULII_KARATSUBA_LIMIT) return muliispec_basecase(a,b,na,nb);
1671 203317254 : if (nb >= MULII_FFT_LIMIT) return muliispec_fft(a,b,na,nb);
1672 203233845 : i=(na>>1); n0=na-i; na=i;
1673 203233845 : av=avma; a0=a+na; n0a=n0;
1674 302787756 : while (n0a && !*a0) { a0++; n0a--; }
1675 :
1676 203233845 : if (n0a && nb > n0)
1677 199743744 : { /* nb <= na <= n0 */
1678 : GEN b0,c1,c2;
1679 : long n0b;
1680 :
1681 199743744 : nb -= n0;
1682 199743744 : c = muliispec(a,b,na,nb);
1683 199743744 : b0 = b+nb; n0b = n0;
1684 283769784 : while (n0b && !*b0) { b0++; n0b--; }
1685 199743744 : if (n0b)
1686 : {
1687 198978306 : c0 = muliispec(a0,b0, n0a,n0b);
1688 :
1689 198978306 : c2 = addiispec(a0,a, n0a,na);
1690 198978306 : c1 = addiispec(b0,b, n0b,nb);
1691 198978306 : c1 = muliispec(LIMBS(c1),LIMBS(c2), NLIMBS(c1),NLIMBS(c2));
1692 198978306 : c2 = addiispec(LIMBS(c0),LIMBS(c), NLIMBS(c0),NLIMBS(c));
1693 :
1694 198978306 : c1 = subiispec(LIMBS(c1),LIMBS(c2), NLIMBS(c1),NLIMBS(c2));
1695 : }
1696 : else
1697 : {
1698 765438 : c0 = gen_0;
1699 765438 : c1 = muliispec(a0,b, n0a,nb);
1700 : }
1701 199743744 : c = addshiftw(c,c1, n0);
1702 : }
1703 : else
1704 : {
1705 3490101 : c = muliispec(a,b,na,nb);
1706 3490101 : c0 = muliispec(a0,b,n0a,nb);
1707 : }
1708 203233845 : return gerepileuptoint(av, addshiftw(c,c0, n0));
1709 : }
1710 : GEN
1711 165798 : muluui(ulong x, ulong y, GEN z)
1712 : {
1713 165798 : long t, s = signe(z);
1714 : GEN r;
1715 : LOCAL_HIREMAINDER;
1716 :
1717 165798 : if (!x || !y || !signe(z)) return gen_0;
1718 165501 : t = mulll(x,y);
1719 165501 : if (!hiremainder)
1720 165501 : r = muluispec(t, z+2, lgefint(z)-2);
1721 : else
1722 : {
1723 : long tmp[2];
1724 0 : tmp[0] = hiremainder;
1725 0 : tmp[1] = t;
1726 0 : r = muliispec(z+2,tmp,lgefint(z)-2,2);
1727 : }
1728 165501 : setsigne(r,s); return r;
1729 : }
1730 :
1731 : #define sqrispec_mirror sqrispec
1732 : #define muliispec_mirror muliispec
1733 :
1734 : /* x % (2^n), assuming n >= 0 */
1735 : GEN
1736 18481644 : remi2n(GEN x, long n)
1737 : {
1738 18481644 : long hi,l,k,lx,ly, sx = signe(x);
1739 : GEN z, xd, zd;
1740 :
1741 18481644 : if (!sx || !n) return gen_0;
1742 :
1743 18459015 : k = dvmdsBIL(n, &l);
1744 18459015 : lx = lgefint(x);
1745 18459015 : if (lx < k+3) return icopy(x);
1746 :
1747 18072429 : xd = x + (lx-k-1);
1748 : /* x = |_|...|#|1|...|k| : copy the last l bits of # and the last k words
1749 : * ^--- initial xd */
1750 18072429 : hi = ((ulong)*xd) & ((1UL<<l)-1); /* last l bits of # = top bits of result */
1751 18072429 : if (!hi)
1752 : { /* strip leading zeroes from result */
1753 828492 : xd++; while (k && !*xd) { k--; xd++; }
1754 800958 : if (!k) return gen_0;
1755 602100 : ly = k+2; xd--;
1756 : }
1757 : else
1758 17271471 : ly = k+3;
1759 :
1760 17873571 : zd = z = cgeti(ly);
1761 17873571 : *++zd = evalsigne(sx) | evallgefint(ly);
1762 17873571 : if (hi) *++zd = hi;
1763 102033615 : for ( ;k; k--) *++zd = *++xd;
1764 17873571 : return z;
1765 : }
1766 :
1767 : GEN
1768 907228368 : sqrispec(GEN a, long na)
1769 : {
1770 : GEN a0,c;
1771 : long n0, n0a, i;
1772 : pari_sp av;
1773 :
1774 907228368 : if (na < SQRI_KARATSUBA_LIMIT) return sqrispec_basecase(a,na);
1775 7344918 : if (na >= SQRI_FFT_LIMIT) return sqrispec_fft(a,na);
1776 7343259 : i=(na>>1); n0=na-i; na=i;
1777 7343259 : av=avma; a0=a+na; n0a=n0;
1778 11582631 : while (n0a && !*a0) { a0++; n0a--; }
1779 7343259 : c = sqrispec(a,na);
1780 7343259 : if (n0a)
1781 : {
1782 7333731 : GEN t, c1, c0 = sqrispec(a0,n0a);
1783 : #if 0
1784 : c1 = shifti(muliispec(a0,a, n0a,na),1);
1785 : #else /* faster */
1786 7333731 : t = addiispec(a0,a,n0a,na);
1787 7333731 : t = sqrispec(LIMBS(t),NLIMBS(t));
1788 7333731 : c1= addiispec(LIMBS(c0),LIMBS(c), NLIMBS(c0), NLIMBS(c));
1789 7333731 : c1= subiispec(LIMBS(t),LIMBS(c1), NLIMBS(t), NLIMBS(c1));
1790 : #endif
1791 7333731 : c = addshiftw(c,c1, n0);
1792 7333731 : c = addshiftw(c,c0, n0);
1793 : }
1794 : else
1795 9528 : c = addshiftw(c,gen_0,n0<<1);
1796 7343259 : return gerepileuptoint(av, c);
1797 : }
1798 :
1799 : /********************************************************************/
1800 : /** **/
1801 : /** KARATSUBA SQUARE ROOT **/
1802 : /** adapted from Paul Zimmermann's implementation of **/
1803 : /** his algorithm in GMP (mpn_sqrtrem) **/
1804 : /** **/
1805 : /********************************************************************/
1806 :
/* Square roots table: entry q-64, for 64 <= q < 256, is the 8-bit starting
 * approximation used by p_sqrtu1 for a 16-bit value whose top byte is q */
static const unsigned char approx_tab[192] = {
  128,128,129,130,131,132,133,134,135,136,137,138,139,140,141,142,
  143,144,144,145,146,147,148,149,150,150,151,152,153,154,155,155,
  156,157,158,159,160,160,161,162,163,163,164,165,166,167,167,168,
  169,170,170,171,172,173,173,174,175,176,176,177,178,178,179,180,
  181,181,182,183,183,184,185,185,186,187,187,188,189,189,190,191,
  192,192,193,193,194,195,195,196,197,197,198,199,199,200,201,201,
  202,203,203,204,204,205,206,206,207,208,208,209,209,210,211,211,
  212,212,213,214,214,215,215,216,217,217,218,218,219,219,220,221,
  221,222,222,223,224,224,225,225,226,226,227,227,228,229,229,230,
  230,231,231,232,232,233,234,234,235,235,236,236,237,237,238,238,
  239,240,240,241,241,242,242,243,243,244,244,245,245,246,246,247,
  247,248,248,249,249,250,250,251,251,252,252,253,253,254,254,255
};
1822 :
1823 : /* N[0], assume N[0] >= 2^(BIL-2).
1824 : * Return r,s such that s^2 + r = N, 0 <= r <= 2s */
1825 : static void
1826 94643775 : p_sqrtu1(ulong *N, ulong *ps, ulong *pr)
1827 : {
1828 94643775 : ulong prec, r, s, q, u, n0 = N[0];
1829 :
1830 94643775 : q = n0 >> (BITS_IN_LONG - 8);
1831 : /* 2^6 = 64 <= q < 256 = 2^8 */
1832 94643775 : s = approx_tab[q - 64]; /* 128 <= s < 255 */
1833 94643775 : r = (n0 >> (BITS_IN_LONG - 16)) - s * s; /* r <= 2*s */
1834 94643775 : if (r > (s << 1)) { r -= (s << 1) | 1; s++; }
1835 :
1836 : /* 8-bit approximation from the high 8-bits of N[0] */
1837 94643775 : prec = 8;
1838 94643775 : n0 <<= 2 * prec;
1839 283931325 : while (2 * prec < BITS_IN_LONG)
1840 : { /* invariant: s has prec bits, and r <= 2*s */
1841 189287550 : r = (r << prec) + (n0 >> (BITS_IN_LONG - prec));
1842 189287550 : n0 <<= prec;
1843 189287550 : u = 2 * s;
1844 189287550 : q = r / u; u = r - q * u;
1845 189287550 : s = (s << prec) + q;
1846 189287550 : u = (u << prec) + (n0 >> (BITS_IN_LONG - prec));
1847 189287550 : q = q * q;
1848 189287550 : r = u - q;
1849 189287550 : if (u < q) { s--; r += (s << 1) | 1; }
1850 189287550 : n0 <<= prec;
1851 189287550 : prec = 2 * prec;
1852 : }
1853 94643775 : *ps = s;
1854 94643775 : *pr = r;
1855 94643775 : }
1856 :
1857 : /* N[0..1], assume N[0] >= 2^(BIL-2).
1858 : * Return 1 if remainder overflows, 0 otherwise */
1859 : static int
1860 91944042 : p_sqrtu2(ulong *N, ulong *ps, ulong *pr)
1861 : {
1862 91944042 : ulong cc, qhl, r, s, q, u, n1 = N[1];
1863 : LOCAL_OVERFLOW;
1864 :
1865 91944042 : p_sqrtu1(N, &s, &r); /* r <= 2s */
1866 137535726 : qhl = 0; while (r >= s) { qhl++; r -= s; }
1867 : /* now r < s < 2^(BIL/2) */
1868 91944042 : r = (r << BITS_IN_HALFULONG) | (n1 >> BITS_IN_HALFULONG);
1869 91944042 : u = s << 1;
1870 91944042 : q = r / u; u = r - q * u;
1871 91944042 : q += (qhl & 1) << (BITS_IN_HALFULONG - 1);
1872 91944042 : qhl >>= 1;
1873 : /* (initial r)<<(BIL/2) + n1>>(BIL/2) = (qhl<<(BIL/2) + q) * 2s + u */
1874 91944042 : s = ((s + qhl) << BITS_IN_HALFULONG) + q;
1875 91944042 : cc = u >> BITS_IN_HALFULONG;
1876 91944042 : r = (u << BITS_IN_HALFULONG) | (n1 & LOWMASK);
1877 91944042 : r = subll(r, q * q);
1878 91944042 : cc -= overflow + qhl;
1879 : /* now subtract 2*q*2^(BIL/2) + 2^BIL if qhl is set */
1880 91944042 : if ((long)cc < 0)
1881 : {
1882 23460060 : if (s) {
1883 23407119 : r = addll(r, s);
1884 23407119 : cc += overflow;
1885 23407119 : s--;
1886 : } else {
1887 52941 : cc++;
1888 52941 : s = ~0UL;
1889 : }
1890 23460060 : r = addll(r, s);
1891 23460060 : cc += overflow;
1892 : }
1893 91944042 : *ps = s;
1894 91944042 : *pr = r; return cc;
1895 : }
1896 :
1897 : static void
1898 90882495 : xmpn_zero(GEN x, long n)
1899 : {
1900 694998138 : while (--n >= 0) x[n]=0;
1901 90882495 : }
1902 : static void
1903 1068008355 : xmpn_copy(GEN z, GEN x, long n)
1904 : {
1905 1068008355 : long k = n;
1906 4196846487 : while (--k >= 0) z[k] = x[k];
1907 1068008355 : }
1908 : /* a[0..la-1] * 2^(lb BIL) | b[0..lb-1] */
1909 : static GEN
1910 468277008 : catii(GEN a, long la, GEN b, long lb)
1911 : {
1912 468277008 : long l = la + lb + 2;
1913 468277008 : GEN z = cgetipos(l);
1914 468277008 : xmpn_copy(LIMBS(z), a, la);
1915 468277008 : xmpn_copy(LIMBS(z) + la, b, lb);
1916 468277008 : return int_normalize(z, 0);
1917 : }
1918 :
1919 : /* sqrt n[0..1], assume n normalized */
1920 : static GEN
1921 91669023 : sqrtispec2(GEN n, GEN *pr)
1922 : {
1923 : ulong s, r;
1924 91669023 : int hi = p_sqrtu2((ulong*)n, &s, &r);
1925 91669023 : GEN S = utoi(s);
1926 91669023 : *pr = hi? uutoi(1,r): utoi(r);
1927 91669023 : return S;
1928 : }
1929 :
1930 : /* sqrt n[0], _dont_ assume n normalized */
1931 : static GEN
1932 2699733 : sqrtispec1_sh(GEN n, GEN *pr)
1933 : {
1934 : GEN S;
1935 2699733 : ulong r, s, u0 = uel(n,0);
1936 2699733 : int sh = bfffo(u0) & ~1UL;
1937 2699733 : if (sh) u0 <<= sh;
1938 2699733 : p_sqrtu1(&u0, &s, &r);
1939 : /* s^2 + r = u0, s < 2^(BIL/2). Rescale back:
1940 : * 2^(2k) n = S^2 + R
1941 : * so 2^(2k) n = (S - s0)^2 + (2*S*s0 - s0^2 + R), s0 = S mod 2^k. */
1942 2699733 : if (sh) {
1943 1629615 : int k = sh >> 1;
1944 1629615 : ulong s0 = s & ((1L<<k) - 1);
1945 1629615 : r += s * (s0<<1);
1946 1629615 : s >>= k;
1947 1629615 : r >>= sh;
1948 : }
1949 2699733 : S = utoi(s);
1950 2699733 : if (pr) *pr = utoi(r);
1951 2699733 : return S;
1952 : }
1953 :
1954 : /* sqrt n[0..1], _dont_ assume n normalized */
1955 : static GEN
1956 275019 : sqrtispec2_sh(GEN n, GEN *pr)
1957 : {
1958 : GEN S;
1959 275019 : ulong U[2], r, s, u0 = uel(n,0), u1 = uel(n,1);
1960 275019 : int hi, sh = bfffo(u0) & ~1UL;
1961 275019 : if (sh) {
1962 247056 : u0 = (u0 << sh) | (u1 >> (BITS_IN_LONG-sh));
1963 247056 : u1 <<= sh;
1964 : }
1965 275019 : U[0] = u0;
1966 275019 : U[1] = u1; hi = p_sqrtu2(U, &s, &r);
1967 : /* s^2 + R = u0|u1. Rescale back:
1968 : * 2^(2k) n = S^2 + R
1969 : * so 2^(2k) n = (S - s0)^2 + (2*S*s0 - s0^2 + R), s0 = S mod 2^k. */
1970 275019 : if (sh) {
1971 247056 : int k = sh >> 1;
1972 247056 : ulong s0 = s & ((1L<<k) - 1);
1973 : LOCAL_HIREMAINDER;
1974 : LOCAL_OVERFLOW;
1975 247056 : r = addll(r, mulll(s, (s0<<1)));
1976 247056 : if (overflow) hiremainder++;
1977 247056 : hiremainder += hi; /* + 0 or 1 */
1978 247056 : s >>= k;
1979 247056 : r = (r>>sh) | (hiremainder << (BITS_IN_LONG-sh));
1980 247056 : hi = (hiremainder & (1L<<sh));
1981 : }
1982 275019 : S = utoi(s);
1983 275019 : if (pr) *pr = hi? uutoi(1,r): utoi(r);
1984 275019 : return S;
1985 : }
1986 :
1987 : /* Let N = N[0..2n-1]. Return S (and set R) s.t S^2 + R = N, 0 <= R <= 2S
1988 : * Assume N normalized */
1989 : static GEN
1990 325807527 : sqrtispec(GEN N, long n, GEN *r)
1991 : {
1992 : GEN S, R, q, z, u;
1993 : long l, h;
1994 :
1995 325807527 : if (n == 1) return sqrtispec2(N, r);
1996 234138504 : l = n >> 1;
1997 234138504 : h = n - l; /* N = a3(h) | a2(h) | a1(l) | a0(l words) */
1998 234138504 : S = sqrtispec(N, h, &R); /* S^2 + R = a3|a2 */
1999 :
2000 234138504 : z = catii(LIMBS(R), NLIMBS(R), N + 2*h, l); /* = R | a1(l) */
2001 234138504 : q = dvmdii(z, shifti(S,1), &u);
2002 234138504 : z = catii(LIMBS(u), NLIMBS(u), N + n + h, l); /* = u | a0(l) */
2003 :
2004 234138504 : S = addshiftw(S, q, l);
2005 234138504 : R = subii(z, sqri(q));
2006 234138504 : if (signe(R) < 0)
2007 : {
2008 40019331 : GEN S2 = shifti(S,1);
2009 40019331 : R = addis(subiispec(LIMBS(S2),LIMBS(R), NLIMBS(S2),NLIMBS(R)), -1);
2010 40019331 : S = addis(S, -1);
2011 : }
2012 234138504 : *r = R; return S;
2013 : }
2014 :
2015 : /* Return S (and set R) s.t S^2 + R = N, 0 <= R <= 2S.
2016 : * As for dvmdii, R is last on stack and guaranteed to be gen_0 in case the
2017 : * remainder is 0. R = NULL is allowed. */
2018 : GEN
2019 3761835 : sqrtremi(GEN N, GEN *r)
2020 : {
2021 : pari_sp av;
2022 3761835 : GEN S, R, n = N+2;
2023 3761835 : long k, l2, ln = NLIMBS(N);
2024 : int sh;
2025 :
2026 3761835 : if (ln <= 2)
2027 : {
2028 2975307 : if (ln == 2) return sqrtispec2_sh(n, r);
2029 2700288 : if (ln == 1) return sqrtispec1_sh(n, r);
2030 555 : if (r) *r = gen_0;
2031 555 : return gen_0;
2032 : }
2033 786528 : av = avma;
2034 786528 : sh = bfffo(n[0]) >> 1;
2035 786528 : l2 = (ln + 1) >> 1;
2036 786528 : if (sh || (ln & 1)) { /* normalize n, so that n[0] >= 2^BIL / 4 */
2037 785835 : GEN s0, t = new_chunk(ln + 1);
2038 785835 : t[ln] = 0;
2039 785835 : if (sh)
2040 783987 : shift_left(t, n, 0,ln-1, 0, sh << 1);
2041 : else
2042 1848 : xmpn_copy(t, n, ln);
2043 785835 : S = sqrtispec(t, l2, &R); /* t normalized, 2 * l2 words */
2044 : /* Rescale back:
2045 : * 2^(2k) n = S^2 + R, k = sh + (ln & 1)*BIL/2
2046 : * so 2^(2k) n = (S - s0)^2 + (2*S*s0 - s0^2 + R), s0 = S mod 2^k. */
2047 785835 : k = sh + (ln & 1) * (BITS_IN_LONG/2);
2048 785835 : s0 = remi2n(S, k);
2049 785835 : R = addii(shifti(R,-1), mulii(s0, S));
2050 785835 : R = shifti(R, 1 - (k<<1));
2051 785835 : S = shifti(S, -k);
2052 : }
2053 : else
2054 693 : S = sqrtispec(n, l2, &R);
2055 :
2056 786528 : if (!r) { set_avma((pari_sp)S); return gerepileuptoint(av, S); }
2057 722787 : *r = R; return gc_all(av, 2, &S, r);
2058 : }
2059 :
/* compute sqrt(|x|), assuming x != 0 */
2061 :
2062 : #if 1
2063 : GEN
2064 90882495 : sqrtr_abs(GEN x)
2065 : {
2066 90882495 : long l = lg(x) - 2, e = expo(x), er = e>>1;
2067 90882495 : GEN b, c, res = cgetg(2 + l, t_REAL);
2068 90882495 : res[1] = evalsigne(1) | evalexpo(er);
2069 90882495 : if (e&1) {
2070 40569996 : b = new_chunk(l << 1);
2071 40569996 : xmpn_copy(b, x+2, l);
2072 40569996 : xmpn_zero(b + l,l);
2073 40569996 : b = sqrtispec(b, l, &c);
2074 40569996 : xmpn_copy(res+2, b+2, l);
2075 40569996 : if (cmpii(c, b) > 0) roundr_up_ip(res, l+2);
2076 : } else {
2077 : ulong u;
2078 50312499 : b = new_chunk(2 + (l << 1));
2079 50312499 : shift_left(b+1, x+2, 0,l-1, 0, BITS_IN_LONG-1);
2080 50312499 : b[0] = uel(x,2)>>1;
2081 50312499 : xmpn_zero(b + l+1,l+1);
2082 50312499 : b = sqrtispec(b, l+1, &c);
2083 50312499 : xmpn_copy(res+2, b+2, l);
2084 50312499 : u = uel(b,l+2);
2085 50312499 : if ( u&HIGHBIT || (u == ~HIGHBIT && cmpii(c,b) > 0))
2086 24820974 : roundr_up_ip(res, l+2);
2087 : }
2088 90882495 : return gc_const((pari_sp)res, res);
2089 : }
2090 :
2091 : #else /* use t_REAL: currently much slower (quadratic division) */
2092 :
2093 : #ifdef LONG_IS_64BIT
2094 : /* 64 bits of b = sqrt(a[0] * 2^64 + a[1]) [ up to 1ulp ] */
2095 : static ulong
2096 : sqrtu2(ulong *a)
2097 : {
2098 : ulong c, b = dblmantissa( sqrt((double)a[0]) );
2099 : LOCAL_HIREMAINDER;
2100 : LOCAL_OVERFLOW;
2101 :
2102 : /* > 32 correct bits, 1 Newton iteration to reach 64 */
2103 : if (b <= a[0]) return HIGHBIT | (a[0] >> 1);
2104 : hiremainder = a[0]; c = divll(a[1], b);
2105 : return (addll(c, b) >> 1) | HIGHBIT;
2106 : }
2107 : /* 64 bits of sqrt(a[0] * 2^63) */
2108 : static ulong
2109 : sqrtu2_1(ulong *a)
2110 : {
2111 : ulong t[2];
2112 : t[0] = (a[0] >> 1);
2113 : t[1] = (a[0] << (BITS_IN_LONG-1)) | (a[1] >> 1);
2114 : return sqrtu2(t);
2115 : }
2116 : #else
2117 : /* 32 bits of sqrt(a[0] * 2^32) */
2118 : static ulong
2119 : sqrtu2(ulong *a) { return dblmantissa( sqrt((double)a[0]) ); }
2120 : /* 32 bits of sqrt(a[0] * 2^31) */
2121 : static ulong
2122 : sqrtu2_1(ulong *a) { return dblmantissa( sqrt(2. * a[0]) ); }
2123 : #endif
2124 :
2125 : GEN
2126 : sqrtr_abs(GEN x)
2127 : {
2128 : long l1, i, l = lg(x), ex = expo(x);
2129 : GEN a, t, y = cgetg(l, t_REAL);
2130 : pari_sp av, av0 = avma;
2131 :
2132 : a = rtor(x, lg2prec(l+1));
2133 : t = cgetg(l+1, t_REAL);
2134 : if (ex & 1) { /* odd exponent */
2135 : a[1] = evalsigne(1) | _evalexpo(1);
2136 : t[2] = (long)sqrtu2((ulong*)a + 2);
2137 : } else { /* even exponent */
2138 : a[1] = evalsigne(1) | _evalexpo(0);
2139 : t[2] = (long)sqrtu2_1((ulong*)a + 2);
2140 : }
2141 : t[1] = evalsigne(1) | _evalexpo(0);
2142 : for (i = 3; i <= l; i++) t[i] = 0;
2143 :
2144 : /* |x| = 2^(ex/2) a, t ~ sqrt(a) */
2145 : l--; l1 = 1; av = avma;
2146 : while (l1 < l) { /* let t := (t + a/t)/2 */
2147 : l1 <<= 1; if (l1 > l) l1 = l;
2148 : setlg(a, l1 + 2);
2149 : setlg(t, l1 + 2);
2150 : affrr(addrr(t, divrr(a,t)), t); shiftr_inplace(t, -1);
2151 : set_avma(av);
2152 : }
2153 : affrr(t,y); shiftr_inplace(y, (ex>>1));
2154 : return gc_const(av0, y);
2155 : }
2156 :
2157 : #endif
2158 :
2159 : /*******************************************************************
2160 : * *
2161 : * Base Conversion *
2162 : * *
2163 : *******************************************************************/
2164 :
2165 : static void
2166 733710 : convi_dac(GEN x, ulong l, ulong *res)
2167 : {
2168 733710 : pari_sp ltop=avma;
2169 : ulong m;
2170 : GEN x1,x2;
2171 733710 : if (l==1) { *res=itou(x); return; }
2172 348000 : m=l>>1;
2173 348000 : x1=dvmdii(x,powuu(1000000000UL,m),&x2);
2174 348000 : convi_dac(x1,l-m,res+m);
2175 348000 : convi_dac(x2,m,res);
2176 348000 : set_avma(ltop);
2177 : }
2178 :
2179 : /* convert integer --> base 10^9 [not memory clean] */
2180 : ulong *
2181 315896 : convi(GEN x, long *l)
2182 : {
2183 315896 : long lz, lx = lgefint(x);
2184 : ulong *z;
2185 315896 : if (lx == 3 && uel(x,2) < 1000000000UL) {
2186 278186 : z = (ulong*)new_chunk(1);
2187 278186 : *z = x[2];
2188 278186 : *l = 1; return z+1;
2189 : }
2190 37710 : lz = 1 + (long)bit_accuracy_mul(lx, LOG10_2/9);
2191 37710 : z = (ulong*)new_chunk(lz);
2192 37710 : convi_dac(x,(ulong)lz,z);
2193 67716 : while (z[lz-1]==0) lz--;
2194 37710 : *l=lz; return z+lz;
2195 : }
2196 :
|