Line data Source code
1 : /* Copyright (C) 2000 The PARI group.
2 :
3 : This file is part of the PARI/GP package.
4 :
5 : PARI/GP is free software; you can redistribute it and/or modify it under the
6 : terms of the GNU General Public License as published by the Free Software
7 : Foundation; either version 2 of the License, or (at your option) any later
8 : version. It is distributed in the hope that it will be useful, but WITHOUT
9 : ANY WARRANTY WHATSOEVER.
10 :
11 : Check the License for details. You should have received a copy of it, along
12 : with the package; see the file 'COPYING'. If not, write to the Free Software
13 : Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. */
14 : #include "pari.h"
15 : #include "paripriv.h"
16 :
17 : #define DEBUGLEVEL DEBUGLEVEL_factorint
18 :
19 : /***********************************************************************/
20 : /** PRIMES IN SUCCESSION **/
21 : /***********************************************************************/
22 :
23 : /* map from prime residue classes mod 210 to their numbers in {0...47}.
24 : * Subscripts into this array take the form ((k-1)%210)/2, ranging from
25 : * 0 to 104. Unused entries are */
26 : #define NPRC 128 /* nonprime residue class */
27 :
28 : static unsigned char prc210_no[] = {
29 : 0, NPRC, NPRC, NPRC, NPRC, 1, 2, NPRC, 3, 4, NPRC, /* 21 */
30 : 5, NPRC, NPRC, 6, 7, NPRC, NPRC, 8, NPRC, 9, /* 41 */
31 : 10, NPRC, 11, NPRC, NPRC, 12, NPRC, NPRC, 13, 14, NPRC, /* 63 */
32 : NPRC, 15, NPRC, 16, 17, NPRC, NPRC, 18, NPRC, 19, /* 83 */
33 : NPRC, NPRC, 20, NPRC, NPRC, NPRC, 21, NPRC, 22, 23, NPRC, /* 105 */
34 : 24, 25, NPRC, 26, NPRC, NPRC, NPRC, 27, NPRC, NPRC, /* 125 */
35 : 28, NPRC, 29, NPRC, NPRC, 30, 31, NPRC, 32, NPRC, NPRC, /* 147 */
36 : 33, 34, NPRC, NPRC, 35, NPRC, NPRC, 36, NPRC, 37, /* 167 */
37 : 38, NPRC, 39, NPRC, NPRC, 40, 41, NPRC, NPRC, 42, NPRC, /* 189 */
38 : 43, 44, NPRC, 45, 46, NPRC, NPRC, NPRC, NPRC, 47, /* 209 */
39 : };
40 :
41 : /* first differences of the preceding */
42 : static unsigned char prc210_d1[] = {
43 : 10, 2, 4, 2, 4, 6, 2, 6, 4, 2, 4, 6, 6, 2, 6, 4, 2, 6,
44 : 4, 6, 8, 4, 2, 4, 2, 4, 8, 6, 4, 6, 2, 4, 6,
45 : 2, 6, 6, 4, 2, 4, 6, 2, 6, 4, 2, 4, 2, 10, 2,
46 : };
47 :
48 : static int
49 999630 : unextprime_overflow(ulong n)
50 : {
51 : #ifdef LONG_IS_64BIT
52 999044 : return (n > (ulong)-59);
53 : #else
54 586 : return (n > (ulong)-5);
55 : #endif
56 : }
57 :
58 : /* return 0 for overflow */
59 : ulong
60 1138406 : unextprime(ulong n)
61 : {
62 : long rc, rc0, rcn;
63 :
64 1138406 : switch(n) {
65 7548 : case 0: case 1: case 2: return 2;
66 2722 : case 3: return 3;
67 2061 : case 4: case 5: return 5;
68 1225 : case 6: case 7: return 7;
69 : }
70 1124850 : if (n <= maxprime())
71 : {
72 125201 : long i = PRIMES_search(n);
73 125201 : return i > 0? n: pari_PRIMES[-i];
74 : }
75 999635 : if (unextprime_overflow(n)) return 0;
76 : /* here n > 7 */
77 999597 : n |= 1; /* make it odd */
78 999597 : rc = rc0 = n % 210;
79 : /* find next prime residue class mod 210 */
80 : for(;;)
81 : {
82 2200432 : rcn = (long)(prc210_no[rc>>1]);
83 2200432 : if (rcn != NPRC) break;
84 1200835 : rc += 2; /* cannot wrap since 209 is coprime and rc odd */
85 : }
86 999597 : if (rc > rc0) n += rc - rc0;
87 : /* now find an actual (pseudo)prime */
88 : for(;;)
89 : {
90 11719451 : if (uisprime(n)) break;
91 10719854 : n += prc210_d1[rcn];
92 10719854 : if (++rcn > 47) rcn = 0;
93 : }
94 999621 : return n;
95 : }
96 :
97 : GEN
98 130788 : nextprime(GEN n)
99 : {
100 : long rc, rc0, rcn;
101 130788 : pari_sp av = avma;
102 :
103 130788 : if (typ(n) != t_INT)
104 : {
105 14 : n = gceil(n);
106 14 : if (typ(n) != t_INT) pari_err_TYPE("nextprime",n);
107 : }
108 130781 : if (signe(n) <= 0) { set_avma(av); return gen_2; }
109 130781 : if (lgefint(n) == 3)
110 : {
111 118710 : ulong k = unextprime(uel(n,2));
112 118710 : set_avma(av);
113 118710 : if (k) return utoipos(k);
114 : #ifdef LONG_IS_64BIT
115 6 : return uutoi(1,13);
116 : #else
117 1 : return uutoi(1,15);
118 : #endif
119 : }
120 : /* here n > 7 */
121 12071 : if (!mod2(n)) n = addui(1,n);
122 12071 : rc = rc0 = umodiu(n, 210);
123 : /* find next prime residue class mod 210 */
124 : for(;;)
125 : {
126 26282 : rcn = (long)(prc210_no[rc>>1]);
127 26282 : if (rcn != NPRC) break;
128 14211 : rc += 2; /* cannot wrap since 209 is coprime and rc odd */
129 : }
130 12071 : if (rc > rc0) n = addui(rc - rc0, n);
131 : /* now find an actual (pseudo)prime */
132 : for(;;)
133 : {
134 110248 : if (BPSW_psp(n)) break;
135 98177 : n = addui(prc210_d1[rcn], n);
136 98177 : if (++rcn > 47) rcn = 0;
137 : }
138 12071 : if (avma == av) return icopy(n);
139 12071 : return gc_INT(av, n);
140 : }
141 :
142 : ulong
143 38 : uprecprime(ulong n)
144 : {
145 : long rc, rc0, rcn;
146 : { /* check if n <= 10 */
147 38 : if (n <= 1) return 0;
148 31 : if (n == 2) return 2;
149 24 : if (n <= 4) return 3;
150 24 : if (n <= 6) return 5;
151 24 : if (n <= 10) return 7;
152 : }
153 24 : if (n <= maxprimelim())
154 : {
155 0 : long i = PRIMES_search(n);
156 0 : return i > 0? n: pari_PRIMES[-i-1];
157 : }
158 : /* here n >= 11 */
159 24 : if (!(n % 2)) n--;
160 24 : rc = rc0 = n % 210;
161 : /* find previous prime residue class mod 210 */
162 : for(;;)
163 : {
164 48 : rcn = (long)(prc210_no[rc>>1]);
165 48 : if (rcn != NPRC) break;
166 24 : rc -= 2; /* cannot wrap since 1 is coprime and rc odd */
167 : }
168 24 : if (rc < rc0) n += rc - rc0;
169 : /* now find an actual (pseudo)prime */
170 : for(;;)
171 : {
172 48 : if (uisprime(n)) break;
173 24 : if (--rcn < 0) rcn = 47;
174 24 : n -= prc210_d1[rcn];
175 : }
176 24 : return n;
177 : }
178 :
179 : GEN
180 56 : precprime(GEN n)
181 : {
182 : long rc, rc0, rcn;
183 56 : pari_sp av = avma;
184 :
185 56 : if (typ(n) != t_INT)
186 : {
187 14 : n = gfloor(n);
188 14 : if (typ(n) != t_INT) pari_err_TYPE("nextprime",n);
189 : }
190 49 : if (signe(n) <= 0) { set_avma(av); return gen_0; }
191 49 : if (lgefint(n) <= 3)
192 : {
193 38 : ulong k = uel(n,2);
194 38 : return gc_utoi(av, uprecprime(k));
195 : }
196 11 : if (!mod2(n)) n = subiu(n,1);
197 11 : rc = rc0 = umodiu(n, 210);
198 : /* find previous prime residue class mod 210 */
199 : for(;;)
200 : {
201 22 : rcn = (long)(prc210_no[rc>>1]);
202 22 : if (rcn != NPRC) break;
203 11 : rc -= 2; /* cannot wrap since 1 is coprime and rc odd */
204 : }
205 11 : if (rc0 > rc) n = subiu(n, rc0 - rc);
206 : /* now find an actual (pseudo)prime */
207 : for(;;)
208 : {
209 50 : if (BPSW_psp(n)) break;
210 39 : if (--rcn < 0) rcn = 47;
211 39 : n = subiu(n, prc210_d1[rcn]);
212 : }
213 11 : if (avma == av) return icopy(n);
214 11 : return gc_INT(av, n);
215 : }
216 :
217 : /* Find next single-word prime strictly larger than p.
218 : * If *n < pari_PRIMES[0], p is *n-th prime, otherwise imitate nextprime().
219 : * *rcn = NPRC or the correct residue class for the current p; we'll use this
220 : * to track the current prime residue class mod 210 once we're out of range of
221 : * the prime table, and we'll update it before that if it isn't NPRC.
222 : *
223 : * *q is incremented whenever q!=NULL and we wrap from 209 mod 210 to
224 : * 1 mod 210 */
225 : static ulong
226 4531317 : snextpr(ulong p, long *n, long *rcn, long *q, int (*ispsp)(ulong))
227 : {
228 4531317 : if (*n < pari_PRIMES[0])
229 : {
230 4531317 : ulong t, p1 = t = pari_PRIMES[++*n]; /* nextprime(p + 1) */
231 4531317 : if (*rcn != NPRC)
232 : {
233 15888894 : while (t > p)
234 : {
235 11373946 : t -= prc210_d1[*rcn];
236 11373946 : if (++*rcn > 47) { *rcn = 0; if (q) (*q)++; }
237 : }
238 : /* assert(d1 == p) */
239 : }
240 4531317 : return p1;
241 : }
242 0 : if (unextprime_overflow(p)) pari_err_OVERFLOW("snextpr");
243 : /* we are beyond the prime table, initialize if needed */
244 0 : if (*rcn == NPRC) *rcn = prc210_no[(p % 210) >> 1]; /* != NPRC */
245 : /* look for the next one */
246 : do {
247 0 : p += prc210_d1[*rcn];
248 0 : if (++*rcn > 47) { *rcn = 0; if (q) (*q)++; }
249 0 : } while (!ispsp(p));
250 0 : return p;
251 : }
252 :
253 : /********************************************************************/
254 : /** **/
255 : /** INTEGER FACTORIZATION **/
256 : /** **/
257 : /********************************************************************/
258 : int factor_add_primes = 0, factor_proven = 0;
259 :
260 : /***********************************************************************/
261 : /** **/
262 : /** FACTORIZATION (ECM) -- GN Jul-Aug 1998 **/
263 : /** Integer factorization using the elliptic curves method (ECM). **/
264 : /** ellfacteur() returns a non trivial factor of N, assuming N>0, **/
265 : /** is composite, and has no prime divisor below tridiv_bound(N) **/
266 : /** Thanks to Paul Zimmermann for much helpful advice and to **/
267 : /** Guillaume Hanrot and Igor Schein for intensive testing **/
268 : /** **/
269 : /***********************************************************************/
270 : #define nbcmax 64 /* max number of simultaneous curves */
271 :
272 : static const ulong TB1[] = {
273 : 142,172,208,252,305,370,450,545,661,801,972,1180,1430,
274 : 1735,2100,2550,3090,3745,4540,5505,6675,8090,9810,11900,
275 : 14420,17490,21200,25700,31160,37780UL,45810UL,55550UL,67350UL,
276 : 81660UL,99010UL,120050UL,145550UL,176475UL,213970UL,259430UL,
277 : 314550UL,381380UL,462415UL,560660UL,679780UL,824220UL,999340UL,
278 : 1211670UL,1469110UL,1781250UL,2159700UL,2618600UL,3175000UL,
279 : 3849600UL,4667500UL,5659200UL,6861600UL,8319500UL,10087100UL,
280 : 12230300UL,14828900UL,17979600UL,21799700UL,26431500UL,
281 : 32047300UL,38856400UL, /* 110 times that still fits into 32bits */
282 : #ifdef LONG_IS_64BIT
283 : 47112200UL,57122100UL,69258800UL,83974200UL,101816200UL,
284 : 123449000UL,149678200UL,181480300UL,220039400UL,266791100UL,
285 : 323476100UL,392204900UL,475536500UL,576573500UL,699077800UL,
286 : 847610500UL,1027701900UL,1246057200UL,1510806400UL,1831806700UL,
287 : 2221009800UL,2692906700UL,3265067200UL,3958794400UL,4799917500UL
288 : #endif
289 : };
290 : static const ulong TB1_for_stage[] = {
291 : /* Start below the optimal B1 for finding factors which would just have been
292 : * missed by pollardbrent(), and escalate, changing curves to give good
293 : * coverage of the small factor ranges. Entries grow faster than what would
294 : * be optimal but a table instead of a 2D array keeps the code simple */
295 : 500,520,560,620,700,800,900,1000,1150,1300,1450,1600,1800,2000,
296 : 2200,2450,2700,2950,3250,3600,4000,4400,4850,5300,5800,6400,
297 : 7100,7850,8700,9600,10600,11700,12900,14200,15700,17300,
298 : 19000,21000,23200,25500,28000,31000,34500UL,38500UL,43000UL,
299 : 48000UL,53800UL,60400UL,67750UL,76000UL,85300UL,95700UL,
300 : 107400UL,120500UL,135400UL,152000UL,170800UL,191800UL,215400UL,
301 : 241800UL,271400UL,304500UL,341500UL,383100UL,429700UL,481900UL,
302 : 540400UL,606000UL,679500UL,761800UL,854100UL,957500UL,1073500UL
303 : };
304 :
305 : /* addition/doubling/multiplication of a point on an 'elliptic curve mod N'
306 : * may result in one of three things:
307 : * - a new bona fide point
308 : * - a point at infinity (denominator divisible by N)
309 : * - a point at infinity mod some p | N but finite mod q | N betraying itself
310 : * by a denominator which has nontrivial gcd with N.
311 : *
312 : * In the second case, addition/doubling aborts, copying one of the summands
313 : * to the destination array of points unless they coincide.
314 : * Multiplication will stop at some unpredictable intermediate stage: The
315 : * destination will contain _some_ multiple of the input point, but not
316 : * necessarily the desired one, which doesn't matter. As long as we're
317 : * multiplying (B1 phase) we simply carry on with the next multiplier.
318 : * During the B2 phase, the only additions are the giant steps, and the
319 : * worst that can happen here is that we lose one residue class mod 210
320 : * of prime multipliers on 4 of the curves, so again, we ignore the problem
321 : * and just carry on.)
322 : *
323 : * Idea: select nbc curves mod N and one point P on each of them. For each
324 : * such P, compute [M]P = Q where M is the product of all powers <= B2 of
325 : * primes <= nextprime(B1). Then check whether [p]Q for p < nextprime(B2)
326 : * betrays a factor. This second stage looks separately at the primes in
327 : * each residue class mod 210, four curves at a time, and steps additively
328 : * to ever larger multipliers, by comparing X coordinates of points which we
329 : * would need to add in order to reach another prime multiplier in the same
330 : * residue class. 'Comparing' means that we accumulate a product of
331 : * differences of X coordinates, and from time to time take a gcd of this
332 : * product with N. Montgomery's multi-inverse trick is used heavily. */
333 :
334 : /* *** auxiliary functions for ellfacteur: *** */
335 : /* (Rx,Ry) <- (Px,Py)+(Qx,Qy) over Z/NZ, z=1/(Px-Qx). If Ry = NULL, don't set */
336 : static void
337 8291496 : FpE_add_i(GEN N, GEN z, GEN Px, GEN Py, GEN Qx, GEN Qy, GEN *Rx, GEN *Ry)
338 : {
339 8291496 : GEN slope = modii(mulii(subii(Py, Qy), z), N);
340 8291496 : GEN t = subii(sqri(slope), addii(Qx, Px));
341 8291496 : affii(modii(t, N), *Rx);
342 8291496 : if (Ry) {
343 8219188 : t = subii(mulii(slope, subii(Px, *Rx)), Py);
344 8219188 : affii(modii(t, N), *Ry);
345 : }
346 8291496 : }
347 : /* X -> Z; cannot add on one of the curves: make sure Z contains
348 : * something useful before letting caller proceed */
349 : static void
350 25650 : ZV_aff(long n, GEN *X, GEN *Z)
351 : {
352 25650 : if (X != Z) {
353 : long k;
354 1569330 : for (k = n; k--; ) affii(X[k],Z[k]);
355 : }
356 25650 : }
357 :
358 : /* Parallel addition on nbc curves, assigning the result to locations at and
359 : * following *X3, *Y3. (If Y-coords of result not desired, set Y=NULL.)
360 : * Safe even if (X3,Y3) = (X2,Y2), _not_ if (X1,Y1). It is also safe to
361 : * overwrite Y2 with X3. If nbc1 < nbc, the first summand is
362 : * assumed to hold only nbc1 distinct points, repeated as often as we need
363 : * them (to add one point on each of a few curves to several other points on
364 : * the same curves): only used with nbc1 = nbc or nbc1 = 4 | nbc.
365 : *
366 : * Return 0 [SUCCESS], 1 [N | den], 2 [gcd(den, N) is a factor of N, preserved
367 : * in gl.
368 : * Stack space is bounded by a constant multiple of lgefint(N)*nbc:
369 : * - Phase 2 creates 12 items on the stack per iteration, of which 4 are twice
370 : * as long and 1 is thrice as long as N, i.e. 18 units per iteration.
371 : * - Phase 1 creates 4 units.
372 : * Total can be as large as 4*nbcmax + 18*8 units; ecm_elladd2() is
373 : * just as bad, and elldouble() comes to 3*nbcmax + 29*8 units. */
374 : static int
375 240431 : ecm_elladd0(GEN N, GEN *gl, long nbc, long nbc1,
376 : GEN *X1, GEN *Y1, GEN *X2, GEN *Y2, GEN *X3, GEN *Y3)
377 : {
378 240431 : const ulong mask = (nbc1 == 4)? 3: ~0UL; /*nbc1 = 4 or nbc*/
379 240431 : GEN W[2*nbcmax], *A = W+nbc; /* W[0],A[0] unused */
380 : long i;
381 240431 : pari_sp av = avma;
382 :
383 240431 : W[1] = subii(X1[0], X2[0]);
384 7825896 : for (i=1; i<nbc; i++)
385 : { /*prepare for multi-inverse*/
386 7585465 : A[i] = subii(X1[i&mask], X2[i]); /* don't waste time reducing mod N */
387 7585465 : W[i+1] = modii(mulii(A[i], W[i]), N);
388 : }
389 240431 : if (!invmod(W[nbc], N, gl))
390 : {
391 18 : if (!equalii(N,*gl)) return 2;
392 0 : ZV_aff(nbc, X2,X3);
393 0 : if (Y3) ZV_aff(nbc, Y2,Y3);
394 0 : return gc_int(av,1);
395 : }
396 :
397 7825032 : while (i--) /* nbc times */
398 : {
399 7825032 : pari_sp av2 = avma;
400 7825032 : GEN Px = X1[i&mask], Py = Y1[i&mask], Qx = X2[i], Qy = Y2[i];
401 7825032 : GEN z = i? mulii(*gl,W[i]): *gl; /*1/(Px-Qx)*/
402 7825032 : FpE_add_i(N,z, Px,Py,Qx,Qy, X3+i, Y3? Y3+i: NULL);
403 7825032 : if (!i) break;
404 7584619 : set_avma(av2); *gl = modii(mulii(*gl, A[i]), N);
405 : }
406 240413 : return gc_int(av,0);
407 : }
408 :
409 : /* Shortcut, for use in cases where Y coordinates follow their corresponding
410 : * X coordinates, and first summand doesn't need to be repeated */
411 : static int
412 234487 : ecm_elladd(GEN N, GEN *gl, long nbc, GEN *X1, GEN *X2, GEN *X3) {
413 234487 : return ecm_elladd0(N, gl, nbc, nbc, X1, X1+nbc, X2, X2+nbc, X3, X3+nbc);
414 : }
415 :
416 : /* As ecm_elladd except it does twice as many additions (and hides even more
417 : * of the cost of the modular inverse); the net effect is the same as
418 : * ecm_elladd(nbc,X1,X2,X3) && ecm_elladd(nbc,X4,X5,X6). Safe to
419 : * have X2=X3, X5=X6, or X1,X2 coincide with X4,X5 in any order. */
420 : static int
421 7194 : ecm_elladd2(GEN N, GEN *gl, long nbc,
422 : GEN *X1, GEN *X2, GEN *X3, GEN *X4, GEN *X5, GEN *X6)
423 : {
424 7194 : GEN *Y1 = X1+nbc, *Y2 = X2+nbc, *Y3 = X3+nbc;
425 7194 : GEN *Y4 = X4+nbc, *Y5 = X5+nbc, *Y6 = X6+nbc;
426 7194 : GEN W[4*nbcmax], *A = W+2*nbc; /* W[0],A[0] unused */
427 : long i, j;
428 7194 : pari_sp av = avma;
429 :
430 7194 : W[1] = subii(X1[0], X2[0]);
431 233232 : for (i=1; i<nbc; i++)
432 : {
433 226038 : A[i] = subii(X1[i], X2[i]); /* don't waste time reducing mod N here */
434 226038 : W[i+1] = modii(mulii(A[i], W[i]), N);
435 : }
436 240426 : for (j=0; j<nbc; i++,j++)
437 : {
438 233232 : A[i] = subii(X4[j], X5[j]);
439 233232 : W[i+1] = modii(mulii(A[i], W[i]), N);
440 : }
441 7194 : if (!invmod(W[2*nbc], N, gl))
442 : {
443 0 : if (!equalii(N,*gl)) return 2;
444 0 : ZV_aff(2*nbc, X2,X3); /* hack: 2*nbc => copy Y2->Y3 */
445 0 : ZV_aff(2*nbc, X5,X6); /* also copy Y5->Y6 */
446 0 : return gc_int(av,1);
447 : }
448 :
449 240426 : while (j--) /* nbc times */
450 : {
451 233232 : pari_sp av2 = avma;
452 233232 : GEN Px = X4[j], Py = Y4[j], Qx = X5[j], Qy = Y5[j];
453 233232 : GEN z = mulii(*gl,W[--i]); /*1/(Px-Qx)*/
454 233232 : FpE_add_i(N,z, Px,Py, Qx,Qy, X6+j,Y6+j);
455 233232 : set_avma(av2); *gl = modii(mulii(*gl, A[i]), N);
456 : }
457 233232 : while (i--) /* nbc times */
458 : {
459 233232 : pari_sp av2 = avma;
460 233232 : GEN Px = X1[i], Py = Y1[i], Qx = X2[i], Qy = Y2[i];
461 233232 : GEN z = i? mulii(*gl, W[i]): *gl; /*1/(Px-Qx)*/
462 233232 : FpE_add_i(N,z, Px,Py, Qx,Qy, X3+i,Y3+i);
463 233232 : if (!i) break;
464 226038 : set_avma(av2); *gl = modii(mulii(*gl, A[i]), N);
465 : }
466 7194 : return gc_int(av,0);
467 : }
468 :
469 : /* Parallel doubling on nbc curves, assigning the result to locations at
470 : * and following *X2. Safe to be called with X2 equal to X1. Return
471 : * value as for ecm_elladd. If we find a point at infinity mod N,
472 : * and if X1 != X2, we copy the points at X1 to X2. */
473 : static int
474 40073 : elldouble(GEN N, GEN *gl, long nbc, GEN *X1, GEN *X2)
475 : {
476 40073 : GEN *Y1 = X1+nbc, *Y2 = X2+nbc;
477 : GEN W[nbcmax+1]; /* W[0] unused */
478 : long i;
479 40073 : pari_sp av = avma;
480 40073 : /*W[0] = gen_1;*/ W[1] = Y1[0];
481 1233544 : for (i=1; i<nbc; i++) W[i+1] = modii(mulii(Y1[i], W[i]), N);
482 40073 : if (!invmod(W[nbc], N, gl))
483 : {
484 0 : if (!equalii(N,*gl)) return 2;
485 0 : ZV_aff(2*nbc,X1,X2); /* also copies Y1->Y2 */
486 0 : return gc_int(av,1);
487 : }
488 1273617 : while (i--) /* nbc times */
489 : {
490 : pari_sp av2;
491 1233544 : GEN v, w, L, z = i? mulii(*gl,W[i]): *gl;
492 1233544 : if (i) *gl = modii(mulii(*gl, Y1[i]), N);
493 1233544 : av2 = avma;
494 1233544 : L = modii(mulii(addui(1, mului(3, Fp_sqr(X1[i],N))), z), N);
495 1233544 : if (signe(L)) /* half of zero is still zero */
496 1233544 : L = shifti(mod2(L)? addii(L, N): L, -1);
497 1233544 : v = modii(subii(sqri(L), shifti(X1[i],1)), N);
498 1233544 : w = modii(subii(mulii(L, subii(X1[i], v)), Y1[i]), N);
499 1233544 : affii(v, X2[i]);
500 1233544 : affii(w, Y2[i]);
501 1233544 : set_avma(av2);
502 : }
503 40073 : return gc_int(av,0);
504 : }
505 :
506 : /* Parallel multiplication by an odd prime k on nbc curves, storing the
507 : * result to locations at and following *X2. Safe to be called with X2 = X1.
508 : * Return values as ecm_elladd. Uses (a simplified variant of) Montgomery's
509 : * PRAC algorithm; see ftp://ftp.cwi.nl/pub/pmontgom/Lucas.ps.gz .
510 : * With thanks to Paul Zimmermann for the reference. --GN1998Aug13 */
511 : static int
512 208727 : get_rule(ulong d, ulong e)
513 : {
514 208727 : if (d <= e + (e>>2)) /* floor(1.25*e) */
515 : {
516 16630 : if ((d+e)%3 == 0) return 0; /* rule 1 */
517 9928 : if ((d-e)%6 == 0) return 1; /* rule 2 */
518 : }
519 : /* d <= 4*e but no ofl */
520 201971 : if ((d+3)>>2 <= e) return 2; /* rule 3, common case */
521 12148 : if ((d&1)==(e&1)) return 1; /* rule 4 = rule 2 */
522 6344 : if (!(d&1)) return 3; /* rule 5 */
523 1769 : if (d%3 == 0) return 4; /* rule 6 */
524 417 : if ((d+e)%3 == 0) return 5; /* rule 7 */
525 0 : if ((d-e)%3 == 0) return 6; /* rule 8 */
526 : /* when we get here, e is even, otherwise one of rules 4,5 would apply */
527 0 : return 7; /* rule 9 */
528 : }
529 :
530 : /* PRAC implementation notes - main changes against the paper version:
531 : * (1) The general function [m+n]P = f([m]P,[n]P,[m-n]P) collapses (for m!=n)
532 : * to an ecm_elladd() which does not depend on the third argument; thus
533 : * references to the third variable (C in the paper) can be eliminated.
534 : * (2) Since our multipliers are prime, the outer loop of the paper
535 : * version executes only once, and thus is invisible above.
536 : * (3) The first step in the inner loop of the paper version will always be
537 : * rule 3, but the addition requested by this rule amounts to a doubling, and
538 : * will always be followed by a swap, so we have unrolled this first iteration.
539 : * (4) Simplifications in rules 6 and 7 are possible given the above, and we
540 : * save one addition in each of the two cases. NB none of the other
541 : * ecm_elladd()s in the loop can ever degenerate into an elldouble.
542 : * (5) I tried to optimize for rule 3, which is used more frequently than all
543 : * others together, but it didn't improve things, so I removed the nested
544 : * tight loop again. --GN */
545 : /* The main loop body of ellfacteur() runs _slower_ under PRAC than under a
546 : * straightforward left-shift binary multiplication when N has <30 digits and
547 : * B1 is small; PRAC wins when N and B1 get larger. Weird. --GN */
548 : /* k>2 assumed prime, XAUX = scratchpad */
549 : static int
550 25650 : ellmult(GEN N, GEN *gl, long nbc, ulong k, GEN *X1, GEN *X2, GEN *XAUX)
551 : {
552 : ulong r, d, e, e1;
553 : int res;
554 25650 : GEN *A = X2, *B = XAUX, *T = XAUX + 2*nbc;
555 :
556 25650 : ZV_aff(2*nbc,X1,XAUX);
557 : /* first doubling picks up X1; after this we'll be working in XAUX and
558 : * X2 only, mostly via A and B and T */
559 25650 : if ((res = elldouble(N, gl, nbc, X1, X2)) != 0) return res;
560 :
561 : /* split the work at the golden ratio */
562 25650 : r = (ulong)(k*0.61803398875 + .5);
563 25650 : d = k - r;
564 25650 : e = r - d; /* d+e == r, so no danger of ofl below */
565 234377 : while (d != e)
566 : { /* apply one of the nine transformations from PM's Table 4. */
567 208727 : switch(get_rule(d,e))
568 : {
569 6702 : case 0: /* rule 1 */
570 6702 : if ( (res = ecm_elladd(N, gl, nbc, A, B, T)) ) return res;
571 6702 : if ( (res = ecm_elladd2(N, gl, nbc, T, A, A, T, B, B)) != 0) return res;
572 6702 : e1 = d - e; d = (d + e1)/3; e = (e - e1)/3; break;
573 5858 : case 1: /* rules 2 and 4 */
574 5858 : if ( (res = ecm_elladd(N, gl, nbc, A, B, B)) ) return res;
575 5858 : if ( (res = elldouble(N, gl, nbc, A, A)) ) return res;
576 5858 : d = (d-e)>>1; break;
577 4575 : case 3: /* rule 5 */
578 4575 : if ( (res = elldouble(N, gl, nbc, A, A)) ) return res;
579 4575 : d >>= 1; break;
580 1352 : case 4: /* rule 6 */
581 1352 : if ( (res = elldouble(N, gl, nbc, A, T)) ) return res;
582 1352 : if ( (res = ecm_elladd(N, gl, nbc, T, A, A)) ) return res;
583 1352 : if ( (res = ecm_elladd(N, gl, nbc, A, B, B)) ) return res;
584 1352 : d = d/3 - e; break;
585 189823 : case 2: /* rule 3 */
586 189823 : if ( (res = ecm_elladd(N, gl, nbc, A, B, B)) ) return res;
587 189823 : d -= e; break;
588 417 : case 5: /* rule 7 */
589 417 : if ( (res = elldouble(N, gl, nbc, A, T)) ) return res;
590 417 : if ( (res = ecm_elladd2(N, gl, nbc, T, A, A, T, B, B)) != 0) return res;
591 417 : d = (d - 2*e)/3; break;
592 0 : case 6: /* rule 8 */
593 0 : if ( (res = ecm_elladd(N, gl, nbc, A, B, B)) ) return res;
594 0 : if ( (res = elldouble(N, gl, nbc, A, T)) ) return res;
595 0 : if ( (res = ecm_elladd(N, gl, nbc, T, A, A)) ) return res;
596 0 : d = (d - e)/3; break;
597 0 : case 7: /* rule 9 */
598 0 : if ( (res = elldouble(N, gl, nbc, B, B)) ) return res;
599 0 : e >>= 1; break;
600 : }
601 : /* swap d <-> e and A <-> B if necessary */
602 208727 : if (d < e) { lswap(d,e); pswap(A,B); }
603 : }
604 25650 : return ecm_elladd(N, gl, nbc, XAUX, X2, X2);
605 : }
606 :
607 : struct ECM {
608 : pari_timer T;
609 : long nbc, nbc2, seed;
610 : GEN *X, *XAUX, *XT, *XD, *XB, *XB2, *XH, *Xh, *Yh;
611 : };
612 :
613 : /* memory layout in ellfacteur(): a large array of GEN pointers, and one
614 : * huge chunk of memory containing all the actual GEN (t_INT) objects.
615 : * nbc is constant throughout the invocation:
616 : * - The B1 stage of each iteration through the main loop needs little
617 : * space: enough for the X and Y coordinates of the current points,
618 : * and twice as much again as scratchpad for ellmult().
619 : * - The B2 stage, starting from some current set of points Q, needs, in
620 : * succession:
621 : * + space for [2]Q, [4]Q, ..., [10]Q, and [p]Q for building the helix;
622 : * + space for 48*nbc X and Y coordinates to hold the helix. This could
623 : * re-use [2]Q,...,[8]Q, but only with difficulty, since we don't
624 : * know in advance which residue class mod 210 our p is going to be in.
625 : * It can and should re-use [p]Q, though;
626 : * + space for (temporarily [30]Q and then) [210]Q, [420]Q, and several
627 : * further doublings until the giant step multiplier is reached. This
628 : * can re-use the remaining cells from above. The computation of [210]Q
629 : * will have been the last call to ellmult() within this iteration of the
630 : * main loop, so the scratchpad is now also free to be re-used. We also
631 : * compute [630]Q by a parallel addition; we'll need it later to get the
632 : * baby-step table bootstrapped a little faster.
633 : * + Finally, for no more than 4 curves at a time, room for up to 1024 X
634 : * coordinates only: the Y coordinates needed whilst setting up this baby
635 : * step table are temporarily stored in the upper half, and overwritten
636 : * during the last series of additions.
637 : *
638 : * Graphically: after end of B1 stage (X,Y are the coords of Q):
639 : * +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--
640 : * | X Y | scratch | [2]Q| [4]Q| [6]Q| [8]Q|[10]Q| ... | ...
641 : * +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--
642 : * *X *XAUX *XT *XD *XB
643 : *
644 : * [30]Q is computed from [10]Q. [210]Q can go into XY, etc:
645 : * +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--
646 : * |[210]|[420]|[630]|[840]|[1680,3360,6720,...,2048*210] |bstp table...
647 : * +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--
648 : * *X *XAUX *XT *XD [*XG, somewhere here] *XB .... *XH
649 : *
650 : * So we need (13 + 48) * 2 * nbc slots here + 4096 slots for the baby step
651 : * table (not all of which will be used when we start with a small B1, but
652 : * better to allocate and initialize ahead of time all the slots that might
653 : * be needed later).
654 : *
655 : * Note on memory locality: During the B2 phase, accesses to the helix
656 : * (once it is set up) will be clustered by curves (4 out of nbc at a time).
657 : * Accesses to the baby steps table will wander from one end of the array to
658 : * the other and back, one such cycle per giant step, and during a full cycle
659 : * we would expect on the order of 2E4 accesses when using the largest giant
660 : * step size. Thus we shouldn't be doing too bad with respect to thrashing
661 : * a 512KBy L2 cache. However, we don't want the baby step table to grow
662 : * larger than this, even if it would reduce the number of EC operations by a
663 : * few more per cent for very large B2, lest cache thrashing slow down
664 : * everything disproportionally. --GN */
665 : /* Auxiliary routines need < (3*nbc+240)*lN words on the PARI stack, in
666 : * addition to the spc*(lN+1) words occupied by our main table. */
667 : static void
668 57 : ECM_alloc(struct ECM *E, long lN)
669 : {
670 57 : const long bstpmax = 1024; /* max number of baby step table entries */
671 57 : long spc = (13 + 48) * E->nbc2 + bstpmax * 4;
672 57 : long len = spc + 385 + spc*lN;
673 57 : long i, tw = _evallg(lN) | evaltyp(t_INT);
674 57 : GEN w, *X = (GEN*)new_chunk(len);
675 : /* hack for X[i] = cgeti(lN). X = current point in B1 phase */
676 57 : w = (GEN)(X + spc + 385);
677 377001 : for (i = spc-1; i >= 0; i--) { X[i] = w; *w = tw; w += lN; }
678 57 : E->X = X;
679 57 : E->XAUX = E->X + E->nbc2; /* scratchpad for ellmult() */
680 57 : E->XT = E->XAUX + E->nbc2; /* ditto, will later hold [3*210]Q */
681 57 : E->XD = E->XT + E->nbc2; /* room for various multiples */
682 57 : E->XB = E->XD + 10*E->nbc2; /* start of baby steps table */
683 57 : E->XB2 = E->XB + 2 * bstpmax; /* middle of baby steps table */
684 57 : E->XH = E->XB2 + 2 * bstpmax; /* end of bstps table, start of helix */
685 57 : E->Xh = E->XH + 48*E->nbc2; /* little helix, X coords */
686 57 : E->Yh = E->XH + 192; /* ditto, Y coords */
687 : /* XG,YG set inside the main loop, since they depend on B2 */
688 : /* E.Xh range of 384 pointers not set; these will later duplicate the pointers
689 : * in the E.XH range, 4 curves at a time. Some of the cells reserved here for
690 : * the E.XB range will never be used, instead, we'll warp the pointers to
691 : * connect to (read-only) GENs in the X/E.XD range */
692 57 : }
693 : /* N.B. E->seed is not initialized here */
694 : static void
695 57 : ECM_init(struct ECM *E, GEN N, long nbc)
696 : {
697 57 : if (nbc < 0)
698 : { /* choose a sensible default */
699 57 : const long size = expi(N) + 1;
700 57 : nbc = ((size >> 3) << 2) - 80;
701 57 : if (nbc < 8) nbc = 8;
702 : }
703 57 : if (nbc > nbcmax) nbc = nbcmax;
704 57 : E->nbc = nbc;
705 57 : E->nbc2 = nbc << 1;
706 57 : ECM_alloc(E, lgefint(N));
707 57 : }
708 :
709 : static GEN
710 93 : ECM_loop(struct ECM *E, GEN N, ulong B1)
711 : {
712 93 : const ulong B2 = 110 * B1, B2_rt = usqrt(B2);
713 93 : const ulong nbc = E->nbc, nbc2 = E->nbc2;
714 : pari_sp av1, avtmp;
715 : long i, np, np0, gse, gss, bstp, bstp0, rcn0, rcn;
716 : ulong B2_p, m, p, p0;
717 : GEN g, *XG, *YG;
718 93 : GEN *X = E->X, *XAUX = E->XAUX, *XT = E->XT, *XD = E->XD;
719 93 : GEN *XB = E->XB, *XB2 = E->XB2, *XH = E->XH, *Xh = E->Xh, *Yh = E->Yh;
720 : /* pick curves */
721 4461 : for (i = nbc2; i--; ) affui(E->seed++, X[i]);
722 : /* pick giant step exponent and size */
723 93 : gse = B1 < 656
724 : ? (B1 < 200? 5: 6)
725 93 : : (B1 < 10500
726 : ? (B1 < 2625? 7: 8)
727 : : (B1 < 42000? 9: 10));
728 93 : gss = 1UL << gse;
729 : /* With 32 baby steps, a giant step corresponds to 32*420 = 13440,
730 : * appropriate for the smallest B2s. With 1024, a giant step will be 430080;
731 : * appropriate for B1 >~ 42000, where 512 baby steps would imply roughly
732 : * the same number of curve additions. */
733 93 : XG = XT + gse*nbc2; /* will later hold [2^(gse+1)*210]Q */
734 93 : YG = XG + nbc;
735 :
736 93 : if (DEBUGLEVEL >= 4) {
737 0 : err_printf("ECM: time = %6ld ms\nECM: B1 = %4lu,", timer_delay(&E->T), B1);
738 0 : err_printf("\tB2 = %6lu,\tgss = %4ld*420\n", B2, gss);
739 : }
740 93 : p = 2; np = 1; /* p is np-th prime */
741 :
742 : /* ---B1 PHASE--- */
743 : /* treat p=2 separately */
744 93 : B2_p = B2 >> 1;
745 1603 : for (m=1; m<=B2_p; m<<=1)
746 : {
747 1510 : int fl = elldouble(N, &g, nbc, X, X);
748 1510 : if (fl > 1) return g; else if (fl) break;
749 : }
750 93 : rcn = NPRC; /* multipliers begin at the beginning */
751 : /* p=3,...,nextprime(B1) */
752 6538 : while (p < B1 && p <= B2_rt)
753 : {
754 6445 : pari_sp av2 = avma;
755 6445 : p = snextpr(p, &np, &rcn, NULL, uisprime);
756 6445 : B2_p = B2/p; /* beware integer overflow on 32-bit CPUs */
757 22021 : for (m=1; m<=B2_p; m*=p)
758 : {
759 15576 : int fl = ellmult(N, &g, nbc, p, X, X, XAUX);
760 15576 : if (fl > 1) return g; else if (fl) break;
761 15576 : set_avma(av2);
762 : }
763 6445 : set_avma(av2);
764 : }
765 : /* primes p larger than sqrt(B2) appear only to the 1st power */
766 9924 : while (p < B1)
767 : {
768 9849 : pari_sp av2 = avma;
769 9849 : p = snextpr(p, &np, &rcn, NULL, uisprime);
770 9849 : if (ellmult(N, &g, nbc, p, X, X, XAUX) > 1) return g;
771 9831 : set_avma(av2);
772 : }
773 75 : if (DEBUGLEVEL >= 4) {
774 0 : err_printf("ECM: time = %6ld ms, B1 phase done, ", timer_delay(&E->T));
775 0 : err_printf("p = %lu, setting up for B2\n", p);
776 : }
777 :
778 : /* ---B2 PHASE--- */
779 : /* compute [2]Q,...,[10]Q, needed to build the helix */
780 75 : if (elldouble(N, &g, nbc, X, XD) > 1) return g; /*[2]Q*/
781 75 : if (elldouble(N, &g, nbc, XD, XD + nbc2) > 1) return g; /*[4]Q*/
782 75 : if (ecm_elladd(N, &g, nbc,
783 75 : XD, XD + nbc2, XD + (nbc<<2)) > 1) return g; /* [6]Q */
784 75 : if (ecm_elladd2(N, &g, nbc,
785 : XD, XD + (nbc<<2), XT + (nbc<<3),
786 75 : XD + nbc2, XD + (nbc<<2), XD + (nbc<<3)) > 1)
787 0 : return g; /* [8]Q and [10]Q */
788 75 : if (DEBUGLEVEL >= 7) err_printf("\t(got [2]Q...[10]Q)\n");
789 :
790 : /* get next prime (still using the foolproof test) */
791 75 : p = snextpr(p, &np, &rcn, NULL, uisprime);
792 : /* make sure we have the residue class number (mod 210) */
793 75 : if (rcn == NPRC)
794 : {
795 75 : rcn = prc210_no[(p % 210) >> 1];
796 75 : if (rcn == NPRC)
797 : {
798 0 : err_printf("ECM: %lu should have been prime but isn\'t\n", p);
799 0 : pari_err_BUG("ellfacteur");
800 : }
801 : }
802 :
803 : /* compute [p]Q and put it into its place in the helix */
804 75 : if (ellmult(N, &g, nbc, p, X, XH + rcn*nbc2, XAUX) > 1)
805 0 : return g;
806 75 : if (DEBUGLEVEL >= 7)
807 0 : err_printf("\t(got [p]Q, p = %lu = prc210_rp[%ld] mod 210)\n", p, rcn);
808 :
809 : /* save current p, np, and rcn; we'll need them more than once below */
810 75 : p0 = p; np0 = np; rcn0 = rcn;
811 75 : bstp0 = 0; /* p is at baby-step offset 0 from itself */
812 :
813 : /* fill up the helix, stepping forward through the prime residue classes
814 : * mod 210 until we're back at the r'class of p0. Keep updating p so
815 : * that we can print meaningful diagnostics if a factor shows up; don't
816 : * bother checking which of these p's are in fact prime */
817 3600 : for (i = 47; i; i--) /* 47 iterations */
818 : {
819 3525 : ulong dp = (ulong)prc210_d1[rcn];
820 3525 : p += dp;
821 3525 : if (rcn == 47)
822 : { /* wrap mod 210 */
823 75 : if (ecm_elladd(N, &g, nbc, XT+dp*nbc, XH+rcn*nbc2, XH) > 1) return g;
824 75 : rcn = 0; continue;
825 : }
826 3450 : if (ecm_elladd(N, &g, nbc, XT+dp*nbc, XH+rcn*nbc2, XH+rcn*nbc2+nbc2) > 1)
827 0 : return g;
828 3450 : rcn++;
829 : }
830 75 : if (DEBUGLEVEL >= 7) err_printf("\t(got initial helix)\n");
831 : /* compute [210]Q etc, needed for the baby step table */
832 75 : if (ellmult(N, &g, nbc, 3, XD + (nbc<<3), X, XAUX) > 1) return g;
833 75 : if (ellmult(N, &g, nbc, 7, X, X, XAUX) > 1) return g; /* [210]Q */
834 : /* this was the last call to ellmult() in the main loop body; may now
835 : * overwrite XAUX and slots XD and following */
836 75 : if (elldouble(N, &g, nbc, X, XAUX) > 1) return g; /* [420]Q */
837 75 : if (ecm_elladd(N, &g, nbc, X, XAUX, XT) > 1) return g;/*[630]Q*/
838 75 : if (ecm_elladd(N, &g, nbc, X, XT, XD) > 1) return g; /*[840]Q*/
839 561 : for (i=1; i <= gse; i++)
840 486 : if (elldouble(N, &g, nbc, XT + i*nbc2, XD + i*nbc2) > 1) return g;
841 : /* (the last iteration has initialized XG to [210*2^(gse+1)]Q) */
842 :
843 75 : if (DEBUGLEVEL >= 4)
844 0 : err_printf("ECM: time = %6ld ms, entering B2 phase, p = %lu\n",
845 : timer_delay(&E->T), p);
846 :
847 391 : for (i = nbc - 4; i >= 0; i -= 4)
848 : { /* loop over small sets of 4 curves at a time */
849 : GEN *Xb;
850 : long j, k;
851 323 : if (DEBUGLEVEL >= 6)
852 0 : err_printf("ECM: finishing curves %ld...%ld\n", i, i+3);
853 : /* Copy relevant pointers from XH to Xh. Memory layout in XH:
854 : * nbc X coordinates, nbc Y coordinates for residue class
855 : * 1 mod 210, then the same for r.c. 11 mod 210, etc. Memory layout for
856 : * Xh is: four X coords for 1 mod 210, four for 11 mod 210, ..., four
857 : * for 209 mod 210, then the corresponding Y coordinates in the same
858 : * order. This allows a giant step on Xh using just three calls to
859 : * ecm_elladd0() each acting on 64 points in parallel */
860 15827 : for (j = 48; j--; )
861 : {
862 15504 : k = nbc2*j + i;
863 15504 : m = j << 2; /* X coordinates */
864 15504 : Xh[m] = XH[k]; Xh[m+1] = XH[k+1];
865 15504 : Xh[m+2] = XH[k+2]; Xh[m+3] = XH[k+3];
866 15504 : k += nbc; /* Y coordinates */
867 15504 : Yh[m] = XH[k]; Yh[m+1] = XH[k+1];
868 15504 : Yh[m+2] = XH[k+2]; Yh[m+3] = XH[k+3];
869 : }
870 : /* Build baby step table of X coords of multiples of [210]Q. XB[4*j]
871 : * will point at X coords on four curves from [(j+1)*210]Q. Until
872 : * we're done, we need some Y coords as well, which we keep in the
873 : * second half of the table, overwriting them at the end when gse=10.
874 : * Multiples which we already have (by 1,2,3,4,8,16,...,2^gse) are
875 : * entered simply by copying the pointers, ignoring the few slots in w
876 : * that were initially reserved for them. Here are the initial entries */
877 969 : for (Xb=XB,k=2,j=i; k--; Xb=XB2,j+=nbc) /* first X, then Y coords */
878 : {
879 646 : Xb[0] = X[j]; Xb[1] = X[j+1]; /* [210]Q */
880 646 : Xb[2] = X[j+2]; Xb[3] = X[j+3];
881 646 : Xb[4] = XAUX[j]; Xb[5] = XAUX[j+1]; /* [420]Q */
882 646 : Xb[6] = XAUX[j+2]; Xb[7] = XAUX[j+3];
883 646 : Xb[8] = XT[j]; Xb[9] = XT[j+1]; /* [630]Q */
884 646 : Xb[10] = XT[j+2]; Xb[11] = XT[j+3];
885 646 : Xb += 4; /* points at [420]Q */
886 : /* ... entries at powers of 2 times 210 .... */
887 4057 : for (m = 2; m < (ulong)gse+k; m++) /* omit Y coords of [2^gse*210]Q */
888 : {
889 3411 : long m2 = m*nbc2 + j;
890 3411 : Xb += (2UL<<m); /* points at [2^m*210]Q */
891 3411 : Xb[0] = XAUX[m2]; Xb[1] = XAUX[m2+1];
892 3411 : Xb[2] = XAUX[m2+2]; Xb[3] = XAUX[m2+3];
893 : }
894 : }
895 323 : if (DEBUGLEVEL >= 7)
896 0 : err_printf("\t(extracted precomputed helix / baby step entries)\n");
897 : /* ... glue in between, up to 16*210 ... */
898 323 : if (ecm_elladd0(N, &g, 12, 4, /* 12 pts + (4 pts replicated thrice) */
899 : XB + 12, XB2 + 12,
900 : XB, XB2,
901 0 : XB + 16, XB2 + 16) > 1) return g; /*4+{1,2,3} = {5,6,7}*/
902 323 : if (ecm_elladd0(N, &g, 28, 4, /* 28 pts + (4 pts replicated 7fold) */
903 : XB + 28, XB2 + 28,
904 : XB, XB2,
905 0 : XB + 32, XB2 + 32) > 1) return g;/*8+{1...7} = {9...15}*/
906 : /* ... and the remainder of the lot */
907 1221 : for (m = 5; m <= (ulong)gse; m++)
908 : { /* fill in from 2^(m-1)+1 to 2^m-1 in chunks of 64 and 60 points */
909 898 : ulong m2 = 2UL << m; /* will point at 2^(m-1)+1 */
910 1977 : for (j = 0; (ulong)j < m2-64; j+=64) /* executed 0 times when m = 5 */
911 : {
912 1906 : if (ecm_elladd0(N, &g, 64, 4,
913 1079 : XB + m2-4, XB2 + m2-4,
914 1079 : XB + j, XB2 + j,
915 1906 : XB + m2+j, (m<(ulong)gse? XB2+m2+j: NULL)) > 1)
916 0 : return g;
917 : } /* j = m2-64 here, 60 points left */
918 1221 : if (ecm_elladd0(N, &g, 60, 4,
919 898 : XB + m2-4, XB2 + m2-4,
920 898 : XB + j, XB2 + j,
921 1221 : XB + m2+j, (m<(ulong)gse? XB2+m2+j: NULL)) > 1)
922 0 : return g;
923 : /* when m=gse, drop Y coords of result, and when both equal 1024,
924 : * overwrite Y coords of second argument with X coords of result */
925 : }
926 323 : if (DEBUGLEVEL >= 7) err_printf("\t(baby step table complete)\n");
927 : /* initialize a few other things */
928 323 : bstp = bstp0; p = p0; np = np0; rcn = rcn0;
929 323 : g = gen_1; av1 = avma;
930 : /* scratchspace for prod (x_i-x_j) */
931 323 : avtmp = (pari_sp)new_chunk(8 * lgefint(N));
932 : /* The correct entry in XB to use depends on bstp and on where we are
933 : * on the helix. As we skip from prime to prime, bstp is incremented
934 : * by snextpr each time we wrap around through residue class number 0
935 : * (1 mod 210), but the baby step should not be taken until rcn>=rcn0,
936 : * i.e. until we pass again the residue class of p0.
937 : *
938 : * The correct signed multiplier is thus k = bstp - (rcn < rcn0),
939 : * and the offset from XB is four times (|k| - 1). When k=0, we ignore
940 : * the current prime: if it had led to a factorization, this
941 : * would have been noted during the last giant step, or -- when we
942 : * first get here -- whilst initializing the helix. When k > gss,
943 : * we must do a giant step and bump bstp back by -2*gss.
944 : *
945 : * The gcd of the product of X coord differences against N is taken just
946 : * before we do a giant step. */
947 4515264 : while (p < B2)
948 : {/* loop over probable primes p0 < p <= nextprime(B2), inserting giant
949 : * steps as necessary */
950 4514948 : p = snextpr(p, &np, &rcn, &bstp, uis2psp); /* next probable prime */
951 : /* work out the corresponding baby-step multiplier */
952 4514948 : k = bstp - (rcn < rcn0 ? 1 : 0);
953 4514948 : if (k > gss)
954 : { /* giant-step time, take gcd */
955 1114 : g = gcdii(g, N);
956 1114 : if (!is_pm1(g) && !equalii(g, N)) return g;
957 1107 : g = gen_1; set_avma(av1);
958 2214 : while (k > gss)
959 : { /* giant step */
960 1107 : if (DEBUGLEVEL >= 7) err_printf("\t(giant step at p = %lu)\n", p);
961 1107 : if (ecm_elladd0(N, &g, 64, 4, XG + i, YG + i,
962 0 : Xh, Yh, Xh, Yh) > 1) return g;
963 1107 : if (ecm_elladd0(N, &g, 64, 4, XG + i, YG + i,
964 : Xh + 64, Yh + 64, Xh + 64, Yh + 64) > 1)
965 0 : return g;
966 1107 : if (ecm_elladd0(N, &g, 64, 4, XG + i, YG + i,
967 : Xh + 128, Yh + 128, Xh + 128, Yh + 128) > 1)
968 0 : return g;
969 1107 : bstp -= (gss << 1);
970 1107 : k = bstp - (rcn < rcn0? 1: 0); /* recompute multiplier */
971 : }
972 : }
973 4514941 : if (!k) continue; /* point of interest is already in Xh */
974 4490276 : if (k < 0) k = -k;
975 4490276 : m = ((ulong)k - 1) << 2;
976 : /* accumulate product of differences of X coordinates */
977 4490276 : j = rcn<<2;
978 4490276 : avma = avtmp; /* go to garbage zone; don't use set_avma */
979 4490276 : g = modii(mulii(g, subii(XB[m], Xh[j])), N);
980 4490276 : g = modii(mulii(g, subii(XB[m+1], Xh[j+1])), N);
981 4490276 : g = modii(mulii(g, subii(XB[m+2], Xh[j+2])), N);
982 4490276 : g = mulii(g, subii(XB[m+3], Xh[j+3]));
983 4490276 : set_avma(av1);
984 4490276 : g = modii(g, N);
985 : }
986 316 : set_avma(av1);
987 : }
988 68 : return NULL;
989 : }
990 :
991 : /* ellfacteur() tuned to be useful as a first stage before MPQS, especially for
992 : * large arguments, when 'insist' is false, and now also for the case when
993 : * 'insist' is true, vaguely following suggestions by Paul Zimmermann
994 : * (http://www.loria.fr/~zimmerma/records/ecmnet.html). --GN 1998Jul,Aug */
995 : static GEN
996 3262 : ellfacteur(GEN N, int insist)
997 : {
998 3262 : const long size = expi(N) + 1;
999 3262 : pari_sp av = avma;
1000 : struct ECM E;
1001 3262 : long nbc, dsn, dsnmax, rep = 0;
1002 3262 : if (insist)
1003 : {
1004 0 : const long DSNMAX = numberof(TB1)-1;
1005 0 : dsnmax = (size >> 2) - 10;
1006 0 : if (dsnmax < 0) dsnmax = 0;
1007 0 : else if (dsnmax > DSNMAX) dsnmax = DSNMAX;
1008 0 : E.seed = 1 + (nbcmax<<7)*(size&0xffff); /* seed for choice of curves */
1009 :
1010 0 : dsn = (size >> 3) - 5;
1011 0 : if (dsn < 0) dsn = 0; else if (dsn > 47) dsn = 47;
1012 : /* pick up the torch where noninsistent stage would have given up */
1013 0 : nbc = dsn + (dsn >> 2) + 9; /* 8 or more curves in parallel */
1014 0 : nbc &= ~3; /* 4 | nbc */
1015 : }
1016 : else
1017 : {
1018 3262 : dsn = (size - 140) >> 3;
1019 3262 : if (dsn < 0)
1020 : {
1021 : #ifndef __EMX__ /* unless DOS/EMX: MPQS's disk access is abysmally slow */
1022 3205 : if (DEBUGLEVEL >= 4)
1023 0 : err_printf("ECM: number too small to justify this stage\n");
1024 3205 : return NULL; /* too small, decline the task */
1025 : #endif
1026 : dsn = 0;
1027 57 : } else if (dsn > 12) dsn = 12;
1028 57 : rep = (size <= 248 ?
1029 57 : (size <= 176 ? (size - 124) >> 4 : (size - 148) >> 3) :
1030 18 : (size - 224) >> 1);
1031 : #ifdef __EMX__ /* DOS/EMX: extra rounds (shun MPQS) */
1032 : rep += 20;
1033 : #endif
1034 57 : dsnmax = 72;
1035 : /* Use disjoint sets of curves for non-insist and insist phases; moreover,
1036 : * repeated calls acting on factors of the same original number should try
1037 : * to use fresh curves. The following achieves this */
1038 57 : E.seed = 1 + (nbcmax<<3)*(size & 0xf);
1039 57 : nbc = -1;
1040 : }
1041 57 : ECM_init(&E, N, nbc);
1042 57 : if (DEBUGLEVEL >= 4)
1043 : {
1044 0 : timer_start(&E.T);
1045 0 : err_printf("ECM: working on %ld curves at a time; initializing", E.nbc);
1046 0 : if (!insist)
1047 : {
1048 0 : if (rep == 1) err_printf(" for one round");
1049 0 : else err_printf(" for up to %ld rounds", rep);
1050 : }
1051 0 : err_printf("...\n");
1052 : }
1053 57 : if (dsn > dsnmax) dsn = dsnmax;
1054 : for(;;)
1055 36 : {
1056 93 : ulong B1 = insist? TB1[dsn]: TB1_for_stage[dsn];
1057 93 : GEN g = ECM_loop(&E, N, B1);
1058 93 : if (g)
1059 : {
1060 25 : if (DEBUGLEVEL >= 4)
1061 0 : err_printf("ECM: time = %6ld ms\n\tfound factor = %Ps\n",
1062 : timer_delay(&E.T), g);
1063 25 : return gc_GEN(av, g);
1064 : }
1065 68 : if (dsn < dsnmax)
1066 : {
1067 68 : if (insist) dsn++;
1068 68 : else { dsn += 2; if (dsn > dsnmax) dsn = dsnmax; }
1069 : }
1070 68 : if (!insist && !--rep)
1071 : {
1072 32 : if (DEBUGLEVEL >= 4)
1073 0 : err_printf("ECM: time = %6ld ms,\tellfacteur giving up.\n",
1074 : timer_delay(&E.T));
1075 32 : return gc_NULL(av);
1076 : }
1077 : }
1078 : }
1079 : /* assume rounds >= 1, seed >= 1, B1 <= ULONG_MAX / 110 */
1080 : GEN
1081 0 : Z_ECM(GEN N, long rounds, long seed, ulong B1)
1082 : {
1083 0 : pari_sp av = avma;
1084 : struct ECM E;
1085 : long i;
1086 0 : E.seed = seed;
1087 0 : ECM_init(&E, N, -1);
1088 0 : if (DEBUGLEVEL >= 4) timer_start(&E.T);
1089 0 : for (i = rounds; i--; )
1090 : {
1091 0 : GEN g = ECM_loop(&E, N, B1);
1092 0 : if (g) return gc_GEN(av, g);
1093 : }
1094 0 : return gc_NULL(av);
1095 : }
1096 :
1097 : /***********************************************************************/
1098 : /** **/
1099 : /** FACTORIZATION (Pollard-Brent rho) --GN1998Jun18-26 **/
1100 : /** pollardbrent() returns a nontrivial factor of n, assuming n is **/
1101 : /** composite and has no small prime divisor, or NULL if going on **/
1102 : /** would take more time than we want to spend. Sometimes it finds **/
1103 : /** more than one factor, and returns a structure suitable for **/
1104 : /** interpretation by ifac_crack. (Cf Algo 8.5.2 in ACiCNT) **/
1105 : /** **/
1106 : /***********************************************************************/
1107 : #define VALUE(x) gel(x,0)
1108 : #define EXPON(x) gel(x,1)
1109 : #define CLASS(x) gel(x,2)
1110 :
1111 : INLINE void
1112 51414 : INIT(GEN x, GEN v, GEN e, GEN c) {
1113 51414 : VALUE(x) = v;
1114 51414 : EXPON(x) = e;
1115 51414 : CLASS(x) = c;
1116 51414 : }
1117 : static void
1118 45508 : ifac_delete(GEN x) { INIT(x,NULL,NULL,NULL); }
1119 :
1120 : static void
1121 0 : rho_dbg(pari_timer *T, long c, long msg_mask)
1122 : {
1123 0 : if (c & msg_mask) return;
1124 0 : err_printf("Rho: time = %6ld ms,\t%3ld round%s\n",
1125 : timer_delay(T), c, (c==1?"":"s"));
1126 : }
1127 :
1128 : static void
1129 28251983 : one_iter(GEN *x, GEN *P, GEN x1, GEN n, long delta)
1130 : {
1131 28251983 : *x = addis(remii(sqri(*x), n), delta);
1132 28188691 : *P = modii(mulii(*P, subii(x1, *x)), n);
1133 28251531 : }
1134 : /* Return NULL when we run out of time, or a single t_INT containing a
1135 : * nontrivial factor of n, or a vector of t_INTs, each triple of successive
1136 : * entries containing a factor, an exponent (equal to one), and a factor
1137 : * class (NULL for unknown or zero for known composite), matching the
1138 : * internal representation used by the ifac_*() routines below. Repeated
1139 : * factors may arise; the caller will sort the factors anyway. Result
1140 : * is not GC-able (contains NULL) */
1141 : static GEN
1142 802 : pollardbrent_i(GEN n, long size, long c0, long retries)
1143 : {
1144 802 : long tf = lgefint(n), delta, msg_mask, c, k, k1, l;
1145 : pari_sp av;
1146 : GEN x, x1, y, P, g, g1, res;
1147 : pari_timer T;
1148 :
1149 802 : if (DEBUGLEVEL >= 4) timer_start(&T);
1150 802 : c = c0 << 5; /* 2^5 iterations per round */
1151 1604 : msg_mask = (size >= 448? 0x1fff:
1152 802 : (size >= 192? (256L<<((size-128)>>6))-1: 0xff));
1153 802 : y = cgeti(tf);
1154 802 : x1= cgeti(tf);
1155 802 : av = avma;
1156 :
1157 802 : PB_RETRY:
1158 : /* trick to make a 'random' choice determined by n. Don't use x^2+0 or
1159 : * x^2-2, ever. Don't use x^2-3 or x^2-7 with a starting value of 2.
1160 : * x^2+4, x^2+9 are affine conjugate to x^2+1, so don't use them either.
1161 : *
1162 : * (the point being that when we get called again on a composite cofactor
1163 : * of something we've already seen, we had better avoid the same delta) */
1164 802 : switch ((size + retries) & 7)
1165 : {
1166 107 : case 0: delta= 1; break;
1167 177 : case 1: delta= -1; break;
1168 92 : case 2: delta= 3; break;
1169 73 : case 3: delta= 5; break;
1170 72 : case 4: delta= -5; break;
1171 56 : case 5: delta= 7; break;
1172 141 : case 6: delta= 11; break;
1173 : /* case 7: */
1174 84 : default: delta=-11; break;
1175 : }
1176 802 : if (DEBUGLEVEL >= 4)
1177 : {
1178 0 : if (!retries)
1179 0 : err_printf("Rho: searching small factor of %ld-bit integer\n", size);
1180 : else
1181 0 : err_printf("Rho: restarting for remaining rounds...\n");
1182 0 : err_printf("Rho: using X^2%+1ld for up to %ld rounds of 32 iterations\n",
1183 : delta, c >> 5);
1184 : }
1185 802 : x = gen_2; P = gen_1; g1 = NULL; k = 1; l = 1;
1186 802 : affui(2, y);
1187 802 : affui(2, x1);
1188 : for (;;) /* terminated under the control of c */
1189 : { /* use the polynomial x^2 + delta */
1190 13203665 : one_iter(&x, &P, x1, n, delta);
1191 :
1192 13205268 : if ((--c & 0x1f)==0)
1193 : { /* one round complete */
1194 412575 : g = gcdii(n, P); if (!is_pm1(g)) goto fin;
1195 412338 : if (c <= 0)
1196 : { /* getting bored */
1197 396 : if (DEBUGLEVEL >= 4)
1198 0 : err_printf("Rho: time = %6ld ms,\tPollard-Brent giving up.\n",
1199 : timer_delay(&T));
1200 396 : return NULL;
1201 : }
1202 411942 : P = gen_1;
1203 411942 : if (DEBUGLEVEL >= 4) rho_dbg(&T, c0-(c>>5), msg_mask);
1204 411942 : affii(x,y); x = y; set_avma(av);
1205 : }
1206 :
1207 13203121 : if (--k) continue; /* normal end of loop body */
1208 :
1209 8613 : if (c & 0x1f) /* otherwise, we already checked */
1210 : {
1211 4812 : g = gcdii(n, P); if (!is_pm1(g)) goto fin;
1212 4812 : P = gen_1;
1213 : }
1214 :
1215 : /* Fast forward phase, doing l inner iterations without computing gcds.
1216 : * Check first whether it would take us beyond the alloted time.
1217 : * Fast forward rounds count only half (although they're taking
1218 : * more like 2/3 the time of normal rounds). This to counteract the
1219 : * nuisance that all c0 between 4096 and 6144 would act exactly as
1220 : * 4096; with the halving trick only the range 4096..5120 collapses
1221 : * (similarly for all other powers of two) */
1222 8613 : if ((c -= (l>>1)) <= 0)
1223 : { /* got bored */
1224 179 : if (DEBUGLEVEL >= 4)
1225 0 : err_printf("Rho: time = %6ld ms,\tPollard-Brent giving up.\n",
1226 : timer_delay(&T));
1227 179 : return NULL;
1228 : }
1229 8434 : c &= ~0x1f; /* keep it on multiples of 32 */
1230 :
1231 : /* Fast forward loop */
1232 8434 : affii(x, x1); set_avma(av); x = x1;
1233 8434 : k = l; l <<= 1;
1234 : /* don't show this for the first several (short) fast forward phases. */
1235 8434 : if (DEBUGLEVEL >= 4 && (l>>7) > msg_mask)
1236 0 : err_printf("Rho: fast forward phase (%ld rounds of 64)...\n", l>>7);
1237 15080559 : for (k1=k; k1; k1--)
1238 : {
1239 15072172 : one_iter(&x, &P, x1, n, delta);
1240 15070255 : if ((k1 & 0x1f) == 0) (void)gc_all(av, 2, &x, &P);
1241 : }
1242 8387 : if (DEBUGLEVEL >= 4 && (l>>7) > msg_mask)
1243 0 : err_printf("Rho: time = %6ld ms,\t%3ld rounds, back to normal mode\n",
1244 0 : timer_delay(&T), c0-(c>>5));
1245 8387 : affii(x,y); P = gc_INT(av, P); x = y;
1246 : } /* forever */
1247 :
1248 227 : fin:
1249 : /* An accumulated gcd was > 1 */
1250 227 : if (!equalii(g,n))
1251 : { /* if it isn't n, and looks prime, return it */
1252 227 : if (MR_Jaeschke(g))
1253 : {
1254 227 : if (DEBUGLEVEL >= 4)
1255 : {
1256 0 : rho_dbg(&T, c0-(c>>5), 0);
1257 0 : err_printf("\tfound factor = %Ps\n",g);
1258 : }
1259 227 : return g;
1260 : }
1261 0 : set_avma(av); g1 = icopy(g); /* known composite, keep it safe */
1262 0 : av = avma;
1263 : }
1264 0 : else g1 = n; /* and work modulo g1 for backtracking */
1265 :
1266 : /* Here g1 is known composite */
1267 0 : if (DEBUGLEVEL >= 4 && size > 192)
1268 0 : err_printf("Rho: hang on a second, we got something here...\n");
1269 0 : x = y;
1270 : for(;;)
1271 : { /* backtrack until period recovered. Must terminate */
1272 0 : x = addis(remii(sqri(x), g1), delta);
1273 0 : g = gcdii(subii(x1, x), g1); if (!is_pm1(g)) break;
1274 :
1275 0 : if (DEBUGLEVEL >= 4 && (--c & 0x1f) == 0) rho_dbg(&T, c0-(c>>5), msg_mask);
1276 : }
1277 :
1278 0 : if (g1 == n || equalii(g,g1))
1279 : {
1280 0 : if (g1 == n && equalii(g,g1))
1281 : { /* out of luck */
1282 0 : if (DEBUGLEVEL >= 4)
1283 : {
1284 0 : rho_dbg(&T, c0-(c>>5), 0);
1285 0 : err_printf("\tPollard-Brent failed.\n");
1286 : }
1287 0 : if (++retries >= 4) pari_err_BUG("");
1288 0 : goto PB_RETRY;
1289 : }
1290 : /* half lucky: we've split n, but g1 equals either g or n */
1291 0 : if (DEBUGLEVEL >= 4)
1292 : {
1293 0 : rho_dbg(&T, c0-(c>>5), 0);
1294 0 : err_printf("\tfound %sfactor = %Ps\n", (g1!=n ? "composite " : ""), g);
1295 : }
1296 0 : res = cgetg(7, t_VEC);
1297 : /* g^1: known composite when g1!=n */
1298 0 : INIT(res+1, g, gen_1, (g1!=n? gen_0: NULL));
1299 : /* cofactor^1: status unknown */
1300 0 : INIT(res+4, diviiexact(n,g), gen_1, NULL);
1301 0 : return res;
1302 : }
1303 : /* g < g1 < n : our lucky day -- we've split g1, too */
1304 0 : res = cgetg(10, t_VEC);
1305 : /* unknown status for all three factors */
1306 0 : INIT(res+1, g, gen_1, NULL);
1307 0 : INIT(res+4, diviiexact(g1,g), gen_1, NULL);
1308 0 : INIT(res+7, diviiexact(n,g1), gen_1, NULL);
1309 0 : if (DEBUGLEVEL >= 4)
1310 : {
1311 0 : rho_dbg(&T, c0-(c>>5), 0);
1312 0 : err_printf("\tfound factors = %Ps, %Ps,\n\tand %Ps\n",
1313 0 : gel(res,1), gel(res,4), gel(res,7));
1314 : }
1315 0 : return res;
1316 : }
1317 : /* decline if n < 2^96 */
1318 : static GEN
1319 3489 : pollardbrent(GEN n)
1320 : {
1321 3489 : const long tune = 14; /* FIXME: retune this */
1322 3489 : long c0, size, tf = lgefint(n);
1323 : #ifdef LONG_IS_64BIT
1324 3039 : if (tf < 4 || (tf == 4 && uel(n,2) < (1UL << 32))) return NULL;
1325 : #else /* 32 bits */
1326 450 : if (tf < 5) return NULL;
1327 : #endif
1328 802 : size = expi(n) + 1;
1329 : /* nonlinear increase in effort, kicking in around 80 bits */
1330 802 : if (size <= 301) /* 301 gives 48121 + tune */
1331 795 : c0 = tune + size-60 + ((size-73)>>1)*((size-70)>>3)*((size-56)>>4);
1332 : else
1333 7 : c0 = 49152; /* ECM is faster when it'd take longer */
1334 802 : return pollardbrent_i(n, size, c0, 0);
1335 : }
1336 : GEN
1337 0 : Z_pollardbrent(GEN n, long rounds, long seed)
1338 : {
1339 0 : pari_sp av = avma;
1340 0 : GEN v = pollardbrent_i(n, expi(n)+1, rounds, seed);
1341 0 : if (!v) return NULL;
1342 0 : if (typ(v) == t_INT) v = mkvec2(v, diviiexact(n,v));
1343 0 : else if (lg(v) == 7) v = mkvec2(gel(v,1), gel(v,4));
1344 0 : else v = mkvec3(gel(v,1), gel(v,4), gel(v,7));
1345 0 : return gc_GEN(av, v);
1346 : }
1347 :
1348 : /***********************************************************************/
1349 : /** FACTORIZATION (Shanks' SQUFOF) --GN2000Sep30-Oct01 **/
1350 : /** squfof() returns a proper factor of n, or NULL (failure). Assume **/
1351 : /** n is composite, not a square, and has no small prime divisors. **/
1352 : /** Works on two discriminants at once: n and 5n or 3n and 4n **/
1353 : /** Present implementation is limited to input <2^59, and works most **/
1354 : /** of the time in signed arithmetic on integers <2^31 in absolute **/
1355 : /** size. (Cf. Algo 8.7.2 in ACiCNT) **/
1356 : /***********************************************************************/
1357 :
1358 : /* squfof_ambig walks back along the ambiguous cycle until we hit an ambiguous
1359 : * form and thus the desired factor, which it returns. Returs 0 on failure.
1360 : *
1361 : * Input: a form (A, B, -C) with A = a^2, where a isn't blacklisted and
1362 : * (a, B) = 1. We should now proceed reducing the form (a, -B, -aC), but the
1363 : * first reduction step always sends this to (-aC, B, a), and the next one,
1364 : * with q computed as usual from B and a (occupying the c position), gives a
1365 : * reduced form, whose third member is easiest to recover by going back to D.
1366 : * From this point onwards, we're once again working with single-word numbers.
1367 : * No need to track signs, just work with the abs values of the coefficients.
1368 : * HACK: if LONG_IS_64BIT, D is actually a typecast long */
1369 : static long
1370 2007 : squfof_ambig(long a, long B, long dd, GEN D)
1371 : {
1372 : long b, c, q, qa, a0, b0, b1;
1373 2007 : long cnt = 0; /* count reduction steps on the cycle */
1374 :
1375 2007 : q = (dd + (B>>1)) / a;
1376 2007 : qa = q * a;
1377 2007 : b = (qa - B) + qa; /* avoid overflow */
1378 : #ifdef LONG_IS_64BIT
1379 1548 : c = (((long)D - b*b) >> 2) / a;
1380 : #else
1381 : {
1382 459 : pari_sp av = avma;
1383 459 : c = itos(divis(shifti(subii(D, sqrs(b)), -2), a));
1384 459 : set_avma(av);
1385 : }
1386 : #endif
1387 2007 : a0 = a; b0 = b1 = b; /* end of loop detection and safeguard */
1388 : for (;;)
1389 957465 : { /* reduction step */
1390 959472 : long c0 = c, qc, qcb;
1391 959472 : if (c0 > dd)
1392 267956 : q = 1;
1393 : else
1394 691516 : q = (dd + (b>>1)) / c0;
1395 959472 : if (q == 1)
1396 : {
1397 396957 : qcb = c0 - b; b = c0 + qcb; c = a - qcb;
1398 : }
1399 : else
1400 : {
1401 562515 : qc = q*c0; qcb = qc - b; b = qc + qcb; c = a - q*qcb;
1402 : }
1403 959472 : a = c0;
1404 :
1405 959472 : cnt++; if (b == b1) break;
1406 :
1407 : /* safeguard against infinite loop: we walked the cycle in vain.
1408 : * (I don't think this can actually happen.) */
1409 957465 : if (b == b0 && a == a0) return 0;
1410 :
1411 957465 : b1 = b;
1412 : }
1413 2007 : q = a&1 ? a : a>>1;
1414 2007 : if (DEBUGLEVEL >= 4)
1415 : {
1416 0 : if (q > 1)
1417 0 : err_printf("SQUFOF: found factor %ld from ambiguous form\n"
1418 : "\tafter %ld steps on the ambiguous cycle\n",
1419 0 : q / ugcd(q,15), cnt);
1420 : else
1421 0 : err_printf("SQUFOF: ...found nothing on the ambiguous cycle\n"
1422 : "\tafter %ld steps there\n", cnt);
1423 0 : if (DEBUGLEVEL >= 6) err_printf("SQUFOF: squfof_ambig returned %ld\n", q);
1424 : }
1425 2007 : return q;
1426 : }
1427 :
1428 : #define SQUFOF_BLACKLIST_SZ 64
1429 :
1430 : /* assume (n,30) = 1 */
1431 : static GEN
1432 5057 : squfof(GEN n)
1433 : {
1434 : ulong d1, d2;
1435 : #ifdef LONG_IS_64BIT
1436 : ulong uD1, uD2;
1437 : #endif
1438 5057 : long tf = lgefint(n), nm4, cnt = 0;
1439 : long a1, b1, c1, dd1, L1, a2, b2, c2, dd2, L2, a, q, c, qc, qcb;
1440 : GEN D1, D2;
1441 5057 : pari_sp av = avma;
1442 : long blacklist1[SQUFOF_BLACKLIST_SZ], blacklist2[SQUFOF_BLACKLIST_SZ];
1443 5057 : long blp1 = 0, blp2 = 0;
1444 5057 : int act1 = 1, act2 = 1;
1445 :
1446 : #ifdef LONG_IS_64BIT
1447 4263 : if (tf > 3 || (tf == 3 && uel(n,2) >= (1UL << 46)))
1448 : #else /* 32 bits */
1449 794 : if (tf > 4 || (tf == 4 && (ulong)(*int_MSW(n)) >= (1UL << 17))) /* 49 */
1450 : #endif
1451 3489 : return NULL; /* n too large */
1452 :
1453 : /* now we have 5 < n < 2^59 */
1454 1568 : nm4 = mod4(n);
1455 : #ifdef LONG_IS_64BIT
1456 1224 : if (nm4 == 1)
1457 : { /* n = 1 (mod4): run one iteration on D1 = n, another on D2 = 5n */
1458 564 : uD1 = n[2];
1459 564 : uD2 = 5 * n[2]; d2 = usqrt(uD2); dd2 = (long)((d2>>1) + (d2&1));
1460 564 : b2 = (long)((d2-1) | 1); /* b1, b2 will always stay odd */
1461 : }
1462 : else
1463 : { /* n = 3 (mod4): run one iteration on D1 = 3n, another on D2 = 4n */
1464 660 : uD1 = 3 * n[2];
1465 660 : uD2 = 4 * n[2]; dd2 = usqrt(n[2]); d2 = dd2 << 1;
1466 660 : b2 = (long)(d2 & (~1UL)); /* largest even below d2, will stay even */
1467 : }
1468 1224 : D1 = (GEN)uD1;
1469 1224 : D2 = (GEN)uD2;
1470 1224 : d1 = usqrt(uD1);
1471 1224 : b1 = (long)((d1-1) | 1); /* largest odd number not exceeding d1 */
1472 : /* c1 != 0 else n or 3n would be a square */
1473 1224 : c1 = (uD1 - b1*b1) / 4;
1474 : /* c2 != 0 else 5n would be a square */
1475 1224 : c2 = (uD2 - b2*b2) / 4;
1476 : #else
1477 344 : if (nm4 == 1)
1478 : { /* n = 1 (mod4): run one iteration on D1 = n, another on D2 = 5n */
1479 173 : D1 = n;
1480 173 : D2 = mului(5,n); d2 = itou(sqrti(D2)); dd2 = (long)((d2>>1) + (d2&1));
1481 173 : b2 = (long)((d2-1) | 1); /* b1, b2 will always stay odd */
1482 : }
1483 : else
1484 : { /* n = 3 (mod4): run one iteration on D1 = 3n, another on D2 = 4n */
1485 171 : D1 = mului(3,n);
1486 171 : D2 = shifti(n,2); dd2 = itou(sqrti(n)); d2 = dd2 << 1;
1487 171 : b2 = (long)(d2 & (~1UL)); /* largest even below d2, will stay even */
1488 : }
1489 344 : d1 = itou(sqrti(D1));
1490 344 : b1 = (long)((d1-1) | 1); /* largest odd number not exceeding d1 */
1491 : /* c1 != 0 else n or 3n would be a square */
1492 344 : c1 = itos(shifti(subii(D1, sqru((ulong)b1)), -2));
1493 : /* c2 != 0 else 5n would be a square */
1494 344 : c2 = itos(shifti(subii(D2, sqru((ulong)b2)), -2));
1495 : #endif
1496 1568 : L1 = (long)usqrt(d1);
1497 1568 : L2 = (long)usqrt(d2);
1498 : /* dd1 used to compute floor((d1+b1)/2) as dd1+floor(b1/2), without
1499 : * overflowing the 31bit signed integer size limit. Same for dd2. */
1500 1568 : dd1 = (long) ((d1>>1) + (d1&1));
1501 1568 : a1 = a2 = 1;
1502 :
1503 : /* The two (identity) forms (a1,b1,-c1) and (a2,b2,-c2) are now set up.
1504 : *
1505 : * a1 and c1 represent the absolute values of the a,c coefficients; we keep
1506 : * track of the sign separately, via the iteration counter cnt: when cnt is
1507 : * even, c < 0 and a > 0, else c > 0 and a < 0.
1508 : *
1509 : * L1, L2 are the limits for blacklisting small leading coefficients
1510 : * on the principal cycle, to guarantee that when we find a square form,
1511 : * its square root will belong to an ambiguous cycle, i.e. won't be an
1512 : * earlier form on the principal cycle.
1513 : *
1514 : * When n = 3(mod 4), D2 = 12(mod 16), and b^2 is 0 or 4 mod 16.
1515 : * It follows that 4*a*c must be 4 or 8 mod 16, respectively, so at most
1516 : * one of a,c can be divisible by 2 at most to the first power. This fact
1517 : * is used a couple of times below.
1518 : *
1519 : * The flags act1, act2 remain true while the respective cycle is still
1520 : * active; we drop them to false when we return to the identity form with-
1521 : * out having found a square form (or when the blacklist overflows, which
1522 : * shouldn't happen). */
1523 1568 : if (DEBUGLEVEL >= 4)
1524 0 : err_printf("SQUFOF: entering main loop with forms\n"
1525 : "\t(1, %ld, %ld) and (1, %ld, %ld)\n", b1, -c1, b2, -c2);
1526 :
1527 : /* MAIN LOOP: walk around the principal cycle looking for a square form.
1528 : * Blacklist small leading coefficients.
1529 : *
1530 : * The reduction operator can be computed entirely in 32-bit arithmetic:
1531 : * Let q = floor(floor((d1+b1)/2)/c1) (when c1>dd1, q=1, which happens
1532 : * often enough to special-case it). Then the new b1 = (q*c1-b1) + q*c1,
1533 : * which does not overflow, and the new c1 = a1 - q*(q*c1-b1), which is
1534 : * bounded by d1 in abs size since both the old and the new a1 are positive
1535 : * and bounded by d1. */
1536 1388286 : while (act1 || act2)
1537 : {
1538 1388286 : if (act1)
1539 : { /* send first form through reduction operator if active */
1540 1388286 : c = c1;
1541 1388286 : q = (c > dd1)? 1: (dd1 + (b1>>1)) / c;
1542 1388286 : if (q == 1)
1543 575778 : { qcb = c - b1; b1 = c + qcb; c1 = a1 - qcb; }
1544 : else
1545 812508 : { qc = q*c; qcb = qc - b1; b1 = qc + qcb; c1 = a1 - q*qcb; }
1546 1388286 : a1 = c;
1547 :
1548 1388286 : if (a1 <= L1)
1549 : { /* blacklist this */
1550 1017 : if (blp1 >= SQUFOF_BLACKLIST_SZ) /* overflows: shouldn't happen */
1551 0 : act1 = 0;
1552 : else
1553 : {
1554 1017 : if (DEBUGLEVEL >= 6)
1555 0 : err_printf("SQUFOF: blacklisting a = %ld on first cycle\n", a1);
1556 1017 : blacklist1[blp1++] = a1;
1557 : }
1558 : }
1559 : }
1560 1388286 : if (act2)
1561 : { /* send second form through reduction operator if active */
1562 1388094 : c = c2;
1563 1388094 : q = (c > dd2)? 1: (dd2 + (b2>>1)) / c;
1564 1388094 : if (q == 1)
1565 575488 : { qcb = c - b2; b2 = c + qcb; c2 = a2 - qcb; }
1566 : else
1567 812606 : { qc = q*c; qcb = qc - b2; b2 = qc + qcb; c2 = a2 - q*qcb; }
1568 1388094 : a2 = c;
1569 :
1570 1388094 : if (a2 <= L2)
1571 : { /* blacklist this */
1572 1073 : if (blp2 >= SQUFOF_BLACKLIST_SZ) /* overflows: shouldn't happen */
1573 0 : act2 = 0;
1574 : else
1575 : {
1576 1073 : if (DEBUGLEVEL >= 6)
1577 0 : err_printf("SQUFOF: blacklisting a = %ld on second cycle\n", a2);
1578 1073 : blacklist2[blp2++] = a2;
1579 : }
1580 : }
1581 : }
1582 :
1583 1388286 : if (++cnt & 1) continue; /* odd iteration */
1584 : /* even iteration: the leading coefficients are positive */
1585 :
1586 : /* examine first form if active */
1587 694143 : if (act1 && a1 == 1) /* back to identity */
1588 : { /* drop this discriminant */
1589 0 : act1 = 0;
1590 0 : if (DEBUGLEVEL >= 4)
1591 0 : err_printf("SQUFOF: first cycle exhausted after %ld iterations,\n"
1592 : "\tdropping it\n", cnt);
1593 : }
1594 694143 : if (act1)
1595 : {
1596 694143 : if (uissquareall((ulong)a1, (ulong*)&a))
1597 : { /* square form */
1598 1274 : if (DEBUGLEVEL >= 4)
1599 0 : err_printf("SQUFOF: square form (%ld^2, %ld, %ld) on first cycle\n"
1600 : "\tafter %ld iterations\n", a, b1, -c1, cnt);
1601 1274 : if (a <= L1)
1602 : { /* blacklisted? */
1603 : long j;
1604 2394 : for (j = 0; j < blp1; j++)
1605 1578 : if (a == blacklist1[j]) { a = 0; break; }
1606 : }
1607 1274 : if (a > 0)
1608 : { /* not blacklisted */
1609 816 : q = ugcd(a, b1); /* imprimitive form? */
1610 816 : if (q > 1)
1611 : { /* q^2 divides D1 hence n [ assuming n % 3 != 0 ] */
1612 0 : set_avma(av);
1613 0 : if (DEBUGLEVEL >= 4) err_printf("SQUFOF: found factor %ld^2\n", q);
1614 0 : return mkvec3(utoipos(q), gen_2, NULL);/* q^2, unknown status */
1615 : }
1616 : /* chase the inverse root form back along the ambiguous cycle */
1617 816 : q = squfof_ambig(a, b1, dd1, D1);
1618 816 : if (q > 3)
1619 : {
1620 670 : if (nm4 == 3 && q % 3 == 0) q /= 3;
1621 670 : return gc_utoipos(av, q); /* SUCCESS! */
1622 : }
1623 : }
1624 458 : else if (DEBUGLEVEL >= 4) /* blacklisted */
1625 0 : err_printf("SQUFOF: ...but the root form seems to be on the "
1626 : "principal cycle\n");
1627 : }
1628 : }
1629 :
1630 : /* examine second form if active */
1631 693473 : if (act2 && a2 == 1) /* back to identity form */
1632 : { /* drop this discriminant */
1633 2 : act2 = 0;
1634 2 : if (DEBUGLEVEL >= 4)
1635 0 : err_printf("SQUFOF: second cycle exhausted after %ld iterations,\n"
1636 : "\tdropping it\n", cnt);
1637 : }
1638 693473 : if (act2)
1639 : {
1640 693377 : if (uissquareall((ulong)a2, (ulong*)&a))
1641 : { /* square form */
1642 1458 : if (DEBUGLEVEL >= 4)
1643 0 : err_printf("SQUFOF: square form (%ld^2, %ld, %ld) on second cycle\n"
1644 : "\tafter %ld iterations\n", a, b2, -c2, cnt);
1645 1458 : if (a <= L2)
1646 : { /* blacklisted? */
1647 : long j;
1648 2575 : for (j = 0; j < blp2; j++)
1649 1384 : if (a == blacklist2[j]) { a = 0; break; }
1650 : }
1651 1458 : if (a > 0)
1652 : { /* not blacklisted */
1653 1191 : q = ugcd(a, b2); /* imprimitive form? */
1654 : /* NB if b2 is even, a is odd, so the gcd is always odd */
1655 1191 : if (q > 1)
1656 : { /* q^2 divides D2 hence n [ assuming n % 5 != 0 ] */
1657 0 : set_avma(av);
1658 0 : if (DEBUGLEVEL >= 4) err_printf("SQUFOF: found factor %ld^2\n", q);
1659 0 : return mkvec3(utoipos(q), gen_2, NULL);/* q^2, unknown status */
1660 : }
1661 : /* chase the inverse root form along the ambiguous cycle */
1662 1191 : q = squfof_ambig(a, b2, dd2, D2);
1663 1191 : if (q > 5)
1664 : {
1665 898 : if (nm4 == 1 && q % 5 == 0) q /= 5;
1666 898 : return gc_utoipos(av, q); /* SUCCESS! */
1667 : }
1668 : }
1669 267 : else if (DEBUGLEVEL >= 4) /* blacklisted */
1670 0 : err_printf("SQUFOF: ...but the root form seems to be on the "
1671 : "principal cycle\n");
1672 : }
1673 : }
1674 : } /* end main loop */
1675 :
1676 0 : if (DEBUGLEVEL>=4) err_printf("SQUFOF: giving up\n");
1677 0 : return gc_NULL(av);
1678 : }
1679 :
1680 : /***********************************************************************/
1681 : /* DETECTING ODD POWERS --GN1998Jun28 */
1682 : /* Factoring engines like MPQS which ultimately rely on computing */
1683 : /* gcd(N, x^2-y^2) to find a nontrivial factor of N can't split */
1684 : /* N = p^k for an odd prime p, since (Z/p^k)^* is then cyclic. Here */
1685 : /* is an analogue of Z_issquareall() for 3rd, 5th and 7th powers. */
1686 : /* The general case is handled by is_kth_power */
1687 : /***********************************************************************/
1688 :
1689 : /* Multistage sieve. First stages work mod 211, 209, 61, 203 in this order
1690 : * (first reduce mod the product of these and then take the remainder apart).
1691 : * Second stages use 117, 31, 43, 71. Moduli which are no longer interesting
1692 : * are skipped. Everything is encoded in a table of 106 24-bit masks. We only
1693 : * need the first half of the residues. Three bits per modulus indicate which
1694 : * residues are 7th (bit 2), 5th (bit 1) or 3rd (bit 0) powers; the eight
1695 : * moduli above are assigned right-to-left. The table was generated using: */
1696 :
1697 : #if 0
1698 : L = [71, 43, 31, [O(3^2),O(13)], [O(7),O(29)], 61, [O(11),O(19)], 211];
1699 : ispow(x, N, k)=
1700 : {
1701 : if (type(N) == "t_INT", return (ispower(Mod(x,N), k)));
1702 : for (i = 1, #N, if (!ispower(x + N[i], k), return (0))); 1
1703 : }
1704 : check(r) =
1705 : {
1706 : print1(" 0");
1707 : for (i=1,#L,
1708 : N = 0;
1709 : if (ispow(r, L[i], 3), N += 1);
1710 : if (ispow(r, L[i], 5), N += 2);
1711 : if (ispow(r, L[i], 7), N += 4);
1712 : print1(N);
1713 : ); print("ul, /* ", r, " */")
1714 : }
1715 : for (r = 0, 105, check(r))
1716 : #endif
1717 : static ulong powersmod[106] = {
1718 : 077777777ul, /* 0 */
1719 : 077777777ul, /* 1 */
1720 : 013562440ul, /* 2 */
1721 : 012402540ul, /* 3 */
1722 : 013562440ul, /* 4 */
1723 : 052662441ul, /* 5 */
1724 : 016603440ul, /* 6 */
1725 : 016463450ul, /* 7 */
1726 : 013573551ul, /* 8 */
1727 : 012462540ul, /* 9 */
1728 : 012462464ul, /* 10 */
1729 : 013462771ul, /* 11 */
1730 : 012406473ul, /* 12 */
1731 : 012463641ul, /* 13 */
1732 : 052463646ul, /* 14 */
1733 : 012503446ul, /* 15 */
1734 : 013562440ul, /* 16 */
1735 : 052466440ul, /* 17 */
1736 : 012472451ul, /* 18 */
1737 : 012462454ul, /* 19 */
1738 : 032463550ul, /* 20 */
1739 : 013403664ul, /* 21 */
1740 : 013463460ul, /* 22 */
1741 : 032562565ul, /* 23 */
1742 : 012402540ul, /* 24 */
1743 : 052662441ul, /* 25 */
1744 : 032672452ul, /* 26 */
1745 : 013573551ul, /* 27 */
1746 : 012467541ul, /* 28 */
1747 : 012567640ul, /* 29 */
1748 : 032706450ul, /* 30 */
1749 : 012762452ul, /* 31 */
1750 : 033762662ul, /* 32 */
1751 : 012502562ul, /* 33 */
1752 : 032463562ul, /* 34 */
1753 : 013563440ul, /* 35 */
1754 : 016663440ul, /* 36 */
1755 : 036662550ul, /* 37 */
1756 : 012462552ul, /* 38 */
1757 : 033502450ul, /* 39 */
1758 : 012462643ul, /* 40 */
1759 : 033467540ul, /* 41 */
1760 : 017403441ul, /* 42 */
1761 : 017463462ul, /* 43 */
1762 : 017472460ul, /* 44 */
1763 : 033462470ul, /* 45 */
1764 : 052566450ul, /* 46 */
1765 : 013562640ul, /* 47 */
1766 : 032403640ul, /* 48 */
1767 : 016463450ul, /* 49 */
1768 : 016463752ul, /* 50 */
1769 : 033402440ul, /* 51 */
1770 : 012462540ul, /* 52 */
1771 : 012472540ul, /* 53 */
1772 : 053562462ul, /* 54 */
1773 : 012463465ul, /* 55 */
1774 : 012663470ul, /* 56 */
1775 : 052607450ul, /* 57 */
1776 : 012566553ul, /* 58 */
1777 : 013466440ul, /* 59 */
1778 : 012502741ul, /* 60 */
1779 : 012762744ul, /* 61 */
1780 : 012763740ul, /* 62 */
1781 : 012763443ul, /* 63 */
1782 : 013573551ul, /* 64 */
1783 : 013462471ul, /* 65 */
1784 : 052502460ul, /* 66 */
1785 : 012662463ul, /* 67 */
1786 : 012662451ul, /* 68 */
1787 : 012403550ul, /* 69 */
1788 : 073567540ul, /* 70 */
1789 : 072463445ul, /* 71 */
1790 : 072462740ul, /* 72 */
1791 : 012472442ul, /* 73 */
1792 : 012462644ul, /* 74 */
1793 : 013406650ul, /* 75 */
1794 : 052463471ul, /* 76 */
1795 : 012563474ul, /* 77 */
1796 : 013503460ul, /* 78 */
1797 : 016462441ul, /* 79 */
1798 : 016462440ul, /* 80 */
1799 : 012462540ul, /* 81 */
1800 : 013462641ul, /* 82 */
1801 : 012463454ul, /* 83 */
1802 : 013403550ul, /* 84 */
1803 : 057563540ul, /* 85 */
1804 : 017466441ul, /* 86 */
1805 : 017606471ul, /* 87 */
1806 : 053666573ul, /* 88 */
1807 : 012562561ul, /* 89 */
1808 : 013473641ul, /* 90 */
1809 : 032573440ul, /* 91 */
1810 : 016763440ul, /* 92 */
1811 : 016702640ul, /* 93 */
1812 : 033762552ul, /* 94 */
1813 : 012562550ul, /* 95 */
1814 : 052402451ul, /* 96 */
1815 : 033563441ul, /* 97 */
1816 : 012663561ul, /* 98 */
1817 : 012677560ul, /* 99 */
1818 : 012462464ul, /* 100 */
1819 : 032562642ul, /* 101 */
1820 : 013402551ul, /* 102 */
1821 : 032462450ul, /* 103 */
1822 : 012467445ul, /* 104 */
1823 : 032403440ul, /* 105 */
1824 : };
1825 :
1826 : static int
1827 3927875 : check_res(ulong x, ulong N, int shift, ulong *mask)
1828 : {
1829 3927875 : long r = x%N; if ((ulong)r> (N>>1)) r = N - r;
1830 3927875 : *mask &= (powersmod[r] >> shift);
1831 3927875 : return *mask;
1832 : }
1833 :
1834 : /* is x mod 211*209*61*203*117*31*43*71 a 3rd, 5th or 7th power ? */
1835 : int
1836 2421443 : uis_357_powermod(ulong x, ulong *mask)
1837 : {
1838 2421443 : if ( !check_res(x, 211UL, 0, mask)) return 0;
1839 977975 : if (*mask & 3 && !check_res(x, 209UL, 3, mask)) return 0;
1840 399496 : if (*mask & 3 && !check_res(x, 61UL, 6, mask)) return 0;
1841 222404 : if (*mask & 5 && !check_res(x, 203UL, 9, mask)) return 0;
1842 56984 : if (*mask & 1 && !check_res(x, 117UL,12, mask)) return 0;
1843 32993 : if (*mask & 3 && !check_res(x, 31UL,15, mask)) return 0;
1844 24761 : if (*mask & 5 && !check_res(x, 43UL,18, mask)) return 0;
1845 7521 : if (*mask & 6 && !check_res(x, 71UL,21, mask)) return 0;
1846 4060 : return 1;
1847 : }
1848 : /* asume x > 0 and pt != NULL */
1849 : int
1850 2366915 : uis_357_power(ulong x, ulong *pt, ulong *mask)
1851 : {
1852 : double logx;
1853 2366915 : if (!odd(x))
1854 : {
1855 9088 : long v = vals(x);
1856 9088 : if (v % 7) *mask &= ~4;
1857 9088 : if (v % 5) *mask &= ~2;
1858 9088 : if (v % 3) *mask &= ~1;
1859 9088 : if (!*mask) return 0;
1860 : }
1861 2359322 : if (!uis_357_powermod(x, mask)) return 0;
1862 2953 : logx = log((double)x);
1863 3825 : while (*mask)
1864 : {
1865 : long e, b;
1866 : ulong y, ye;
1867 2953 : if (*mask & 1) { b = 1; e = 3; }
1868 873 : else if (*mask & 2) { b = 2; e = 5; }
1869 355 : else { b = 4; e = 7; }
1870 2953 : y = (ulong)(exp(logx / e) + 0.5);
1871 2953 : ye = upowuu(y,e);
1872 2953 : if (ye == x) { *pt = y; return e; }
1873 : #ifdef LONG_IS_64BIT
1874 750 : if (ye > x) y--; else y++;
1875 750 : ye = upowuu(y,e);
1876 750 : if (ye == x) { *pt = y; return e; }
1877 : #endif
1878 872 : *mask &= ~b; /* turn the bit off */
1879 : }
1880 872 : return 0;
1881 : }
1882 :
1883 : #ifndef LONG_IS_64BIT
1884 : /* as above, split in two functions */
1885 : /* is x mod 211*209*61*203 a 3rd, 5th or 7th power ? */
1886 : static int
1887 14330 : uis_357_powermod_32bit_1(ulong x, ulong *mask)
1888 : {
1889 14330 : if ( !check_res(x, 211UL, 0, mask)) return 0;
1890 7906 : if (*mask & 3 && !check_res(x, 209UL, 3, mask)) return 0;
1891 4099 : if (*mask & 3 && !check_res(x, 61UL, 6, mask)) return 0;
1892 2933 : if (*mask & 5 && !check_res(x, 203UL, 9, mask)) return 0;
1893 847 : return 1;
1894 : }
1895 : /* is x mod 117*31*43*71 a 3rd, 5th or 7th power ? */
1896 : static int
1897 847 : uis_357_powermod_32bit_2(ulong x, ulong *mask)
1898 : {
1899 847 : if (*mask & 1 && !check_res(x, 117UL,12, mask)) return 0;
1900 678 : if (*mask & 3 && !check_res(x, 31UL,15, mask)) return 0;
1901 551 : if (*mask & 5 && !check_res(x, 43UL,18, mask)) return 0;
1902 283 : if (*mask & 6 && !check_res(x, 71UL,21, mask)) return 0;
1903 227 : return 1;
1904 : }
1905 : #endif
1906 :
1907 : /* Returns 3, 5, or 7 if x is a cube (but not a 5th or 7th power), a 5th
1908 : * power (but not a 7th), or a 7th power, and in this case creates the
1909 : * base on the stack and assigns its address to *pt. Otherwise returns 0.
1910 : * x must be of type t_INT and positive; this is not checked. The *mask
1911 : * argument tells us which things to check -- bit 0: 3rd, bit 1: 5th,
1912 : * bit 2: 7th pwr; set a bit to have the corresponding power examined --
1913 : * and is updated appropriately for a possible follow-up call */
1914 : int
1915 2800941 : is_357_power(GEN x, GEN *pt, ulong *mask)
1916 : {
1917 2800941 : long lx = lgefint(x);
1918 : ulong r;
1919 : pari_sp av;
1920 : GEN y;
1921 :
1922 2800941 : if (!*mask) return 0; /* useful when running in a loop */
1923 2429557 : if (DEBUGLEVEL>4)
1924 0 : err_printf("OddPwrs: examining %ld-bit integer\n", expi(x)+1);
1925 2429557 : if (lgefint(x) == 3) {
1926 : ulong t;
1927 2353104 : long e = uis_357_power(x[2], &t, mask);
1928 2353104 : if (e)
1929 : {
1930 2055 : if (pt) *pt = utoi(t);
1931 2055 : return e;
1932 : }
1933 2351049 : return 0;
1934 : }
1935 : #ifdef LONG_IS_64BIT
1936 62123 : r = (lx == 3)? uel(x,2): umodiu(x, 6046846918939827UL);
1937 62122 : if (!uis_357_powermod(r, mask)) return 0;
1938 : #else
1939 14330 : r = (lx == 3)? uel(x,2): umodiu(x, 211*209*61*203);
1940 14330 : if (!uis_357_powermod_32bit_1(r, mask)) return 0;
1941 847 : r = (lx == 3)? uel(x,2): umodiu(x, 117*31*43*71);
1942 847 : if (!uis_357_powermod_32bit_2(r, mask)) return 0;
1943 : #endif
1944 1337 : av = avma;
1945 2608 : while (*mask)
1946 : {
1947 : long e, b;
1948 : /* priority to higher powers: if we have a 21st, it is easier to rediscover
1949 : * that its 7th root is a cube than that its cube root is a 7th power */
1950 1967 : if (*mask & 4) { b = 4; e = 7; }
1951 1368 : else if (*mask & 2) { b = 2; e = 5; }
1952 499 : else { b = 1; e = 3; }
1953 1967 : y = mpround( sqrtnr(itor(x, nbits2prec(64 + bit_accuracy(lx) / e)), e) );
1954 1967 : if (equalii(powiu(y,e), x))
1955 : {
1956 696 : if (!pt) return gc_int(av,e);
1957 682 : set_avma((pari_sp)y); *pt = gc_INT(av, y);
1958 682 : return e;
1959 : }
1960 1271 : *mask &= ~b; /* turn the bit off */
1961 1271 : set_avma(av);
1962 : }
1963 641 : return 0;
1964 : }
1965 :
1966 : /* Is x a n-th power ? If pt != NULL, it receives the n-th root */
1967 : ulong
1968 480071 : is_kth_power(GEN x, ulong n, GEN *pt)
1969 : {
1970 : forprime_t T;
1971 : long j;
1972 : ulong q, residue;
1973 : GEN y;
1974 480071 : pari_sp av = avma;
1975 :
1976 480071 : (void)u_forprime_arith_init(&T, odd(n)? 2*n+1: n+1, ULONG_MAX, 1,n);
1977 : /* we'll start at q, smallest prime >= n */
1978 :
1979 : /* Modular checks, use small primes q congruent 1 mod n */
1980 : /* A non n-th power nevertheless passes the test with proba n^(-#checks),
1981 : * We'd like this < 1e-6 but let j = floor(log(1e-6) / log(n)) which
1982 : * ensures much less. */
1983 479833 : if (n < 16)
1984 116717 : j = 5;
1985 363116 : else if (n < 32)
1986 151054 : j = 4;
1987 212062 : else if (n < 101)
1988 190274 : j = 3;
1989 21788 : else if (n < 1001)
1990 5374 : j = 2;
1991 16414 : else if (n < 17886697) /* smallest such that smallest suitable q is > 2^32 */
1992 16303 : j = 1;
1993 : else
1994 275 : j = 0;
1995 534883 : for (; j > 0; j--)
1996 : {
1997 530660 : if (!(q = u_forprime_next(&T))) break;
1998 : /* q a prime = 1 mod n */
1999 530999 : residue = umodiu(x, q);
2000 530983 : if (residue == 0)
2001 : {
2002 483 : if (Z_lval(x,q) % n) return gc_ulong(av,0);
2003 49 : continue;
2004 : }
2005 : /* n-th power mod q ? */
2006 530500 : if (Fl_powu(residue, (q-1)/n, q) != 1) return gc_ulong(av,0);
2007 : }
2008 4223 : set_avma(av);
2009 :
2010 4193 : if (DEBUGLEVEL>4) err_printf("\nOddPwrs: [%lu] passed modular checks\n",n);
2011 : /* go to the horse's mouth... */
2012 4193 : y = roundr( sqrtnr(itor(x, nbits2prec(expi(x)/n + 16)), n) );
2013 4193 : if (!equalii(powiu(y, n), x)) {
2014 3244 : if (DEBUGLEVEL>4) err_printf("\tBut it wasn't a pure power.\n");
2015 3244 : return gc_ulong(av,0);
2016 : }
2017 949 : if (!pt) set_avma(av); else { set_avma((pari_sp)y); *pt = gc_INT(av,y); }
2018 949 : return 1;
2019 : }
2020 :
2021 : /* is x a p^i-th power, p >= 11 prime ? Similar to is_357_power(), but instead
2022 : * of the mask, we keep the current test exponent around. Cut off when
2023 : * log_2 x^(1/k) < cutoffbits since we would have found it by trial division.
2024 : * Everything needed here (primitive roots etc.) is computed from scratch on
2025 : * the fly; compared to the size of numbers under consideration, these
2026 : * word-sized computations take negligible time.
2027 : * Any cutoffbits > 0 is safe, but direct root extraction attempts are faster
2028 : * when trial division has been used to discover very small bases. We become
2029 : * competitive at cutoffbits ~ 10 */
2030 : int
2031 68545 : is_pth_power(GEN x, GEN *pt, forprime_t *T, ulong cutoffbits)
2032 : {
2033 68545 : long cnt=0, size = expi(x) /* not +1 */;
2034 : ulong p;
2035 68545 : pari_sp av = avma;
2036 494351 : while ((p = u_forprime_next(T)) && size/p >= cutoffbits) {
2037 425813 : long v = 1;
2038 425813 : if (DEBUGLEVEL>5 && cnt++==2000)
2039 0 : { cnt=0; err_printf("%lu%% ", 100*p*cutoffbits/size); }
2040 425867 : while (is_kth_power(x, p, pt)) {
2041 56 : v *= p; x = *pt;
2042 56 : size = expi(x);
2043 : }
2044 425848 : if (v > 1)
2045 : {
2046 42 : if (DEBUGLEVEL>5) err_printf("\nOddPwrs: is a %ld power\n",v);
2047 42 : return v;
2048 : }
2049 : }
2050 68482 : if (DEBUGLEVEL>5) err_printf("\nOddPwrs: not a power\n",p);
2051 68482 : return gc_int(av,0); /* give up */
2052 : }
2053 :
2054 : /***********************************************************************/
2055 : /** FACTORIZATION (master iteration) **/
2056 : /** Driver for the various methods of finding large factors **/
2057 : /** (after trial division has cast out the very small ones). **/
2058 : /** GN1998Jun24--30 **/
2059 : /***********************************************************************/
2060 :
2061 : /* Direct use:
2062 : * ifac_start_hint(n,moebius,hint) registers with the iterative factorizer
2063 : * - an integer n (without prime factors < tridiv_bound(n))
2064 : * - registers whether or not we should terminate early if we find a square
2065 : * factor,
2066 : * - a hint about which method(s) to use.
2067 : * This must always be called first. If input is not composite, oo loop.
2068 : * The routine decomposes n nontrivially into a product of two factors except
2069 : * in squarefreeness ('Moebius') mode.
2070 : *
2071 : * ifac_start(n,moebius) same using default hint.
2072 : *
2073 : * ifac_primary_factor() returns a prime divisor (not necessarily the
2074 : * smallest) and the corresponding exponent.
2075 : *
2076 : * Encapsulated user interface: Many arithmetic functions have a 'contributor'
2077 : * ifac_xxx, to be called on any large composite cofactor left over after trial
2078 : * division by small primes: xxx is one of moebius, issquarefree, totient, etc.
2079 : *
2080 : * We never test whether the input number is prime or composite, since
2081 : * presumably it will have come out of the small factors finder stage
2082 : * (which doesn't really exist yet but which will test the left-over
2083 : * cofactor for primality once it does). */
2084 :
2085 : /* The data structure in which we preserve whatever we know about our number N
2086 : * is kept on the PARI stack, and updated as needed.
2087 : * This makes the machinery re-entrant, and avoids memory leaks when a lengthy
2088 : * factorization is interrupted. We try to keep the whole affair connected,
2089 : * and the parent object is always older than its children. This may in
2090 : * rare cases lead to some extra copying around, and knowing what is garbage
2091 : * at any given time is not trivial. See below for examples how to do it right.
2092 : * (Connectedness is destroyed if callers of ifac_main() create stuff on the
2093 : * stack in between calls. This is harmless as long as ifac_realloc() is used
2094 : * to re-create a connected object at the head of the stack just before
2095 : * collecting garbage.)
2096 : * A t_INT may well have > 10^6 distinct prime factors larger than 2^16. Since
2097 : * we need not find factors in order of increasing size, we must be prepared to
2098 : * drag a very large amount of data around. We start with a small structure
2099 : * and extend it when necessary. */
2100 :
2101 : /* The idea of the algorithm is:
2102 : * Let N0 be whatever is currently left of N after dividing off all the
2103 : * prime powers we have already returned to the caller. Then we maintain
2104 : * N0 as a product
2105 : * (1) N0 = \prod_i P_i^{e_i} * \prod_j Q_j^{f_j} * \prod_k C_k^{g_k}
2106 : * where the P_i and Q_j are distinct primes, each C_k is known composite,
2107 : * none of the P_i divides any C_k, and we also know the total ordering
2108 : * of all the P_i, Q_j and C_k; in particular, we will never try to divide
2109 : * a C_k by a larger Q_j. Some of the C_k may have common factors.
2110 : *
2111 : * Caveat implementor: Taking gcds among C_k's is very likely to cost at
2112 : * least as much time as dividing off any primes as we find them, and book-
2113 : * keeping would be tough (since D=gcd(C_1,C_2) can still have common factors
2114 : * with both C_1/D and C_2/D, and so on...).
2115 : *
2116 : * At startup, we just initialize the structure to
2117 : * (2) N = C_1^1 (composite).
2118 : *
2119 : * Whenever ifac_primary_factor() or one of the arithmetic user interface
2120 : * routines needs a primary factor, and the smallest thing in our list is P_1,
2121 : * we return that and its exponent, and remove it from our list. (When nothing
2122 : * is left, we return a sentinel value -- gen_1. And in Moebius mode, when we
2123 : * see something with exponent > 1, whether prime or composite, we return gen_0
2124 : * or 0, depending on the function). In all other cases, ifac_main() iterates
2125 : * the following steps until we have a P_1 in the smallest position.
2126 : *
2127 : * When the smallest item is C_1, as it is initially:
2128 : * (3.1) Crack C_1 into a nontrivial product U_1 * U_2 by whatever method
2129 : * comes to mind for this size. (U for 'unknown'.) Cracking will detect
2130 : * perfect powers, so we may instead see a power of some U_1 here, or even
2131 : * something of the form U_1^k*U_2^k; of course the exponent already attached
2132 : * to C_1 is taken into account in the following.
2133 : * (3.2) If we have U_1*U_2, sort the two factors (distinct: squares are caught
2134 : * in stage 3.1). N.B. U_1 and U_2 are smaller than anything else in our list.
2135 : * (3.3) Check U_1 and U_2 for primality, and flag them accordingly.
2136 : * (3.4) Iterate.
2137 : *
2138 : * When the smallest item is Q_1:
2139 : * This is the unpleasant case. We go through the entire list and try to
2140 : * divide Q_1 off each of the current C_k's, which usually fails, but may
2141 : * succeed several times. When a division was successful, the corresponding
2142 : * C_k is removed from our list, and the cofactor becomes a U_l for the moment
2143 : * unless it is 1 (which happens when C_k was a power of Q_1). When we're
2144 : * through we upgrade Q_1 to P_1 status, then do a primality check on each U_l
2145 : * and sort it back into the list either as a Q_j or as a C_k. If during the
2146 : * insertion sort we discover that some U_l equals some P_i or Q_j or C_k we
2147 : * already have, we just add U_l's exponent to that of its twin. (The sorting
2148 : * therefore happens before the primality test). Since this may produce one or
2149 : * more elements smaller than the P_1 we just confirmed, we may have to repeat
2150 : * the iteration.
2151 : * A trick avoids some Q_1 instances: just after the sweep classifying
2152 : * all current unknowns as either composites or primes, we do another downward
2153 : * sweep beginning with the largest current factor and stopping just above the
2154 : * largest current composite. Every Q_j we pass is turned into a P_i.
2155 : * (Different primes are automatically coprime among each other, and primes do
2156 : * not divide smaller composites.)
2157 : * NB: We have no use for comparing the square of a prime to N0. Normally
2158 : * we will get called after casting out only the smallest primes, and
2159 : * since we cannot guarantee that we see the large prime factors in as-
2160 : * cending order, we cannot stop when we find one larger than sqrt(N0). */
2161 :
2162 : /* Data structure: We keep everything in a single t_VEC of t_INTs. The
2163 : * first 2 components are read-only:
2164 : * 1) the first records whether we're doing full (NULL) or Moebius (gen_1)
2165 : * factorization; in the latter case subroutines return a sentinel value as
2166 : * soon as they spot an exponent > 1.
2167 : * 2) the second records the hint from factorint()'s optional flag, for use by
2168 : * ifac_crack().
2169 : *
2170 : * The remaining components (initially 15) are used in groups of three:
2171 : * [ factor (t_INT), exponent (t_INT), factor class ], where factor class is
2172 : * NULL : unknown
2173 : * gen_0: known composite C_k
2174 : * gen_1: known prime Q_j awaiting trial division
2175 : * gen_2: finished prime P_i.
2176 : * When during the division stage we re-sort a C_k-turned-U_l to a lower
2177 : * position, we rotate any intervening material upward towards its old
2178 : * slot. When a C_k was divided down to 1, its slot is left empty at
2179 : * first; similarly when the re-sorting detects a repeated factor.
2180 : * After the sorting phase, we de-fragment the list and squeeze all the
2181 : * occupied slots together to the high end, so that ifac_crack() has room
2182 : * for new factors. When this doesn't suffice, we abandon the current vector
2183 : * and allocate a somewhat larger one, defragmenting again while copying.
2184 : *
2185 : * For internal use: note that all exponents will fit into C longs, given
2186 : * PARI's lgefint field size. When we work with them, we sometimes read
2187 : * out the GEN pointer, and sometimes do an itos, whatever is more con-
2188 : * venient for the task at hand. */
2189 :
2190 : /*** Overview ***/
2191 :
2192 : /* The '*where' argument in the following points into *partial at the first of
2193 : * the three fields of the first occupied slot. It's there because the caller
2194 : * would already know where 'here' is, so we don't want to search for it again.
2195 : * We do not preserve this from one user-interface call to the next. */
2196 :
2197 : /* In the most cases, control flows from the user interface to ifac_main() and
2198 : * then to a succession of ifac_crack()s and ifac_divide()s, with (typically)
2199 : * none of the latter finding anything. */
2200 :
2201 : #define LAST(x) x+lg(x)-3
2202 : #define FIRST(x) x+3
2203 :
2204 : #define MOEBIUS(x) gel(x,1)
2205 : #define HINT(x) gel(x,2)
2206 :
2207 : /* y <- x */
2208 : INLINE void
2209 0 : SHALLOWCOPY(GEN x, GEN y) {
2210 0 : VALUE(y) = VALUE(x);
2211 0 : EXPON(y) = EXPON(x);
2212 0 : CLASS(y) = CLASS(x);
2213 0 : }
2214 : /* y <- x */
2215 : INLINE void
2216 0 : COPY(GEN x, GEN y) {
2217 0 : icopyifstack(VALUE(x), VALUE(y));
2218 0 : icopyifstack(EXPON(x), EXPON(y));
2219 0 : CLASS(y) = CLASS(x);
2220 0 : }
2221 :
2222 : /* Diagnostics */
2223 : static void
2224 0 : ifac_factor_dbg(GEN x)
2225 : {
2226 0 : GEN c = CLASS(x), v = VALUE(x);
2227 0 : if (c == gen_2) err_printf("IFAC: factor %Ps\n\tis prime (finished)\n", v);
2228 0 : else if (c == gen_1) err_printf("IFAC: factor %Ps\n\tis prime\n", v);
2229 0 : else if (c == gen_0) err_printf("IFAC: factor %Ps\n\tis composite\n", v);
2230 0 : }
2231 : static void
2232 0 : ifac_check(GEN partial, GEN where)
2233 : {
2234 0 : if (!where || where < FIRST(partial) || where > LAST(partial))
2235 0 : pari_err_BUG("ifac_check ['where' out of bounds]");
2236 0 : }
2237 : static void
2238 0 : ifac_print(GEN part, GEN where)
2239 : {
2240 0 : long l = lg(part);
2241 : GEN p;
2242 :
2243 0 : err_printf("ifac partial factorization structure: %ld slots, ", (l-3)/3);
2244 0 : if (MOEBIUS(part)) err_printf("Moebius mode, ");
2245 0 : err_printf("hint = %ld\n", itos(HINT(part)));
2246 0 : ifac_check(part, where);
2247 0 : for (p = part+3; p < part + l; p += 3)
2248 : {
2249 0 : GEN v = VALUE(p), e = EXPON(p), c = CLASS(p);
2250 0 : const char *s = "";
2251 0 : if (!v) { err_printf("[empty slot]\n"); continue; }
2252 0 : if (c == NULL) s = "unknown";
2253 0 : else if (c == gen_0) s = "composite";
2254 0 : else if (c == gen_1) s = "unfinished prime";
2255 0 : else if (c == gen_2) s = "prime";
2256 0 : else pari_err_BUG("unknown factor class");
2257 0 : err_printf("[%Ps, %Ps, %s]\n", v, e, s);
2258 : }
2259 0 : err_printf("Done.\n");
2260 0 : }
2261 :
2262 : static const long decomp_default_hint = 0;
2263 : /* assume n > 0, which we can assign to */
2264 : /* return initial data structure, see ifac_crack() for the hint argument */
2265 : static GEN
2266 5899 : ifac_start_hint(GEN n, int moebius, long hint)
2267 : {
2268 5899 : const long ifac_initial_length = 3 + 7*3;
2269 : /* codeword, moebius, hint, 7 slots -- a 512-bit product of distinct 8-bit
2270 : * primes needs at most 7 slots at a time) */
2271 5899 : GEN here, part = cgetg(ifac_initial_length, t_VEC);
2272 :
2273 5899 : MOEBIUS(part) = moebius? gen_1 : NULL;
2274 5899 : HINT(part) = stoi(hint);
2275 : /* fill first slot at the top end */
2276 5899 : here = part + ifac_initial_length - 3; /* LAST(part) */
2277 5899 : INIT(here, n,gen_1,gen_0); /* n^1: composite */
2278 41293 : while ((here -= 3) > part) ifac_delete(here);
2279 5899 : return part;
2280 : }
2281 : GEN
2282 2523 : ifac_start(GEN n, int moebius)
2283 2523 : { return ifac_start_hint(n,moebius,decomp_default_hint); }
2284 :
2285 : /* Return next nonempty slot after 'here', NULL if none exist */
2286 : static GEN
2287 15115 : ifac_find(GEN partial)
2288 : {
2289 15115 : GEN scan, end = partial + lg(partial);
2290 :
2291 : #ifdef IFAC_DEBUG
2292 : ifac_check(partial, partial);
2293 : #endif
2294 110204 : for (scan = partial+3; scan < end; scan += 3)
2295 105535 : if (VALUE(scan)) return scan;
2296 4669 : return NULL;
2297 : }
2298 :
2299 : /* Defragment: squeeze out unoccupied slots above *where. Unoccupied slots
2300 : * arise when a composite factor dissolves completely whilst dividing off a
2301 : * prime, or when ifac_resort() spots a coincidence and merges two factors.
2302 : * Update *where */
2303 : static void
2304 14 : ifac_defrag(GEN *partial, GEN *where)
2305 : {
2306 14 : GEN scan_new = LAST(*partial), scan_old;
2307 :
2308 42 : for (scan_old = scan_new; scan_old >= *where; scan_old -= 3)
2309 : {
2310 28 : if (!VALUE(scan_old)) continue; /* empty slot */
2311 28 : if (scan_old < scan_new) SHALLOWCOPY(scan_old, scan_new);
2312 28 : scan_new -= 3; /* point at next slot to be written */
2313 : }
2314 14 : scan_new += 3; /* back up to last slot written */
2315 14 : *where = scan_new;
2316 84 : while ((scan_new -= 3) > *partial) ifac_delete(scan_new); /* erase junk */
2317 14 : }
2318 :
2319 : /* Move to a larger main vector, updating *where if it points into it, and
2320 : * *partial in any case. Can be used as a specialized gcopy before
2321 : * a gc_upto() (pass 0 as the new length). Normally, one would pass
2322 : * new_lg=1 to let this function guess the new size. To be used sparingly.
2323 : * Complex version of ifac_defrag(), combined with reallocation. If new_lg
2324 : * is 0, use the old length, so this acts just like gcopy except that the
2325 : * 'where' pointer is carried along; if it is 1, we make an educated guess.
2326 : * Exception: If new_lg is 0, the vector is full to the brim, and the first
2327 : * entry is composite, we make it longer to avoid being called again a
2328 : * microsecond later. It is safe to call this with *where = NULL:
2329 : * if it doesn't point anywhere within the old structure, it is left alone */
2330 : static void
2331 0 : ifac_realloc(GEN *partial, GEN *where, long new_lg)
2332 : {
2333 0 : long old_lg = lg(*partial);
2334 : GEN newpart, scan_new, scan_old;
2335 :
2336 0 : if (new_lg == 1)
2337 0 : new_lg = 2*old_lg - 6; /* from 7 slots to 13 to 25... */
2338 0 : else if (new_lg <= old_lg) /* includes case new_lg == 0 */
2339 : {
2340 0 : GEN first = *partial + 3;
2341 0 : new_lg = old_lg;
2342 : /* structure full and first entry composite or unknown */
2343 0 : if (VALUE(first) && (CLASS(first) == gen_0 || CLASS(first)==NULL))
2344 0 : new_lg += 6; /* give it a little more breathing space */
2345 : }
2346 0 : newpart = cgetg(new_lg, t_VEC);
2347 0 : if (DEBUGMEM >= 3)
2348 0 : err_printf("IFAC: new partial factorization structure (%ld slots)\n",
2349 0 : (new_lg - 3)/3);
2350 0 : MOEBIUS(newpart) = MOEBIUS(*partial);
2351 0 : icopyifstack(HINT(*partial), HINT(newpart));
2352 : /* Downward sweep through the old *partial. Pick up 'where' and carry it
2353 : * over if we pass it. (Only useful if it pointed at a nonempty slot.)
2354 : * Factors are COPY'd so that we again have a nice object (parent older
2355 : * than children, connected), except the one factor that may still be living
2356 : * in a clone where n originally was; exponents are similarly copied if they
2357 : * aren't global constants; class-of-factor fields are global constants so we
2358 : * need only copy them as pointers. Caller may then do a gc_upto() */
2359 0 : scan_new = newpart + new_lg - 3; /* LAST(newpart) */
2360 0 : scan_old = *partial + old_lg - 3; /* LAST(*partial) */
2361 0 : for (; scan_old > *partial + 2; scan_old -= 3)
2362 : {
2363 0 : if (*where == scan_old) *where = scan_new;
2364 0 : if (!VALUE(scan_old)) continue; /* skip empty slots */
2365 0 : COPY(scan_old, scan_new); scan_new -= 3;
2366 : }
2367 0 : scan_new += 3; /* back up to last slot written */
2368 0 : while ((scan_new -= 3) > newpart) ifac_delete(scan_new);
2369 0 : *partial = newpart;
2370 0 : }
2371 :
2372 : /* Re-sort one (typically unknown) entry from washere to a new position,
2373 : * rotating intervening entries upward to fill the vacant space. If the new
2374 : * position is the same as the old one, or the new value of the entry coincides
2375 : * with a value already occupying a lower slot, then we just add exponents (and
2376 : * use the 'more known' class, and return 1 immediately when in Moebius mode).
2377 : * Slots between *where and washere must be in sorted order, so a sweep using
2378 : * this to re-sort several unknowns must proceed upward, see ifac_resort().
2379 : * Bubble-sort-of-thing sort. Won't be exercised frequently, so this is ok */
2380 : static void
2381 7 : ifac_sort_one(GEN *where, GEN washere)
2382 : {
2383 7 : GEN old, scan = washere - 3;
2384 : GEN value, exponent, class0, class1;
2385 : long cmp_res;
2386 :
2387 7 : if (scan < *where) return; /* nothing to do, washere==*where */
2388 7 : value = VALUE(washere);
2389 7 : exponent = EXPON(washere);
2390 7 : class0 = CLASS(washere);
2391 7 : cmp_res = -1; /* sentinel */
2392 7 : while (scan >= *where) /* at least once */
2393 : {
2394 7 : if (VALUE(scan))
2395 : { /* current slot nonempty, check against where */
2396 7 : cmp_res = cmpii(value, VALUE(scan));
2397 7 : if (cmp_res >= 0) break; /* have found where to stop */
2398 : }
2399 : /* copy current slot upward by one position and move pointers down */
2400 0 : SHALLOWCOPY(scan, scan+3);
2401 0 : scan -= 3;
2402 : }
2403 7 : scan += 3;
2404 : /* At this point there are the following possibilities:
2405 : * 1) cmp_res == -1. Either value is less than that at *where, or *where was
2406 : * pointing at vacant slots and any factors we saw en route were larger than
2407 : * value. At any rate, scan == *where now, and scan is pointing at an empty
2408 : * slot, into which we'll stash our entry.
2409 : * 2) cmp_res == 0. The entry at scan-3 is the one, we compare class0
2410 : * fields and add exponents, and put it all into the vacated scan slot,
2411 : * NULLing the one at scan-3 (and possibly updating *where).
2412 : * 3) cmp_res == 1. The slot at scan is the one to store our entry into. */
2413 7 : if (cmp_res)
2414 : {
2415 7 : if (cmp_res < 0 && scan != *where)
2416 0 : pari_err_BUG("ifact_sort_one [misaligned partial]");
2417 7 : INIT(scan, value, exponent, class0); return;
2418 : }
2419 : /* case cmp_res == 0: repeated factor detected */
2420 0 : if (DEBUGLEVEL >= 4)
2421 0 : err_printf("IFAC: repeated factor %Ps\n\tin ifac_sort_one\n", value);
2422 0 : old = scan - 3;
2423 : /* if old class0 was composite and new is prime, or vice versa, complain
2424 : * (and if one class0 was unknown and the other wasn't, use the known one) */
2425 0 : class1 = CLASS(old);
2426 0 : if (class0) /* should never be used */
2427 : {
2428 0 : if (class1)
2429 : {
2430 0 : if (class0 == gen_0 && class1 != gen_0)
2431 0 : pari_err_BUG("ifac_sort_one (composite = prime)");
2432 0 : else if (class0 != gen_0 && class1 == gen_0)
2433 0 : pari_err_BUG("ifac_sort_one (prime = composite)");
2434 0 : else if (class0 == gen_2)
2435 0 : CLASS(scan) = class0;
2436 : }
2437 : else
2438 0 : CLASS(scan) = class0;
2439 : }
2440 : /* else stay with the existing known class0 */
2441 0 : CLASS(scan) = class1;
2442 : /* in any case, add exponents */
2443 0 : if (EXPON(old) == gen_1 && exponent == gen_1)
2444 0 : EXPON(scan) = gen_2;
2445 : else
2446 0 : EXPON(scan) = addii(EXPON(old), exponent);
2447 : /* move the value over and null out the vacated slot below */
2448 0 : old = scan - 3;
2449 0 : *scan = *old;
2450 0 : ifac_delete(old);
2451 : /* finally, see whether *where should be pulled in */
2452 0 : if (old == *where) *where += 3;
2453 : }
2454 :
2455 : /* Sort all current unknowns downward to where they belong. Sweeps in the
2456 : * upward direction. Not needed after ifac_crack(), only when ifac_divide()
2457 : * returned true. Update *where. */
2458 : static void
2459 7 : ifac_resort(GEN *partial, GEN *where)
2460 : {
2461 : GEN scan, end;
2462 7 : ifac_defrag(partial, where); end = LAST(*partial);
2463 21 : for (scan = *where; scan <= end; scan += 3)
2464 14 : if (VALUE(scan) && !CLASS(scan)) ifac_sort_one(where, scan); /*unknown*/
2465 7 : ifac_defrag(partial, where); /* remove newly created gaps */
2466 7 : }
2467 :
2468 : /* Let x be a t_INT known not to have small divisors (< 661, and < 2^14 for huge
2469 : * x > 2^512). Return 0 if x is a proven composite. Return 1 if we believe it
2470 : * to be prime (fully proven prime if factor_proven is set). */
2471 : int
2472 27940 : ifac_isprime(GEN x)
2473 : {
2474 27940 : if (!BPSW_psp_nosmalldiv(x)) return 0; /* composite */
2475 19622 : if (factor_proven && ! BPSW_isprime(x))
2476 : {
2477 0 : pari_warn(warner,
2478 : "IFAC: pseudo-prime %Ps\n\tis not prime. PLEASE REPORT!\n", x);
2479 0 : return 0;
2480 : }
2481 19622 : return 1;
2482 : }
2483 :
2484 : static int
2485 11183 : ifac_checkprime(GEN x)
2486 : {
2487 11183 : int res = ifac_isprime(VALUE(x));
2488 11183 : CLASS(x) = res? gen_1: gen_0;
2489 11183 : if (DEBUGLEVEL>2) ifac_factor_dbg(x);
2490 11183 : return res;
2491 : }
2492 :
2493 : /* Determine primality or compositeness of all current unknowns, and set
2494 : * class Q primes to finished (class P) if everything larger is already
2495 : * known to be prime. When after_crack >= 0, only look at the
2496 : * first after_crack things in the list (do nothing when it's 0) */
2497 : static void
2498 5753 : ifac_whoiswho(GEN *partial, GEN *where, long after_crack)
2499 : {
2500 5753 : GEN scan, scan_end = LAST(*partial);
2501 :
2502 : #ifdef IFAC_DEBUG
2503 : ifac_check(*partial, *where);
2504 : #endif
2505 5753 : if (after_crack == 0) return;
2506 5112 : if (after_crack > 0) /* check at most after_crack entries */
2507 5105 : scan = *where + 3*(after_crack - 1); /* assert(scan <= scan_end) */
2508 : else
2509 7 : for (scan = scan_end; scan >= *where; scan -= 3)
2510 : {
2511 7 : if (CLASS(scan))
2512 : { /* known class of factor */
2513 0 : if (CLASS(scan) == gen_0) break;
2514 0 : if (CLASS(scan) == gen_1)
2515 : {
2516 0 : if (DEBUGLEVEL>=3)
2517 : {
2518 0 : err_printf("IFAC: factor %Ps\n\tis prime (no larger composite)\n",
2519 0 : VALUE(*where));
2520 0 : err_printf("IFAC: prime %Ps\n\tappears with exponent = %ld\n",
2521 0 : VALUE(*where), itos(EXPON(*where)));
2522 : }
2523 0 : CLASS(scan) = gen_2;
2524 : }
2525 0 : continue;
2526 : }
2527 7 : if (!ifac_checkprime(scan)) break; /* must disable Q-to-P */
2528 0 : CLASS(scan) = gen_2; /* P_i, finished prime */
2529 0 : if (DEBUGLEVEL>2) ifac_factor_dbg(scan);
2530 : }
2531 : /* go on, Q-to-P trick now disabled */
2532 15612 : for (; scan >= *where; scan -= 3)
2533 : {
2534 10500 : if (CLASS(scan)) continue;
2535 10465 : (void)ifac_checkprime(scan); /* Qj | Ck */
2536 : }
2537 : }
2538 :
2539 : /* if y | x, set x /= y and return 1; else return 0 */
2540 : static int
2541 219 : dvdii_inplace(GEN x, GEN y)
2542 : {
2543 219 : pari_sp av = avma;
2544 219 : GEN r, q = dvmdii(x, y, &r);
2545 219 : if (r != gen_0) return gc_bool(av, 0);
2546 14 : affii(q, x); return gc_bool(av, 1);
2547 : }
2548 : /* return v = v_p(x), set x /= p^v in place */
2549 : static long
2550 765 : Z_pval_inplace(GEN x, GEN p)
2551 : {
2552 765 : pari_sp av = avma;
2553 765 : GEN r, q = dvmdii(x, p, &r);
2554 : long v;
2555 765 : if (r != gen_0) return gc_long(av, 0);
2556 231 : for (v = 1;; v++)
2557 98 : {
2558 329 : GEN Q = dvmdii(q, p, &r);
2559 329 : if (r != gen_0) break;
2560 98 : q = Q;
2561 : }
2562 231 : affii(q, x); return gc_long(av, v);
2563 : }
2564 :
2565 : /* Divide all current composites by first (prime, class Q) entry, updating its
2566 : * exponent, and turning it into a finished prime (class P). Return 1 if any
2567 : * such divisions succeeded (in Moebius mode, the update may then not have
2568 : * been completed), or 0 if none of them succeeded. Doesn't modify *where.
2569 : * Here we normally do not check that the first entry is a not-finished
2570 : * prime. Stack management: we may allocate a new exponent */
2571 : static long
2572 9724 : ifac_divide(GEN *partial, GEN *where, long moebius_mode)
2573 : {
2574 9724 : GEN scan, scan_end = LAST(*partial);
2575 9724 : long res = 0, exponent, newexp, otherexp;
2576 :
2577 : #ifdef IFAC_DEBUG
2578 : ifac_check(*partial, *where);
2579 : if (CLASS(*where) != gen_1)
2580 : pari_err_BUG("ifac_divide [division by composite or finished prime]");
2581 : if (!VALUE(*where)) pari_err_BUG("ifac_divide [division by nothing]");
2582 : #endif
2583 9724 : newexp = exponent = itos(EXPON(*where));
2584 9724 : if (exponent > 1 && moebius_mode) return 1;
2585 : /* should've been caught by caller */
2586 :
2587 15375 : for (scan = *where+3; scan <= scan_end; scan += 3)
2588 : {
2589 5651 : if (CLASS(scan) != gen_0) continue; /* the other thing ain't composite */
2590 205 : otherexp = 0;
2591 219 : while (dvdii_inplace(VALUE(scan), VALUE(*where)))
2592 : {
2593 14 : if (moebius_mode) return 1; /* immediately */
2594 14 : if (!otherexp) otherexp = itos(EXPON(scan));
2595 14 : newexp += otherexp;
2596 : }
2597 205 : if (newexp > exponent) /* did anything happen? */
2598 : {
2599 7 : EXPON(*where) = (newexp == 2 ? gen_2 : utoipos(newexp));
2600 7 : exponent = newexp;
2601 7 : if (is_pm1((GEN)*scan)) /* factor dissolved completely */
2602 : {
2603 0 : ifac_delete(scan);
2604 0 : if (DEBUGLEVEL >= 4)
2605 0 : err_printf("IFAC: a factor was a power of another prime factor\n");
2606 : } else {
2607 7 : CLASS(scan) = NULL; /* at any rate it's Unknown now */
2608 7 : if (DEBUGLEVEL >= 4)
2609 0 : err_printf("IFAC: a factor was divisible by another prime factor,\n"
2610 : "\tleaving a cofactor = %Ps\n", VALUE(scan));
2611 : }
2612 7 : res = 1;
2613 7 : if (DEBUGLEVEL >= 5)
2614 0 : err_printf("IFAC: prime %Ps\n\tappears at least to the power %ld\n",
2615 0 : VALUE(*where), newexp);
2616 : }
2617 : } /* for */
2618 9724 : CLASS(*where) = gen_2; /* make it a finished prime */
2619 9724 : if (DEBUGLEVEL >= 3)
2620 0 : err_printf("IFAC: prime %Ps\n\tappears with exponent = %ld\n",
2621 0 : VALUE(*where), newexp);
2622 9724 : return res;
2623 : }
2624 :
2625 : /* found out our integer was factor^exp. Update */
2626 : static void
2627 887 : update_pow(GEN where, GEN factor, long exp, pari_sp *av)
2628 : {
2629 887 : GEN ex = EXPON(where);
2630 887 : if (DEBUGLEVEL>3)
2631 0 : err_printf("IFAC: found %Ps =\n\t%Ps ^%ld\n", *where, factor, exp);
2632 887 : affii(factor, VALUE(where)); set_avma(*av);
2633 887 : if (ex == gen_1)
2634 698 : { EXPON(where) = exp == 2? gen_2: utoipos(exp); *av = avma; }
2635 189 : else if (ex == gen_2)
2636 175 : { EXPON(where) = utoipos(exp<<1); *av = avma; }
2637 : else
2638 14 : affsi(exp * itos(ex), EXPON(where));
2639 887 : }
2640 : /* hint = 0 : Use a default strategy
2641 : * hint & 1 : avoid MPQS
2642 : * hint & 2 : avoid first-stage ECM (may fall back to ECM if MPQS gives up)
2643 : * hint & 4 : avoid Pollard and SQUFOF stages.
2644 : * hint & 8 : avoid final ECM; may flag a composite as prime. */
2645 : #define get_hint(partial) (itos(HINT(*partial)) & 15)
2646 :
2647 : /* Complete ifac_crack's job when a factoring engine splits the current factor
2648 : * into a product of three or more new factors. Makes room for them if
2649 : * necessary, sorts them, gives them the right exponents and class. Returns the
2650 : * number of factors actually written, which may be less than #facvec if there
2651 : * are duplicates. Vectors of factors (cf pollardbrent() or mpqs()) contain
2652 : * 'slots' of 3 GENs per factor, interpreted as in our partial factorization
2653 : * data structure. Thus engines can tell us what they already know about
2654 : * factors being prime/composite or appearing to a power larger than thefirst.
2655 : * Don't collect garbage. No diagnostics: engine has printed what it found.
2656 : * facvec contains slots of three components per factor; repeated factors are
2657 : * allowed (their classes shouldn't contradict each other whereas their
2658 : * exponents will be added up) */
2659 : static long
2660 3279 : ifac_insert_multiplet(GEN *partial, GEN *where, GEN facvec, long moebius_mode)
2661 : {
2662 3279 : long j,k=1, lfv=lg(facvec)-1, nf=lfv/3, room=(long)(*where-*partial);
2663 : /* one of the factors will go into the *where slot, so room is now 3 times
2664 : * the number of slots we can use */
2665 3279 : long needroom = lfv - room;
2666 3279 : GEN newexp, cur, sorted, auxvec = cgetg(nf+1, t_VEC), factor;
2667 3279 : long E = itos(EXPON(*where)); /* the old exponent */
2668 :
2669 3279 : if (DEBUGLEVEL >= 5) /* squfof may return a single squared factor as a set */
2670 0 : err_printf("IFAC: incorporating set of %ld factor(s)\n", nf);
2671 3279 : if (needroom > 0) ifac_realloc(partial, where, lg(*partial) + needroom);
2672 :
2673 : /* create sort permutation from the values of the factors */
2674 10120 : for (j=nf; j; j--) gel(auxvec,j) = gel(facvec,3*j-2);
2675 3279 : sorted = ZV_indexsort(auxvec);
2676 : /* store factors, beginning at *where, and catching any duplicates */
2677 3279 : cur = facvec + 3*sorted[nf]-2; /* adjust for triple spacing */
2678 3279 : VALUE(*where) = VALUE(cur);
2679 3279 : newexp = EXPON(cur);
2680 : /* if new exponent is 1, the old exponent already in place will do */
2681 3279 : if (newexp != gen_1) EXPON(*where) = mului(E,newexp);
2682 3279 : CLASS(*where) = CLASS(cur);
2683 3279 : if (DEBUGLEVEL >= 6) err_printf("\tstored (largest) factor no. %ld...\n", nf);
2684 :
2685 6841 : for (j=nf-1; j; j--)
2686 : {
2687 : GEN e;
2688 3562 : cur = facvec + 3*sorted[j]-2;
2689 3562 : factor = VALUE(cur);
2690 3562 : if (equalii(factor, VALUE(*where)))
2691 : {
2692 0 : if (DEBUGLEVEL >= 6)
2693 0 : err_printf("\tfactor no. %ld is a duplicate%s\n", j, (j>1? "...": ""));
2694 : /* update exponent, ignore class which would already have been set,
2695 : * then forget current factor */
2696 0 : newexp = EXPON(cur);
2697 0 : if (newexp != gen_1) /* new exp > 1 */
2698 0 : e = addiu(EXPON(*where), E * itou(newexp));
2699 0 : else if (EXPON(*where) == gen_1 && E == 1)
2700 0 : e = gen_2;
2701 : else
2702 0 : e = addiu(EXPON(*where), E);
2703 0 : EXPON(*where) = e;
2704 :
2705 0 : if (moebius_mode) return 0; /* stop now, with exponent updated */
2706 0 : continue;
2707 : }
2708 :
2709 3562 : *where -= 3;
2710 3562 : CLASS(*where) = CLASS(cur); /* class as given */
2711 3562 : newexp = EXPON(cur);
2712 3562 : if (newexp != gen_1) /* new exp > 1 */
2713 99 : e = (E == 1 && newexp == gen_2)? gen_2: mului(E, newexp);
2714 : else /* inherit parent's exponent */
2715 3463 : e = (E == 1 ? gen_1 : (E == 2 ? gen_2 : utoipos(E)));
2716 3562 : EXPON(*where) = e;
2717 : /* keep components younger than *partial */
2718 3562 : icopyifstack(factor, VALUE(*where));
2719 3562 : k++;
2720 3562 : if (DEBUGLEVEL >= 6)
2721 0 : err_printf("\tfactor no. %ld was unique%s\n", j, j>1? " (so far)...": "");
2722 : }
2723 3279 : return k;
2724 : }
2725 :
2726 : /* x /= y; exact division */
2727 : static void
2728 1820 : diviiexact_inplace(GEN x, GEN y)
2729 1820 : { pari_sp av = avma; affii(diviiexact(x, y), x); set_avma(av); }
2730 :
2731 : /* Split the first (composite) entry. There must already be room for another
2732 : * factor below *where, and *where is updated. Two cases:
2733 : * - entry is a pure power: factor^k is inserted, leaving *where unchanged;
2734 : * - entry = factor * cofactor (not necessarily coprime): both factors are
2735 : * inserted in the correct order, updating *where
2736 : * The inserted factors class is set to unknown, they inherit the exponent
2737 : * (or a multiple thereof) of their ancestor.
2738 : *
2739 : * Returns number of factors written into the structure, usually 2; only 1
2740 : * if pure power, and > 2 if a factoring engine returned a vector of factors.
2741 : * Can reallocate the data structure in the rare > 2 case; may create one or
2742 : * more objects: new factors or exponents > 2 */
2743 : static long
2744 5748 : ifac_crack(GEN *partial, GEN *where, long moebius_mode)
2745 : {
2746 5748 : long hint = get_hint(partial);
2747 : GEN cofactor, factor, exponent;
2748 :
2749 : #ifdef IFAC_DEBUG
2750 : ifac_check(*partial, *where);
2751 : if (*where < *partial + 6)
2752 : pari_err_BUG("ifac_crack ['*where' out of bounds]");
2753 : if (!(VALUE(*where)) || typ(VALUE(*where)) != t_INT)
2754 : pari_err_BUG("ifac_crack [incorrect VALUE(*where)]");
2755 : if (CLASS(*where) != gen_0)
2756 : pari_err_BUG("ifac_crack [operand not known composite]");
2757 : #endif
2758 :
2759 5748 : if (DEBUGLEVEL>2) {
2760 0 : err_printf("IFAC: cracking composite\n\t%Ps\n", **where);
2761 0 : if (DEBUGLEVEL>3) err_printf("IFAC: checking for pure square\n");
2762 : }
2763 : /* MPQS cannot factor prime powers. Look for pure powers even if MPQS is
2764 : * blocked by hint: fast and useful in bounded factorization */
2765 : {
2766 : forprime_t T;
2767 5748 : ulong exp = 1, mask = 7;
2768 5748 : long good = 0;
2769 5748 : pari_sp av = avma;
2770 5748 : (void)u_forprime_init(&T, 11, ULONG_MAX);
2771 : /* crack squares */
2772 6585 : while (Z_issquareall(VALUE(*where), &factor))
2773 : {
2774 838 : good = 1; /* remember we succeeded once */
2775 838 : update_pow(*where, factor, 2, &av);
2776 1479 : if (moebius_mode) return 0; /* no need to carry on */
2777 : }
2778 5796 : while ( (exp = is_357_power(VALUE(*where), &factor, &mask)) )
2779 : {
2780 49 : good = 1; /* remember we succeeded once */
2781 49 : update_pow(*where, factor, exp, &av);
2782 49 : if (moebius_mode) return 0; /* no need to carry on */
2783 : }
2784 : /* cutoff at 14 bits: OK if tridiv_bound >= 2^14 OR if >= 661 for
2785 : * an integer < 701^11 (103 bits). */
2786 5747 : while ( (exp = is_pth_power(VALUE(*where), &factor, &T, 15)) )
2787 : {
2788 0 : good = 1; /* remember we succeeded once */
2789 0 : update_pow(*where, factor, exp, &av);
2790 0 : if (moebius_mode) return 0; /* no need to carry on */
2791 : }
2792 :
2793 5747 : if (good && hint != 15 && ifac_checkprime(*where))
2794 : { /* our composite was a prime power */
2795 641 : if (DEBUGLEVEL>3)
2796 0 : err_printf("IFAC: factor %Ps\n\tis prime\n", VALUE(*where));
2797 641 : return 0; /* bypass subsequent ifac_whoiswho() call */
2798 : }
2799 : } /* pure power stage */
2800 :
2801 5106 : factor = NULL;
2802 5106 : if (!(hint & 4))
2803 : { /* SQUFOF then Rho */
2804 5057 : if (DEBUGLEVEL >= 4)
2805 0 : err_printf("IFAC: trying Shanks' SQUFOF, will fail silently if input\n"
2806 : " is too large for it.\n");
2807 5057 : factor = squfof(VALUE(*where));
2808 5057 : if (!factor)
2809 : {
2810 3489 : if (DEBUGLEVEL >= 4) err_printf("IFAC: trying Pollard-Brent rho\n");
2811 3489 : factor = pollardbrent(VALUE(*where));
2812 : }
2813 : }
2814 5106 : if (!factor && !(hint & 2))
2815 : { /* First ECM stage */
2816 3262 : if (DEBUGLEVEL >= 4) err_printf("IFAC: trying Lenstra-Montgomery ECM\n");
2817 3262 : factor = ellfacteur(VALUE(*where), 0); /* do not insist */
2818 : }
2819 5106 : if (!factor && !(hint & 1))
2820 : { /* MPQS stage */
2821 3286 : if (DEBUGLEVEL >= 4) err_printf("IFAC: trying MPQS\n");
2822 3286 : factor = mpqs(VALUE(*where));
2823 : }
2824 5106 : if (!factor && !(hint & 8))
2825 : { /* Final ECM stage, guaranteed to succeed */
2826 0 : if (DEBUGLEVEL >= 4)
2827 0 : err_printf("IFAC: forcing ECM, may take some time\n");
2828 0 : factor = ellfacteur(VALUE(*where), 1);
2829 : }
2830 5106 : if (!factor)
2831 : { /* limited factorization */
2832 7 : if (DEBUGLEVEL >= 2)
2833 : {
2834 0 : pari_warn(warner, hint==15? "IFAC: untested integer declared prime"
2835 : : "IFAC: unfactored composite declared prime");
2836 : /* don't print it out at level 3 or above, where it would appear
2837 : * several times before and after this message already */
2838 0 : if (DEBUGLEVEL == 2) err_printf("\t%Ps\n", VALUE(*where));
2839 : }
2840 7 : CLASS(*where) = gen_1; /* might as well trial-divide by it... */
2841 7 : return 1;
2842 : }
2843 : /* At least two factors */
2844 5099 : if (typ(factor) == t_VEC)
2845 3279 : return ifac_insert_multiplet(partial, where, factor, moebius_mode);
2846 :
2847 : /* Single factor (t_INT): work out cofactor in place */
2848 1820 : diviiexact_inplace(VALUE(*where), factor);
2849 1820 : cofactor = VALUE(*where);
2850 : /* factoring engines reported factor; tell about the cofactor */
2851 1820 : if (DEBUGLEVEL >= 4) err_printf("IFAC: cofactor = %Ps\n", cofactor);
2852 1820 : CLASS(*where) = NULL; /* mark factor /cofactor 'unknown' */
2853 1820 : exponent = EXPON(*where); /* common exponent */
2854 :
2855 1820 : *where -= 3;
2856 1820 : CLASS(*where) = NULL; /* mark factor /cofactor 'unknown' */
2857 1820 : icopyifstack(exponent, EXPON(*where)); /* copy common exponent */
2858 :
2859 1820 : if (cmpii(factor, cofactor) < 0)
2860 1656 : VALUE(*where) = factor; /* common case */
2861 : else
2862 : { /* factor > cofactor, swap. Exponent is the same, so no need to swap. */
2863 164 : GEN old = *where + 3;
2864 164 : VALUE(*where) = VALUE(old); /* move cofactor pointer to lowest slot */
2865 164 : VALUE(old) = factor; /* save factor */
2866 : }
2867 1820 : return 2;
2868 : }
2869 :
2870 : /* main loop: iterate until smallest entry is a finished prime; returns
2871 : * a 'where' pointer, or NULL if nothing left, or gen_0 in Moebius mode if
2872 : * we aren't squarefree */
2873 : static GEN
2874 14035 : ifac_main(GEN *partial)
2875 : {
2876 14035 : const long moebius_mode = !!MOEBIUS(*partial);
2877 14035 : GEN here = ifac_find(*partial);
2878 : long nf;
2879 :
2880 14035 : if (!here) return NULL; /* nothing left */
2881 : /* loop until first entry is a finished prime. May involve reallocations,
2882 : * thus updates of *partial */
2883 25196 : while (CLASS(here) != gen_2)
2884 : {
2885 15472 : if (CLASS(here) == gen_0) /* composite: crack it */
2886 : { /* make sure there's room for another factor */
2887 5748 : if (here < *partial + 6)
2888 : {
2889 0 : ifac_defrag(partial, &here);
2890 0 : if (here < *partial + 6) ifac_realloc(partial, &here, 1); /* no luck */
2891 : }
2892 5748 : nf = ifac_crack(partial, &here, moebius_mode);
2893 5748 : if (moebius_mode && EXPON(here) != gen_1) /* that was a power */
2894 : {
2895 2 : if (DEBUGLEVEL >= 3)
2896 0 : err_printf("IFAC: main loop: repeated new factor\n\t%Ps\n", *here);
2897 2 : return gen_0;
2898 : }
2899 : /* deal with the new unknowns. No sort: ifac_crack did it */
2900 5746 : ifac_whoiswho(partial, &here, nf);
2901 5746 : continue;
2902 : }
2903 9724 : if (CLASS(here) == gen_1) /* prime but not yet finished: finish it */
2904 : {
2905 9724 : if (ifac_divide(partial, &here, moebius_mode))
2906 : {
2907 7 : if (moebius_mode)
2908 : {
2909 0 : if (DEBUGLEVEL >= 3)
2910 0 : err_printf("IFAC: main loop: another factor was divisible by\n"
2911 : "\t%Ps\n", *here);
2912 0 : return gen_0;
2913 : }
2914 7 : ifac_resort(partial, &here); /* sort new cofactors down */
2915 7 : ifac_whoiswho(partial, &here, -1);
2916 : }
2917 9724 : continue;
2918 : }
2919 0 : pari_err_BUG("ifac_main [nonexistent factor class]");
2920 : } /* while */
2921 9724 : if (moebius_mode && EXPON(here) != gen_1)
2922 : {
2923 0 : if (DEBUGLEVEL >= 3)
2924 0 : err_printf("IFAC: after main loop: repeated old factor\n\t%Ps\n", *here);
2925 0 : return gen_0;
2926 : }
2927 9724 : if (DEBUGLEVEL >= 4)
2928 : {
2929 0 : nf = (*partial + lg(*partial) - here - 3)/3;
2930 0 : if (nf)
2931 0 : err_printf("IFAC: main loop: %ld factor%s left\n", nf, (nf>1)? "s": "");
2932 : else
2933 0 : err_printf("IFAC: main loop: this was the last factor\n");
2934 : }
2935 9724 : if (factor_add_primes && !(get_hint(partial) & 8))
2936 : {
2937 0 : GEN p = VALUE(here);
2938 0 : if (lgefint(p)>3 || uel(p,2) > 0x1000000UL) (void)addprimes(p);
2939 : }
2940 9724 : return here;
2941 : }
2942 :
2943 : /* Encapsulated routines */
2944 :
2945 : /* prime/exponent pairs need to appear contiguously on the stack, but we also
2946 : * need our data structure somewhere, and we don't know in advance how many
2947 : * primes will turn up. The following discipline achieves this: When
2948 : * ifac_decomp() is called, n should point at an object older than the oldest
2949 : * small prime/exponent pair (ifactor() guarantees this).
2950 : * We allocate sufficient space to accommodate several pairs -- eleven pairs
2951 : * ought to fit in a space not much larger than n itself -- before calling
2952 : * ifac_start(). If we manage to complete the factorization before we run out
2953 : * of space, we free the data structure and cull the excess reserved space
2954 : * before returning. When we do run out, we have to leapfrog to generate more
2955 : * (guesstimating the requirements from what is left in the partial
2956 : * factorization structure); room for fresh pairs is allocated at the head of
2957 : * the stack, followed by an ifac_realloc() to reconnect the data structure and
2958 : * move it out of the way, followed by a few pointer tweaks to connect the new
2959 : * pairs space to the old one. This whole affair translates into a surprisingly
2960 : * compact routine. */
2961 :
2962 : /* find primary factors of n; destroy n */
2963 : static long
2964 2569 : ifac_decomp(GEN n, long hint)
2965 : {
2966 2569 : pari_sp av = avma;
2967 2569 : long nb = 0;
2968 2569 : GEN part, here, workspc, pairs = (GEN)av;
2969 :
2970 : /* workspc will be doled out in pairs of smaller t_INTs. For n = prod p^{e_p}
2971 : * (p not necessarily prime), need room to store all p and e_p [ cgeti(3) ],
2972 : * bounded by
2973 : * sum_{p | n} ( log_{2^BIL} (p) + 6 ) <= log_{2^BIL} n + 6 log_2 n */
2974 2569 : workspc = new_chunk((expi(n) + 1) * 7);
2975 2569 : part = ifac_start_hint(n, 0, hint);
2976 : for (;;)
2977 : {
2978 7558 : here = ifac_main(&part);
2979 7558 : if (!here) break;
2980 4989 : if (gc_needed(av,1))
2981 : {
2982 : long offset;
2983 0 : if(DEBUGMEM>1)
2984 : {
2985 0 : pari_warn(warnmem,"[2] ifac_decomp");
2986 0 : ifac_print(part, here);
2987 : }
2988 0 : ifac_realloc(&part, &here, 0);
2989 0 : offset = here - part;
2990 0 : part = gc_upto((pari_sp)workspc, part);
2991 0 : here = part + offset;
2992 : }
2993 4989 : nb++;
2994 4989 : pairs = icopy_avma(VALUE(here), (pari_sp)pairs);
2995 4989 : pairs = icopy_avma(EXPON(here), (pari_sp)pairs);
2996 4989 : ifac_delete(here);
2997 : }
2998 2569 : set_avma((pari_sp)pairs);
2999 2569 : if (DEBUGLEVEL >= 3)
3000 0 : err_printf("IFAC: found %ld large prime (power) factor%s.\n",
3001 : nb, (nb>1? "s": ""));
3002 2569 : return nb;
3003 : }
3004 :
3005 : /***********************************************************************/
3006 : /** ARITHMETIC FUNCTIONS WITH EARLY-ABORT **/
3007 : /** needing direct access to the factoring machinery to avoid work: **/
3008 : /** e.g. if we find a square factor, moebius returns 0, core doesn't **/
3009 : /** need to factor it, etc. **/
3010 : /***********************************************************************/
3011 : /* memory management */
3012 : static void
3013 0 : ifac_GC(pari_sp av, GEN *part)
3014 : {
3015 0 : GEN here = NULL;
3016 0 : if(DEBUGMEM>1) pari_warn(warnmem,"ifac_xxx");
3017 0 : ifac_realloc(part, &here, 0);
3018 0 : *part = gc_upto(av, *part);
3019 0 : }
3020 :
3021 : /* destroys n */
3022 : static long
3023 236 : ifac_moebius(GEN n)
3024 : {
3025 236 : long mu = 1;
3026 236 : pari_sp av = avma;
3027 236 : GEN part = ifac_start(n, 1);
3028 : for(;;)
3029 468 : {
3030 : long v;
3031 : GEN p;
3032 704 : if (!ifac_next(&part,&p,&v)) return v? 0: mu;
3033 468 : mu = -mu;
3034 468 : if (gc_needed(av,1)) ifac_GC(av,&part);
3035 : }
3036 : }
3037 :
3038 : int
3039 760 : ifac_read(GEN part, GEN *p, long *e)
3040 : {
3041 760 : GEN here = ifac_find(part);
3042 760 : if (!here) return 0;
3043 400 : *p = VALUE(here);
3044 400 : *e = EXPON(here)[2];
3045 400 : return 1;
3046 : }
3047 : void
3048 320 : ifac_skip(GEN part)
3049 : {
3050 320 : GEN here = ifac_find(part);
3051 320 : if (here) ifac_delete(here);
3052 320 : }
3053 :
3054 : /* destroys n */
3055 : static int
3056 7 : ifac_ispowerful(GEN n)
3057 : {
3058 7 : pari_sp av = avma;
3059 7 : GEN part = ifac_start(n, 0);
3060 : for(;;)
3061 7 : {
3062 : long e;
3063 : GEN p;
3064 14 : if (!ifac_read(part,&p,&e)) return 1;
3065 : /* power: skip */
3066 7 : if (e != 1 || Z_isanypower(p,NULL)) { ifac_skip(part); continue; }
3067 0 : if (!ifac_next(&part,&p,&e)) return 1;
3068 0 : if (e == 1) return 0;
3069 0 : if (gc_needed(av,1)) ifac_GC(av,&part);
3070 : }
3071 : }
3072 : /* destroys n; assume n != 0 is composite */
3073 : static GEN
3074 353 : ifac_core(GEN n)
3075 : {
3076 353 : GEN m = gen_1, c = cgeti(lgefint(n));
3077 353 : pari_sp av = avma;
3078 353 : GEN part = ifac_start(n, 0);
3079 : for(;;)
3080 393 : {
3081 : long e;
3082 : GEN p;
3083 746 : if (!ifac_read(part,&p,&e)) return m;
3084 : /* square: skip */
3085 393 : if (!odd(e) || Z_issquare(p)) { ifac_skip(part); continue; }
3086 80 : if (!ifac_next(&part,&p,&e)) return m;
3087 80 : if (odd(e)) m = mulii(m, p);
3088 80 : if (gc_needed(av,1)) { affii(m,c); m=c; ifac_GC(av,&part); }
3089 : }
3090 : }
3091 :
3092 : /* must be >= 661 (various functions assume it in order to call uisprime_661
3093 : * instead of uisprime, and Z_isanypower_nosmalldiv instead of Z_isanypower) */
3094 : ulong
3095 4582290 : tridiv_boundu(ulong n)
3096 : {
3097 4582290 : long e = expu(n);
3098 4582306 : if(e<30) return 1UL<<12;
3099 : #ifdef LONG_IS_64BIT
3100 203084 : if(e<34) return 1UL<<13;
3101 113230 : if(e<37) return 1UL<<14;
3102 69538 : if(e<42) return 1UL<<15;
3103 32091 : if(e<47) return 1UL<<16;
3104 18238 : if(e<56) return 1UL<<17;
3105 5837 : if(e<56) return 1UL<<18;
3106 5837 : if(e<62) return 1UL<<19;
3107 1559 : return 1UL<<18;
3108 : #else
3109 7839 : return 1UL<<13;
3110 : #endif
3111 : }
3112 :
3113 : /* Where to stop trial dividing in factorization. Must be >= 661.
3114 : * If further n > 2^512, must be >= 2^14 */
3115 : ulong
3116 887548 : tridiv_bound(GEN n)
3117 : {
3118 887548 : if (lgefint(n)==3) return tridiv_boundu(n[2]);
3119 : else
3120 : {
3121 87959 : ulong l = (ulong)expi(n) + 1;
3122 87959 : if (l <= 512) return (l-16) << 10;
3123 1106 : return 1UL<<19; /* Rho is generally faster above this */
3124 : }
3125 : }
3126 :
3127 : /* destroys n */
3128 : static void
3129 807 : ifac_factoru(GEN n, long hint, GEN P, GEN E, long *pi)
3130 : {
3131 807 : GEN part = ifac_start_hint(n, 0, hint);
3132 807 : long i = *pi;
3133 : for(;;)
3134 1502 : {
3135 : long v;
3136 : GEN p;
3137 2309 : if (!ifac_next(&part,&p,&v)) { *pi = i; return; }
3138 1502 : P[i] = itou(p); E[i] = v; i++;
3139 : }
3140 : }
3141 : /* destroys n */
3142 : static long
3143 663 : ifac_moebiusu(GEN n)
3144 : {
3145 663 : GEN part = ifac_start(n, 1);
3146 663 : long s = 1;
3147 : for(;;)
3148 1326 : {
3149 : long v;
3150 : GEN p;
3151 1989 : if (!ifac_next(&part,&p,&v)) return v? 0: s;
3152 1326 : s = -s;
3153 : }
3154 : }
3155 :
3156 : INLINE ulong
3157 143889666 : u_forprime_next_fast(forprime_t *T)
3158 : {
3159 143889666 : if (++T->n <= pari_PRIMES[0])
3160 : {
3161 143891131 : T->p = pari_PRIMES[T->n];
3162 143891131 : return T->p > T->b ? 0: T->p;
3163 : }
3164 0 : return u_forprime_next(T);
3165 : }
3166 :
3167 : /* uisprime(n) knowing n has no prime divisor <= lim */
3168 : static int
3169 6721 : uisprime_nosmall(ulong n, ulong lim)
3170 6721 : { return (lim >= 661)? uisprime_661(n): uisprime(n); }
3171 :
3172 : static GEN factoru_sign(ulong n, ulong all, long hint, ulong *pU1, ulong *pU2);
3173 : static GEN ifactor_sign(GEN n, ulong all, long hint, long sn, GEN *pU);
3174 :
3175 : /* simplified version of factoru_sign, to be called on squarefree n whose
3176 : * prime divisors are in [minp, maxp]. In practice called with
3177 : * maxp <= maxprimelim() */
3178 : static GEN
3179 994640 : factoru_primes(ulong n, ulong minp, ulong maxp)
3180 : {
3181 : forprime_t S;
3182 : ulong p;
3183 : long i;
3184 : GEN P;
3185 :
3186 994640 : if (n < minp) return NULL;
3187 977254 : if (n <= maxp && PRIMES_search(n) > 0) return mkvecsmall(n);
3188 816981 : P = cgetg(16, t_VECSMALL); i = 1;
3189 816981 : u_forprime_init(&S, minp, maxp);
3190 38677773 : while ( (p = u_forprime_next_fast(&S)) )
3191 : {
3192 38677774 : ulong q = n / p;
3193 38677774 : if (n % p == 0)
3194 : {
3195 1319977 : P[i++] = p; n = q;
3196 1319977 : if (q <= p || (n <= maxp && PRIMES_search(n) > 0)) { P[i++] = n; break; }
3197 : }
3198 37357797 : else if (q <= p) { P[i++] = n; break; } /* n <= p^2: n is now prime */
3199 : }
3200 816979 : if (i == 1) return NULL;
3201 816979 : setlg(P, i); return P;
3202 : }
3203 : static GEN
3204 142022 : Z_factor_primes(GEN N, ulong minp, ulong maxp)
3205 : {
3206 : forprime_t S;
3207 142022 : ulong p, n = 0;
3208 : long i;
3209 : GEN P;
3210 142022 : if (lgefint(N) == 3) return factoru_primes(uel(N,2), minp, maxp);
3211 19092 : u_forprime_init(&S, minp, maxp);
3212 19092 : P = cgetg(expi(N) + 1, t_VECSMALL); i = 1;
3213 11404094 : while ( (p = u_forprime_next_fast(&S)) )
3214 : {
3215 : int stop;
3216 11404094 : long v = Z_lvalrem_stop(&N, p, &stop);
3217 11404094 : if (v) P[i++] = p;
3218 11404094 : if (stop)
3219 : {
3220 313 : if (!equali1(N)) P[i++] = uel(N,2);
3221 313 : goto END;
3222 : }
3223 11403781 : if (v && lgefint(N) == 3) { n = uel(N,2); break; }
3224 : }
3225 24059385 : if (n) while ( (p = u_forprime_next_fast(&S)) )
3226 : {
3227 24059385 : ulong q = n / p;
3228 24059385 : if (n % p == 0)
3229 : {
3230 64078 : P[i++] = p; n = q;
3231 64078 : if (q <= p || (n <= maxp && PRIMES_search(n) > 0)) { P[i++] = n; break; }
3232 : }
3233 23995307 : else if (q <= p) { P[i++] = n; break; } /* n <= p^2: n is now prime */
3234 : }
3235 0 : END:
3236 19092 : if (i == 1) return NULL;
3237 19092 : setlg(P, i); return P;
3238 : }
3239 :
3240 : /* N != 0. Product of odd prime divisors less than
3241 : * min(*pLIM, factorlimit) [WARNING!];
3242 : * with lim <= *pLIM < 2*lim and *pLIM prime
3243 : * Assume lim >= 128. Better for efficiency if N >= lim^2. */
3244 : static ulong
3245 872102 : u_oddprimedivisors_gcd(ulong N, ulong lim, ulong *pLIM)
3246 : {
3247 872102 : GEN PR = prodprimes(), LIM = prodprimeslim();
3248 872099 : long b = minss(lg(PR)-1, expu(lim)-6);
3249 : /* 2^{b+6} <= lim < 2^{b+7}, b >= 1 */
3250 872099 : *pLIM = LIM[b]; return ugcdiu(gel(PR,b), N);
3251 : }
3252 : /* not GC-clean */
3253 : static GEN
3254 142699 : Z_oddprimedivisors_gcd(GEN N, ulong lim, ulong *pLIM)
3255 : {
3256 142699 : GEN PR = prodprimes(), LIM = prodprimeslim();
3257 142699 : long b = minss(lg(PR)-1, expu(lim)-6);
3258 142699 : *pLIM = LIM[b]; return gcdii(N, gel(PR,b));
3259 : }
3260 :
3261 : /* Assume lim >= 128 and N odd. */
3262 : static GEN
3263 141419 : Z_oddprimedivisors_fast(GEN N, ulong lim)
3264 : {
3265 141419 : pari_sp av = avma;
3266 141419 : GEN Nr = Z_oddprimedivisors_gcd(N, lim, &lim);
3267 141419 : GEN P = Z_factor_primes(Nr, 3, lim);
3268 141419 : return P? P: gc_NULL(av);
3269 : }
3270 : /* return mask with bit 0, 1, 2 set if respectively 3, 5, 7 divide n */
3271 : static int
3272 16750446 : u_357_divides(ulong n)
3273 : { /* vector (105, i, n = i-1; !(n%3) + 2 * !(n%5) + 4 * !(n%7)) */
3274 16750446 : const unsigned int tab[] = {
3275 : 7,0,0,1,0,2,1,4,0,1,2,0,1,0,4,3,0,0,1,0,2,5,0,0,1,2,0,1,4,0,3,0,0,1,0,6,1,0,
3276 : 0,1,2,0,5,0,0,3,0,0,1,4,2,1,0,0,1,2,4,1,0,0,3,0,0,5,0,2,1,0,0,1,6,0,1,0,0,3,
3277 : 0,4,1,0,2,1,0,0,5,2,0,1,0,0,3,4,0,1,0,2,1,0,4,1,2,0,1,0,0};
3278 16750446 : return tab[n % 105UL];
3279 : }
3280 :
3281 : static GEN
3282 18489723 : factoru_result(GEN P, GEN E, long i)
3283 : {
3284 18489723 : GEN P2, E2, f = cgetg(3,t_VEC);
3285 18489310 : gel(f,1) = P2 = cgetg(i, t_VECSMALL);
3286 18488646 : gel(f,2) = E2 = cgetg(i, t_VECSMALL);
3287 56005715 : while (--i >= 1) { P2[i] = P[i]; E2[i] = E[i]; }
3288 18488637 : return f;
3289 : }
3290 :
3291 : /* Factor n and output [p,e] where
3292 : * p, e are vecsmall with n = prod{p[i]^e[i]}. If all != 0:
3293 : * if pU1 is not NULL, set *pU1 and *pU2 so that unfactored composite is
3294 : * U1^U2 with U1 not a pure power; else include it in factorization */
3295 : static GEN
3296 18948577 : factoru_sign(ulong n, ulong all, long hint, ulong *pU1, ulong *pU2)
3297 : {
3298 18948577 : pari_sp av = avma;
3299 18948577 : ulong ALL, p, lim = 0;
3300 18948577 : long i, oldi = -1;
3301 : forprime_t S;
3302 : GEN E, P;
3303 :
3304 18948577 : if (pU1) *pU1 = *pU2 = 1;
3305 18948577 : if (n == 0) retmkvec2(mkvecsmall(0), mkvecsmall(1));
3306 18948577 : if (n == 1) retmkvec2(cgetg(1,t_VECSMALL), cgetg(1,t_VECSMALL));
3307 :
3308 : /* enough room to store <= 15 primes and exponents (OK if n < 2^64) */
3309 18489173 : (void)new_chunk(3 + 16*2);
3310 18489171 : P = cgetg(16, t_VECSMALL); i = 1;
3311 18489064 : E = cgetg(16, t_VECSMALL);
3312 18488621 : ALL = all? all: ULONG_MAX; /* (!all || all > n) == ALL > n */
3313 18488621 : if (ALL > 2)
3314 : {
3315 : ulong maxp;
3316 18488595 : long v = vals(n);
3317 18488590 : if (v)
3318 : {
3319 12361272 : P[1] = 2; E[1] = v; i = 2;
3320 12361272 : n >>= v; if (n == 1) goto END;
3321 : }
3322 14996215 : if (ALL > 3)
3323 : {
3324 14996716 : int mask = u_357_divides(n);
3325 14997143 : if (mask)
3326 : {
3327 10188175 : if (mask & 1)
3328 6450054 : { P[i] = 3; E[i] = 1 + u_lvalrem(n / 3, 3, &n); i++;
3329 6450155 : if (n == 1) goto END; }
3330 7648098 : if ((mask & 2) && ALL > 5)
3331 3747182 : { P[i] = 5; E[i] = 1 + u_lvalrem(n / 5, 5, &n); i++;
3332 3747193 : if (n == 1) goto END; }
3333 5943940 : if ((mask & 4) && ALL > 7)
3334 2250478 : { P[i] = 7; E[i] = 1 + u_lvalrem(n / 7, 7, &n); i++;
3335 2250476 : if (n == 1) goto END; }
3336 : }
3337 : }
3338 9504185 : maxp = maxprime();
3339 9505622 : if (n <= maxp && PRIMES_search(n) > 0) { P[i] = n; E[i] = 1; i++; goto END; }
3340 3462309 : lim = all? all-1: tridiv_boundu(n);
3341 3462309 : if (lim >= 128 && n >= 691 * 691) /* expu(lim) >= 7 */
3342 6656 : { /* fast trial division */
3343 867348 : ulong gcdlim, gcd, sqrtn = usqrt(n);
3344 : GEN Q;
3345 867348 : lim = minuu(lim, sqrtn);
3346 867348 : gcd = u_oddprimedivisors_gcd(n, lim, &gcdlim);
3347 867348 : Q = factoru_primes(gcd, 11, gcdlim);
3348 867348 : maxp = GP_DATA->factorlimit;
3349 867348 : if (Q)
3350 : {
3351 853595 : long j, l = lg(Q);
3352 853595 : int stop = 0;
3353 2752077 : for (j = 1; j < l; j++)
3354 : {
3355 1898488 : ulong p = uel(Q,j);
3356 1898488 : if (all && p >= all) { stop = 1; break; }
3357 1898482 : E[i] = u_lvalrem_stop(&n, p, &stop); /* > 0 */
3358 1898482 : P[i] = p; i++;
3359 : }
3360 887284 : if (n == 1) goto END;
3361 36616 : if (stop || (n <= maxp && PRIMES_search(n) > 0))
3362 33689 : { P[i] = n; E[i] = 1; i++; goto END; }
3363 : }
3364 13753 : else if (lim == sqrtn && lim <= maxp)
3365 10024 : { P[i] = n; E[i] = 1; i++; goto END; }
3366 : }
3367 : else
3368 : { /* naive trial division */
3369 2594961 : maxp = lim;
3370 2594961 : u_forprime_init(&S, 11, lim);
3371 18938464 : while ( (p = u_forprime_next_fast(&S)) )
3372 : {
3373 : int stop;
3374 : /* tiny integers without small factors are often primes */
3375 18938120 : if (p == 673)
3376 : {
3377 2594899 : if (uisprime_661(n)) { P[i] = n; E[i] = 1; i++; goto END; }
3378 290 : oldi = i;
3379 : }
3380 18938120 : v = u_lvalrem_stop(&n, p, &stop);
3381 18938119 : if (v) { P[i] = p; E[i] = v; i++; }
3382 18938119 : if (stop)
3383 : {
3384 2594609 : if (n != 1) { P[i] = n; E[i] = 1; i++; }
3385 2594609 : goto END;
3386 : }
3387 : }
3388 : }
3389 7023 : if (lim > maxp)
3390 : { /* second pass usually empty, outside fast trial division range */
3391 : long v;
3392 6 : u_forprime_init(&S, maxp+1, lim);
3393 5296866 : while ((p = u_forprime_next(&S)))
3394 : {
3395 : int stop;
3396 5296892 : v = u_lvalrem_stop(&n, p, &stop);
3397 5296866 : if (v) { P[i] = p; E[i] = v; i++; }
3398 5296866 : if (stop)
3399 : {
3400 6 : if (n != 1) { P[i] = n; E[i] = 1; i++; }
3401 6 : goto END;
3402 : }
3403 : }
3404 : }
3405 : }
3406 : /* if i > oldi (includes oldi = -1) we don't know that n is composite */
3407 7017 : if (all)
3408 : { /* smallfact: look for easy pure powers then stop */
3409 : #ifdef LONG_IS_64BIT
3410 1062 : ulong mask = all > 563 ? (all > 7129 ? 1: 3): 7;
3411 : #else
3412 15 : ulong mask = all > 22 ? (all > 83 ? 1: 3): 7;
3413 : #endif
3414 1077 : long k = 1, ex;
3415 1552 : while (uissquareall(n, &n)) k <<= 1;
3416 1090 : while ( (ex = uis_357_power(n, &n, &mask)) ) k *= ex;
3417 1077 : if (pU1 && (i == oldi || !uisprime_nosmall(n, lim)))
3418 266 : { *pU1 = n; *pU2 = (ulong)k; }
3419 : else
3420 811 : { P[i] = n; E[i] = k; i++; }
3421 1077 : goto END;
3422 : }
3423 : /* we don't known that n is composite ? */
3424 5940 : if (oldi != i && uisprime_nosmall(n, lim)) { P[i]=n; E[i]=1; i++; goto END; }
3425 :
3426 : {
3427 : GEN perm;
3428 807 : ifac_factoru(utoipos(n), hint, P, E, &i);
3429 807 : setlg(P, i);
3430 807 : perm = vecsmall_indexsort(P);
3431 807 : P = vecsmallpermute(P, perm);
3432 807 : E = vecsmallpermute(E, perm);
3433 : }
3434 18490734 : END:
3435 18490734 : set_avma(av); return factoru_result(P, E, i);
3436 : }
3437 : GEN
3438 3812209 : factoru(ulong n)
3439 3812209 : { return factoru_sign(n, 0, decomp_default_hint, NULL, NULL); }
3440 :
3441 : ulong
3442 0 : radicalu(ulong n)
3443 : {
3444 0 : pari_sp av = avma;
3445 0 : return gc_long(av, zv_prod(gel(factoru(n),1)));
3446 : }
3447 :
3448 : long
3449 54194 : moebiusu_fact(GEN f)
3450 : {
3451 54194 : GEN E = gel(f,2);
3452 54194 : long i, l = lg(E);
3453 93569 : for (i = 1; i < l; i++)
3454 57834 : if (E[i] > 1) return 0;
3455 35735 : return odd(l)? 1: -1;
3456 : }
3457 :
3458 : long
3459 2491091 : moebiusu(ulong n)
3460 : {
3461 : pari_sp av;
3462 : long s, v, test_prime;
3463 : ulong p, lim;
3464 : int mask;
3465 :
3466 2491091 : switch(n)
3467 : {
3468 0 : case 0: (void)check_arith_non0(gen_0,"moebius");/*error*/
3469 569268 : case 1: return 1;
3470 106694 : case 2: return -1;
3471 : }
3472 : /* n > 2 */
3473 1832389 : p = n & 3; if (!p) return 0;
3474 1744253 : if (p == 2) { n >>= 1; s = -1; } else s = 1;
3475 1744253 : mask = u_357_divides(n);
3476 1763228 : if (mask)
3477 : {
3478 676670 : if (mask & 1) { n /= 3; s = -s; if (n % 3 == 0) return 0; }
3479 612850 : if (mask & 2) { n /= 5; s = -s; if (n % 5 == 0) return 0; }
3480 571475 : if (mask & 4) { n /= 7; s = -s; if (n % 7 == 0) return 0; }
3481 : }
3482 1622877 : if (n <= maxprimelim() && PRIMES_search(n) > 0) return -s;
3483 659556 : av = avma; lim = tridiv_boundu(n);
3484 670850 : if (n >= 691 * 691)
3485 : {
3486 4507 : ulong gcdlim, gcd, sqrtn = usqrt(n);
3487 : GEN P;
3488 4507 : lim = minuu(sqrtn, lim);
3489 4507 : gcd = u_oddprimedivisors_gcd(n, lim, &gcdlim);
3490 4507 : if (gcd != 1)
3491 : {
3492 3523 : n /= gcd;
3493 3846 : if (ugcd(gcd, n) != 1) return 0;
3494 : }
3495 4362 : P = factoru_primes(gcd, 11, gcdlim);
3496 4362 : if (P && odd(lg(P) - 1)) s = -s;
3497 4362 : if (n == 1) return gc_long(av, s);
3498 4060 : if (lim == sqrtn && lim <= GP_DATA->factorlimit) return gc_long(av, -s);
3499 4039 : test_prime = 1;
3500 : }
3501 : else
3502 : {
3503 : forprime_t S;
3504 666343 : u_forprime_init(&S, 3, lim);
3505 666144 : test_prime = 0;
3506 7425986 : while ((p = u_forprime_next_fast(&S)))
3507 : {
3508 : int stop;
3509 : /* tiny integers without small factors are often primes */
3510 7422455 : if (p == 673)
3511 : {
3512 0 : test_prime = 0;
3513 664575 : if (uisprime_661(n)) return gc_long(av,-s);
3514 : }
3515 7422455 : v = u_lvalrem_stop(&n, p, &stop);
3516 7423930 : if (v) {
3517 635551 : if (v > 1) return gc_long(av,0);
3518 593565 : test_prime = 1;
3519 593565 : s = -s;
3520 : }
3521 7381944 : if (stop) return gc_long(av, n==1? s: -s);
3522 : }
3523 : }
3524 4039 : set_avma(av);
3525 4039 : if (test_prime && uisprime_661(n)) return -s;
3526 : else
3527 : {
3528 663 : long t = ifac_moebiusu(utoipos(n));
3529 663 : set_avma(av);
3530 663 : if (t == 0) return 0;
3531 663 : return (s == t)? 1: -1;
3532 : }
3533 : }
3534 :
3535 : long
3536 57511 : moebius(GEN n)
3537 : {
3538 57511 : pari_sp av = avma;
3539 : GEN F;
3540 : ulong p, lim, n357;
3541 : long i, l, s, v, copy;
3542 : int mask;
3543 :
3544 57511 : if ((F = check_arith_non0(n,"moebius")))
3545 : {
3546 : GEN E;
3547 732 : F = clean_Z_factor(F);
3548 728 : E = gel(F,2);
3549 728 : l = lg(E);
3550 1428 : for(i = 1; i < l; i++)
3551 980 : if (!equali1(gel(E,i))) return gc_long(av,0);
3552 448 : return gc_long(av, odd(l)? 1: -1);
3553 : }
3554 56756 : if (lgefint(n) == 3) return moebiusu(uel(n,2));
3555 1608 : p = mod4(n); if (!p) return 0;
3556 1408 : copy = s = 1;
3557 1408 : if (p == 2)
3558 : {
3559 358 : n = shifti(n, -1);
3560 358 : copy = 0; s = -1;
3561 : }
3562 1408 : n357 = umodiu(n, 9 * 25 * 49);
3563 1408 : mask = u_357_divides(n357);
3564 1408 : if (mask)
3565 : {
3566 764 : ulong m = 1;
3567 764 : if (mask & 1) { m = 3; s = -s; }
3568 764 : if (mask & 2) { m *= 5; s = -s; }
3569 764 : if (mask & 4) { m *= 7; s = -s; }
3570 764 : if (u_357_divides(n357 / m)) return gc_long(av, 0);
3571 549 : copy = 0; n = diviuexact(n, m);
3572 : }
3573 1193 : if (copy) n = icopy(n);
3574 701 : else if (lgefint(n) == 3) return gc_long(av, s * moebiusu(uel(n,2)));
3575 883 : setabssign(n); lim = tridiv_bound(n);
3576 883 : if (lim >= 128)
3577 : {
3578 : ulong gcdlim;
3579 883 : GEN gcd = Z_oddprimedivisors_gcd(n, lim, &gcdlim);
3580 883 : if (!equali1(gcd))
3581 : {
3582 : GEN P;
3583 622 : n = diviiexact(n, gcd);
3584 808 : if (!equali1(gcdii(gcd, n))) return gc_long(av, 0);
3585 603 : P = Z_factor_primes(gcd, 11, gcdlim);
3586 603 : if (P)
3587 : {
3588 603 : if (odd(lg(P) - 1)) s = -s;
3589 603 : if (is_pm1(n)) return gc_long(av, s);
3590 1158 : if (lim <= GP_DATA->factorlimit &&
3591 741 : cmpii(sqru(lim), n) >= 0) return gc_long(av, -s); /* n prime */
3592 : }
3593 : }
3594 : }
3595 : else
3596 : {
3597 : forprime_t S;
3598 0 : u_forprime_init(&S, 3, lim);
3599 0 : while ((p = u_forprime_next_fast(&S)))
3600 : {
3601 : int stop;
3602 0 : v = Z_lvalrem_stop(&n, p, &stop);
3603 0 : if (v)
3604 : {
3605 0 : if (v > 1) return gc_long(av,0);
3606 0 : s = -s;
3607 : }
3608 0 : if (stop) return gc_long(av, is_pm1(n)? s: -s);
3609 : }
3610 : }
3611 678 : l = lg(primetab);
3612 682 : for (i = 1; i < l; i++)
3613 : {
3614 7 : v = Z_pvalrem(n, gel(primetab,i), &n);
3615 7 : if (v)
3616 : {
3617 7 : if (v > 1) return gc_long(av,0);
3618 5 : s = -s;
3619 5 : if (is_pm1(n)) return gc_long(av,s);
3620 : }
3621 : }
3622 675 : if (ifac_isprime(n)) return gc_long(av,-s);
3623 : /* large composite without small factors */
3624 236 : v = ifac_moebius(n);
3625 236 : return gc_long(av, s < 0? -v: v); /* correct also if v==0 */
3626 : }
3627 :
3628 : long
3629 1708 : ispowerful(GEN n)
3630 : {
3631 1708 : pari_sp av = avma;
3632 : GEN F;
3633 : ulong p, lim, n357;
3634 : long i, l, v;
3635 1708 : int mask, copy = 1;
3636 :
3637 1708 : if ((F = check_arith_all(n, "ispowerful")))
3638 : {
3639 742 : GEN p, P = gel(F,1), E = gel(F,2);
3640 742 : if (lg(P) == 1) return 1; /* 1 */
3641 728 : p = gel(P,1);
3642 728 : if (!signe(p)) return 1; /* 0 */
3643 707 : i = is_pm1(p)? 2: 1; /* skip -1 */
3644 707 : l = lg(E);
3645 980 : for (; i < l; i++)
3646 847 : if (equali1(gel(E,i))) return 0;
3647 133 : return 1;
3648 : }
3649 966 : if (!signe(n)) return 1;
3650 952 : if (mod4(n) == 2) return 0;
3651 623 : n357 = umodiu(n, 9 * 25 * 49);
3652 623 : mask = u_357_divides(n357);
3653 623 : if (mask)
3654 : {
3655 315 : if ((mask & 1) && n357 % 9) return 0;
3656 203 : if ((mask & 2) && n357 % 25) return 0;
3657 126 : if ((mask & 4) && n357 % 49) return 0;
3658 98 : if (mask & 1) (void)Z_lvalrem(diviuexact(n,9), 3, &n);
3659 98 : if (mask & 2) (void)Z_lvalrem(diviuexact(n,25), 5, &n);
3660 98 : if (mask & 4) (void)Z_lvalrem(diviuexact(n,49), 7, &n);
3661 98 : copy = 0;
3662 : }
3663 406 : if (!mod2(n)) { n = shifti(n, -vali(n)); copy = 0; }
3664 406 : if (is_pm1(n)) return gc_long(av, 1);
3665 238 : if (copy) n = icopy(n);
3666 238 : setabssign(n); lim = tridiv_bound(n);
3667 238 : if (cmpiu(n, 691 * 691) >= 0)
3668 : {
3669 70 : ulong gcdlim, sqrtn = 0;
3670 : GEN gcd;
3671 70 : if (lgefint(n) == 3)
3672 : {
3673 6 : sqrtn = usqrt(n[2]);
3674 6 : lim = minuu(sqrtn, lim);
3675 : }
3676 70 : gcd = Z_oddprimedivisors_gcd(n, lim, &gcdlim);
3677 70 : if (!equali1(gcd))
3678 : {
3679 : GEN r;
3680 70 : n = diviiexact(n, gcd);
3681 70 : n = dvmdii(n, gcd, &r);
3682 70 : if (r != gen_0) return gc_long(av, 0);
3683 70 : n = Z_ppo(n, gcd);
3684 : }
3685 : /* prime divisors > gcdlim */
3686 70 : if (equali1(n)) return gc_long(av, 1);
3687 7 : if (sqrtn && gcdlim >= sqrtn) return gc_long(av, 0); /* prime */
3688 : }
3689 : else
3690 : {
3691 : forprime_t S;
3692 168 : u_forprime_init(&S, 3, lim);
3693 378 : while ((p = u_forprime_next_fast(&S)))
3694 : {
3695 : int stop;
3696 378 : v = Z_lvalrem_stop(&n, p, &stop);
3697 546 : if (v == 1) return gc_long(av,0);
3698 378 : if (stop) return gc_long(av, is_pm1(n)); /* n > 1 is now prime */
3699 : }
3700 : }
3701 7 : l = lg(primetab);
3702 7 : for (i = 1; i < l; i++)
3703 : {
3704 0 : v = Z_pvalrem(n, gel(primetab,i), &n);
3705 0 : if (v)
3706 : {
3707 0 : if (v == 1) return gc_long(av,0);
3708 0 : if (is_pm1(n)) return gc_long(av,1);
3709 : }
3710 : }
3711 : /* no need to factor: must be p^2 or not powerful */
3712 7 : if (cmpii(powuu(lim+1, 3), n) > 0) return gc_long(av, Z_issquare(n));
3713 :
3714 7 : if (ifac_isprime(n)) return gc_long(av,0);
3715 : /* large composite without small factors */
3716 7 : return gc_long(av, ifac_ispowerful(n));
3717 : }
3718 :
3719 : ulong
3720 0 : coreu_fact(GEN f)
3721 : {
3722 0 : GEN P = gel(f,1), E = gel(f,2);
3723 0 : long i, l = lg(P), m = 1;
3724 0 : for (i = 1; i < l; i++)
3725 : {
3726 0 : ulong p = P[i], e = E[i];
3727 0 : if (e & 1) m *= p;
3728 : }
3729 0 : return m;
3730 : }
3731 :
3732 : /* d = a squarefree divisor of n. Return n / (n, d^oo)
3733 : * and set *pcore = \prod_{p | (n,d), v_p(n) odd} p
3734 : * Simpified form of Z_cba. */
3735 : static GEN
3736 327 : core_init_from_squarefree(GEN n, GEN d, GEN *pcore)
3737 : {
3738 327 : GEN c = gen_1;
3739 : long v;
3740 :
3741 327 : if (equali1(d)) { *pcore = c; return n; }
3742 260 : v = Z_pvalrem(n, d, &n);
3743 59 : for (;; v++)
3744 59 : { /* d^v divides "original n" */
3745 319 : GEN newd = gcdii(n, d); /* newd^{v+1} divides original n */
3746 319 : if (!equalii(d, newd))
3747 : { /* new d loses primes dividing original n to exact power v */
3748 310 : if (odd(v)) c = mulii(c, diviiexact(d, newd)); /* lost primes */
3749 310 : d = newd; if (equali1(d)) break;
3750 : }
3751 63 : if (equalii(d, n))
3752 : {
3753 4 : if (odd(v + 1)) c = mulii(c, d);
3754 4 : *pcore = c; return gen_1;
3755 : }
3756 59 : n = diviiexact(n, d);
3757 : }
3758 256 : *pcore = c; return n;
3759 : }
3760 : static ulong
3761 247 : coreu_init_from_squarefree(ulong n, ulong d, ulong *pcore)
3762 : {
3763 247 : ulong c = 1;
3764 : long v;
3765 :
3766 247 : if (d == 1) { *pcore = c; return n; }
3767 205 : v = u_lvalrem(n, d, &n);
3768 18 : for (;; v++)
3769 18 : { /* d^v divides "original n" */
3770 223 : ulong newd = ugcd(n, d); /* newd^{v+1} divides original n */
3771 223 : if (d != newd)
3772 : { /* new d loses primes dividing original n to exact power v */
3773 211 : if (odd(v)) c *= d / newd; /* lost primes */
3774 211 : d = newd; if (d == 1) break;
3775 : }
3776 90 : if (d == n)
3777 : {
3778 72 : if (odd(v + 1)) c *= d;
3779 72 : *pcore = c; return 1;
3780 : }
3781 18 : n /= d;
3782 : }
3783 133 : *pcore = c; return n;
3784 : }
3785 :
3786 : ulong
3787 63015 : coreu(ulong n)
3788 : {
3789 : ulong p, lim, m;
3790 : long v;
3791 :
3792 63015 : if (!n) return 0;
3793 63015 : m = 1;
3794 63015 : v = vals(n);
3795 63015 : if (v)
3796 : {
3797 4147 : n >>= v;
3798 4147 : if (odd(v)) m = 2;
3799 : }
3800 63015 : v = u_lvalrem(n, 3, &n); if (odd(v)) m *= 3;
3801 63015 : v = u_lvalrem(n, 5, &n); if (odd(v)) m *= 5;
3802 63015 : v = u_lvalrem(n, 7, &n); if (odd(v)) m *= 7;
3803 63015 : if (n == 1) return m;
3804 3320 : if (n <= maxprimelim() && PRIMES_search(n) > 0) return m * n;
3805 408 : lim = tridiv_boundu(n);
3806 408 : if (n >= 691 * 691)
3807 : {
3808 247 : ulong mpart, gcd, gcdlim, sqrtn = usqrt(n);
3809 247 : lim = minuu(sqrtn, lim);
3810 247 : gcd = u_oddprimedivisors_gcd(n, lim, &gcdlim);
3811 247 : n = coreu_init_from_squarefree(n, gcd, &mpart);
3812 247 : m *= mpart;
3813 266 : if (n == 1) return m;
3814 : /* n has no prime divisor <= gcdlim */
3815 103 : if ((lim == sqrtn && lim <= GP_DATA->factorlimit)
3816 96 : || (gcdlim + 1) * (gcdlim + 1) > n)
3817 19 : return m * n; /* prime */
3818 : }
3819 : else
3820 : {
3821 : forprime_t S;
3822 161 : u_forprime_init(&S, 11, lim);
3823 3633 : while ((p = u_forprime_next_fast(&S)))
3824 : {
3825 : int stop;
3826 3633 : v = u_lvalrem_stop(&n, p, &stop);
3827 3633 : if (v & 1) m *= p;
3828 3633 : if (stop) return n == 1? m: m * n; /* n > 1 is now prime */
3829 : }
3830 : }
3831 84 : if (uisprime_661(n)) return m * n;
3832 : else
3833 : {
3834 84 : pari_sp av = avma;
3835 84 : m *= itou(ifac_core(utoipos(n)));
3836 84 : return gc_ulong(av, m);
3837 : }
3838 : }
3839 :
3840 : GEN
3841 709573 : core(GEN n)
3842 : {
3843 709573 : pari_sp av = avma;
3844 : GEN m, mpart, gcd, F;
3845 : ulong lim, gcdlim, mask, m0;
3846 : long i, l, v, s;
3847 709573 : int copy = 1;
3848 :
3849 709573 : if ((F = check_arith_all(n, "core")))
3850 : {
3851 646247 : GEN p, x, P = gel(F,1), E = gel(F,2);
3852 646247 : long j = 1;
3853 646247 : if (lg(P) == 1) return gen_1;
3854 646219 : p = gel(P,1);
3855 646219 : if (!signe(p)) return gen_0;
3856 646177 : l = lg(P); x = cgetg(l, t_VEC);
3857 2283047 : for (i = 1; i < l; i++)
3858 1636881 : if (mpodd(gel(E,i))) gel(x,j++) = gel(P,i);
3859 646166 : setlg(x, j); return ZV_prod(x);
3860 : }
3861 63314 : s = signe(n);
3862 63314 : if (!s) return gen_0;
3863 63286 : if (lgefint(n) == 3)
3864 : {
3865 62878 : ulong c = coreu(uel(n,2));
3866 62878 : return s < 0? utoineg(c): utoipos(c);
3867 : }
3868 408 : v = vali(n); m0 = 1;
3869 408 : if (v)
3870 : {
3871 123 : n = shifti(n, -v); if (odd(v)) m0 *= 2;
3872 123 : copy = 0;
3873 : }
3874 408 : if ((mask = u_357_divides(umodiu(n, 3 * 5 * 7))))
3875 : {
3876 275 : if (mask & 1) { v = Z_lvalrem(n, 3, &n); if (odd(v)) m0 *= 3; }
3877 275 : if (mask & 2) { v = Z_lvalrem(n, 5, &n); if (odd(v)) m0 *= 5; }
3878 275 : if (mask & 4) { v = Z_lvalrem(n, 7, &n); if (odd(v)) m0 *= 7; ; }
3879 275 : copy = 0;
3880 : }
3881 408 : if (copy) n = absi(n); /* ifac_core destroys n */
3882 289 : else if (lgefint(n) == 3)
3883 : {
3884 81 : ulong c = coreu(uel(n,2));
3885 81 : m = muluu(m0, c); if (s < 0) setsigne(m, -1);
3886 81 : return gc_INT(av, m);
3887 : }
3888 327 : setabssign(n); lim = tridiv_bound(n);
3889 : /* n >= 691^2 */
3890 327 : gcd = Z_oddprimedivisors_gcd(n, lim, &gcdlim);
3891 327 : n = core_init_from_squarefree(n, gcd, &mpart);
3892 327 : m = mului(m0, mpart); if (s < 0) setsigne(m, -1);
3893 327 : if (equali1(n)) return gc_INT(av, m);
3894 : /* n has no prime divisor <= gcdlim */
3895 276 : if (cmpii(sqru(gcdlim + 1), n) > 0)
3896 2 : return gc_INT(av, mulii(m, n)); /* prime */
3897 274 : l = lg(primetab);
3898 750 : for (i = 1; i < l; i++)
3899 : {
3900 478 : GEN q = gel(primetab,i);
3901 478 : v = Z_pvalrem(n, q, &n);
3902 478 : if (v)
3903 : {
3904 8 : if (v & 1) m = mulii(m, q);
3905 8 : if (is_pm1(n)) return gc_INT(av, m);
3906 : }
3907 : }
3908 272 : if (!ifac_isprime(n)) n = ifac_core(n); /* composite without small factors */
3909 272 : return gc_INT(av, mulii(m, n));
3910 : }
3911 :
3912 : long
3913 0 : Z_issmooth(GEN m, ulong lim)
3914 : {
3915 0 : pari_sp av = avma;
3916 0 : ulong p = 2;
3917 : forprime_t S;
3918 0 : u_forprime_init(&S, 2, lim);
3919 0 : while ((p = u_forprime_next_fast(&S)))
3920 : {
3921 : int stop;
3922 0 : (void)Z_lvalrem_stop(&m, p, &stop);
3923 0 : if (stop) return gc_long(av, abscmpiu(m,lim) <= 0);
3924 : }
3925 0 : return gc_long(av,0);
3926 : }
3927 :
3928 : GEN
3929 175385 : Z_issmooth_fact(GEN m, ulong lim)
3930 : {
3931 175385 : pari_sp av = avma;
3932 : GEN F, P, E;
3933 : ulong p;
3934 175385 : long i = 1, l = expi(m)+1;
3935 : forprime_t S;
3936 175404 : P = cgetg(l, t_VECSMALL);
3937 175394 : E = cgetg(l, t_VECSMALL); F = mkmat2(P,E);
3938 175292 : if (l == 1) return F; /* m == 1 */
3939 175250 : u_forprime_init(&S, 2, lim);
3940 43353710 : while ((p = u_forprime_next_fast(&S)))
3941 : {
3942 : int stop;
3943 43311110 : long v = Z_lvalrem_stop(&m, p, &stop);
3944 43314290 : if (v) { P[i] = p; E[i] = v; i++; }
3945 43314290 : if (stop)
3946 : {
3947 135887 : if (abscmpiu(m,lim) > 0) break;
3948 111334 : if (m[2] > 1) { P[i] = m[2]; E[i] = 1; i++; }
3949 111334 : setlg(P, i);
3950 111426 : setlg(E, i); return gc_const((pari_sp)F, F);
3951 : }
3952 : }
3953 60175 : return gc_NULL(av);
3954 : }
3955 :
3956 : /* assume (x,p) = 1 */
3957 : static GEN
3958 14 : Z_to_Up(GEN x, GEN p, long d)
3959 14 : { retmkpadic_i(modii(x, _pd), p, powiu(p,d), 0, d); }
3960 : /* Is (a mod p^e) a K-th power ? p is prime and e > 0 */
3961 : static int
3962 798 : Zp_ispower(GEN a, GEN L, GEN K, GEN p, long e)
3963 : {
3964 798 : GEN t = gen_0;
3965 798 : long v = Z_pvalrem(a, p, &a), d = e - v;
3966 798 : if (d > 0)
3967 : { /* is a mod p^d a K-th power ? a p-unit */
3968 : ulong r;
3969 735 : v = uabsdivui_rem(v, K, &r);
3970 735 : if (r || !Fp_ispower(a, K, p)) return 0;
3971 623 : if (d == 1) /* mod p*/
3972 560 : { if (L) t = Fp_sqrtn(a, K, p, NULL); }
3973 63 : else if (dvdii(K, p))
3974 : { /* mod p^{2 +}, ramified case */
3975 14 : if (!ispower(Z_to_Up(a, p, d), K, L? &t: NULL)) return 0;
3976 14 : if (L) t = padic_to_Q(t);
3977 : }
3978 : else
3979 : { /* mod p^{2 +}, unramified case */
3980 49 : if (L)
3981 : {
3982 42 : t = Fp_sqrtn(a, K, p, NULL);
3983 42 : t = Zp_sqrtnlift(a, K, t, p, d);
3984 : }
3985 : }
3986 623 : if (L && v) t = mulii(t, powiu(p, v));
3987 : }
3988 686 : if (L) vectrunc_append(L, mkintmod(t, powiu(p, e)));
3989 686 : return 1;
3990 : }
3991 : long
3992 756 : Zn_ispower(GEN a, GEN q, GEN K, GEN *pt)
3993 : {
3994 : GEN L, N;
3995 : pari_sp av;
3996 : long e, i, l;
3997 : ulong pp, lim;
3998 :
3999 756 : if (!signe(a))
4000 : {
4001 91 : if (pt) {
4002 91 : GEN t = cgetg(3, t_INTMOD);
4003 91 : gel(t,1) = icopy(q); gel(t,2) = gen_0; *pt = t;
4004 : }
4005 91 : return 1;
4006 : }
4007 : /* a != 0 */
4008 665 : av = avma;
4009 :
4010 665 : if (typ(q) != t_INT) /* integer factorization */
4011 : {
4012 0 : GEN P = gel(q,1), E = gel(q,2);
4013 0 : l = lg(P);
4014 0 : L = pt? vectrunc_init(l): NULL;
4015 0 : for (i = 1; i < l; i++)
4016 : {
4017 0 : GEN p = gel(P,i);
4018 0 : long e = itos(gel(E,i));
4019 0 : if (!Zp_ispower(a, L, K, p, e)) return gc_long(av,0);
4020 : }
4021 0 : goto END;
4022 : }
4023 665 : e = vali(q); if (e) q = shifti(q, -e);
4024 665 : if (!mod2(K) && kronecker(a, q) == -1) return gc_long(av,0);
4025 658 : L = pt? vectrunc_init(expi(q)+2): NULL;
4026 658 : if (e)
4027 : {
4028 469 : if (!Zp_ispower(a, L, K, gen_2, e)) return gc_long(av,0);
4029 455 : a = modii(a, q);
4030 : }
4031 644 : lim = tridiv_bound(q);
4032 644 : if (cmpiu(q, 691 * 691) >= 0)
4033 : {
4034 161 : ulong sqrtq = lgefint(q) == 3? usqrt(q[2]): 0;
4035 : GEN P;
4036 161 : if (sqrtq) lim = minuu(sqrtq, lim);
4037 161 : P = Z_oddprimedivisors_fast(q, lim);
4038 161 : if (P)
4039 : {
4040 103 : long nP = lg(P) - 1;
4041 103 : int stop = 0;
4042 206 : for (i = 1; i <= nP; i++)
4043 : {
4044 151 : ulong pp = uel(P,i);
4045 151 : e = Z_lvalrem_stop(&q, pp, &stop);
4046 151 : if (!Zp_ispower(a, L, K, utoipos(pp), e)) return gc_long(av,0);
4047 103 : a = modii(a, q);
4048 : }
4049 55 : if (stop)
4050 : {
4051 48 : if (!is_pm1(q) && !Zp_ispower(a, L, K, q, 1)) return gc_long(av,0);
4052 48 : goto END;
4053 : }
4054 : }
4055 58 : else if (lim == sqrtq && lim <= GP_DATA->factorlimit)
4056 : {
4057 0 : if (!Zp_ispower(a, L, K, q, 1)) return gc_long(av,0);
4058 0 : goto END;
4059 : }
4060 : }
4061 : else
4062 : {
4063 : forprime_t S;
4064 483 : u_forprime_init(&S, 3, lim);
4065 237174 : while ((pp = u_forprime_next(&S)))
4066 : {
4067 : int stop;
4068 236754 : e = Z_lvalrem_stop(&q, pp, &stop);
4069 236754 : if (!e) continue;
4070 63 : if (!Zp_ispower(a, L, K, utoipos(pp), e)) return gc_long(av,0);
4071 56 : a = modii(a, q);
4072 56 : if (stop)
4073 : {
4074 56 : if (!is_pm1(q) && !Zp_ispower(a, L, K, q, 1)) return gc_long(av,0);
4075 56 : goto END;
4076 : }
4077 : }
4078 : }
4079 485 : l = lg(primetab);
4080 485 : for (i = 1; i < l; i++)
4081 : {
4082 0 : GEN p = gel(primetab,i);
4083 0 : e = Z_pvalrem(q, p, &q);
4084 0 : if (!e) continue;
4085 0 : if (!Zp_ispower(a, L, K, p, e)) return gc_long(av,0);
4086 0 : if (is_pm1(q)) goto END;
4087 0 : a = modii(a, q);
4088 : }
4089 485 : N = gcdii(a,q);
4090 485 : if (!is_pm1(N))
4091 : {
4092 52 : if (ifac_isprime(N))
4093 : {
4094 34 : e = Z_pvalrem(q, N, &q);
4095 34 : if (!Zp_ispower(a, L, K, N, e)) return gc_long(av,0);
4096 0 : a = modii(a, q);
4097 : }
4098 : else
4099 : {
4100 18 : GEN part = ifac_start(N, 0);
4101 : for(;;)
4102 18 : {
4103 : long e;
4104 : GEN p;
4105 36 : if (!ifac_next(&part, &p, &e)) break;
4106 18 : e = Z_pvalrem(q, p, &q);
4107 18 : if (!Zp_ispower(a, L, K, p, e)) return gc_long(av,0);
4108 18 : a = modii(a, q);
4109 : }
4110 : }
4111 : }
4112 451 : if (!is_pm1(q))
4113 : {
4114 31 : if (ifac_isprime(q))
4115 : {
4116 4 : if (!Zp_ispower(a, L, K, q, 1)) return gc_long(av,0);
4117 : }
4118 : else
4119 : { /* icopy needed: ifac_next would destroy q */
4120 27 : GEN part = ifac_start(icopy(q), 0);
4121 : for(;;)
4122 43 : {
4123 : long e;
4124 : GEN p;
4125 70 : if (!ifac_next(&part, &p, &e)) break;
4126 52 : if (!Zp_ispower(a, L, K, p, e)) return gc_long(av,0);
4127 43 : a = modii(a, q);
4128 : }
4129 : }
4130 : }
4131 420 : END:
4132 546 : if (!pt) return gc_long(av, 1);
4133 476 : *pt = gc_upto(av, chinese1_coprime_Z(L)); return 1;
4134 : }
4135 :
4136 :
4137 : /***********************************************************************/
4138 : /** **/
4139 : /** COMPUTING THE MATRIX OF PRIME DIVISORS AND EXPONENTS **/
4140 : /** **/
4141 : /***********************************************************************/
4142 : static GEN
4143 142849 : aux_end(GEN M, GEN n, long nb)
4144 : {
4145 142849 : GEN P,E, z = (GEN)avma;
4146 : long i;
4147 :
4148 142849 : guncloneNULL(n);
4149 142849 : P = cgetg(nb+1,t_COL);
4150 142849 : E = cgetg(nb+1,t_COL);
4151 912807 : for (i=nb; i; i--)
4152 : { /* allow a stackdummy in the middle */
4153 857180 : while (typ(z) != t_INT) z += lg(z);
4154 769958 : gel(E,i) = z; z += lg(z);
4155 769958 : gel(P,i) = z; z += lg(z);
4156 : }
4157 142849 : gel(M,1) = P;
4158 142849 : gel(M,2) = E;
4159 142849 : return sort_factor(M, (void*)&abscmpii, cmp_nodata);
4160 : }
4161 :
4162 : static void
4163 764969 : STORE(long *nb, GEN x, long e) { (*nb)++; (void)x; (void)utoipos(e); }
4164 : static void
4165 737031 : STOREu(long *nb, ulong x, long e) { STORE(nb, utoipos(x), e); }
4166 : static void
4167 27786 : STOREi(long *nb, GEN x, long e) { STORE(nb, icopy(x), e); }
4168 : /* no prime less than p divides n; return 1 if factored completely */
4169 : static int
4170 36046 : special_primes(GEN n, ulong p, long *nb, GEN T)
4171 : {
4172 36046 : long l = lg(T);
4173 36046 : if (l > 1)
4174 : { /* pp = square of biggest p tried so far */
4175 536 : long i, k, pp[] = { evaltyp(t_INT)|_evallg(4), 0,0,0 };
4176 536 : pari_sp av = avma; affii(sqru(p), pp); set_avma(av);
4177 1168 : for (i = 1; i < l; i++)
4178 765 : if ((k = Z_pval_inplace(n, gel(T,i))))
4179 : {
4180 231 : STOREi(nb, gel(T,i), k);
4181 231 : if (abscmpii(pp, n) > 0)
4182 : {
4183 133 : if (!is_pm1(n)) STOREi(nb, n, 1);
4184 133 : return 1;
4185 : }
4186 : }
4187 : }
4188 35913 : return 0;
4189 : }
4190 :
4191 : /* factor(sn*|n|), where sn = -1 or 1.
4192 : * all != 0 : only look for prime divisors < all. If pU is not NULL,
4193 : * set it to unfactored composite */
4194 : static GEN
4195 15278787 : ifactor_sign(GEN n, ulong all, long hint, long sn, GEN *pU)
4196 : {
4197 : GEN M, N;
4198 : pari_sp av;
4199 15278787 : long nb = 0, nb0 = -1, i;
4200 : ulong lim;
4201 : forprime_t T;
4202 :
4203 15278787 : if (lgefint(n) == 3)
4204 : { /* small integer */
4205 15135952 : GEN f, Pf, Ef, P, E, F = cgetg(3, t_MAT);
4206 : ulong U1, U2;
4207 : long l;
4208 15136375 : av = avma;
4209 : /* enough room to store <= 15 primes and exponents (OK if n < 2^64) */
4210 15136375 : (void)new_chunk((15*3 + 15 + 1) * 2);
4211 15136355 : f = factoru_sign(uel(n,2), all, hint, pU? &U1: NULL, pU? &U2: NULL);
4212 15136483 : set_avma(av);
4213 15136474 : Pf = gel(f,1);
4214 15136474 : Ef = gel(f,2);
4215 15136474 : l = lg(Pf);
4216 15136474 : if (sn < 0)
4217 : { /* add sign */
4218 6519 : long L = l+1;
4219 6519 : gel(F,1) = P = cgetg(L, t_COL);
4220 6519 : gel(F,2) = E = cgetg(L, t_COL);
4221 6519 : gel(P,1) = gen_m1; P++;
4222 6519 : gel(E,1) = gen_1; E++;
4223 : }
4224 : else
4225 : {
4226 15129955 : gel(F,1) = P = cgetg(l, t_COL);
4227 15129973 : gel(F,2) = E = cgetg(l, t_COL);
4228 : }
4229 46079299 : for (i = 1; i < l; i++)
4230 : {
4231 30942854 : gel(P,i) = utoipos(Pf[i]);
4232 30942850 : gel(E,i) = utoipos(Ef[i]);
4233 : }
4234 15136445 : if (pU) *pU = U1 == 1? NULL: mkvec2(utoipos(U1), utoipos(U2));
4235 15136444 : return F;
4236 : }
4237 142835 : if (pU) *pU = NULL;
4238 142835 : M = cgetg(3,t_MAT);
4239 142849 : if (sn < 0) STORE(&nb, utoineg(1), 1);
4240 142849 : if (is_pm1(n)) return aux_end(M,NULL,nb);
4241 :
4242 142849 : n = N = gclone(n); setabssign(n);
4243 : /* trial division bound; look for primes <= lim; nb is the number of
4244 : * distinct prime factors so far; if nb0 >= 0, it records the value of nb
4245 : * for which we made a successful compositeness test: if later nb = nb0,
4246 : * we know that n is composite */
4247 142849 : lim = 1;
4248 142849 : if (!all || all > 2)
4249 : { /* trial divide p < all if all != 0, else p <= tridiv_bound() */
4250 : ulong maxp, p;
4251 : pari_sp av2;
4252 142835 : i = vali(n);
4253 142835 : if (i)
4254 : {
4255 88956 : STOREu(&nb, 2, i);
4256 88956 : av = avma; affii(shifti(n,-i), n); set_avma(av);
4257 : }
4258 142835 : if (is_pm1(n)) return aux_end(M,n,nb);
4259 142717 : lim = all? all-1: tridiv_bound(n);
4260 142717 : av = avma;
4261 142717 : if (lim >= 128)
4262 : { /* fast trial division */
4263 141258 : GEN Q = Z_oddprimedivisors_fast(n, lim);
4264 141258 : av2 = avma;
4265 141258 : if (Q)
4266 : {
4267 138667 : long l = lg(Q);
4268 782455 : for (i = 1; i < l; i++)
4269 : {
4270 644773 : pari_sp av3 = avma;
4271 644773 : ulong p = uel(Q, i);
4272 : long k;
4273 644773 : if (all && p >= all) break;
4274 643788 : k = Z_lvalrem(n, p, &n); /* > 0 */
4275 643788 : affii(n, N); n = N; set_avma(av3);
4276 643788 : STOREu(&nb, p, k);
4277 : }
4278 138667 : if (is_pm1(n))
4279 : {
4280 106363 : stackdummy(av, av2);
4281 106363 : return aux_end(M,n,nb);
4282 : }
4283 : }
4284 34895 : maxp = GP_DATA->factorlimit;
4285 : }
4286 : else
4287 : { /* naive trial division */
4288 1459 : maxp = maxprime();
4289 1459 : u_forprime_init(&T, 3, minuu(lim, maxp)); av2 = avma;
4290 : /* first pass: known to fit in private prime table */
4291 31033 : while ((p = u_forprime_next_fast(&T)))
4292 : {
4293 29895 : pari_sp av3 = avma;
4294 : int stop;
4295 29895 : long k = Z_lvalrem_stop(&n, p, &stop);
4296 29895 : if (k)
4297 : {
4298 4286 : affii(n, N); n = N; set_avma(av3);
4299 4286 : STOREu(&nb, p, k);
4300 : }
4301 : /* prodeuler(p=2,16381,1-1/p) ~ 0.0578; if probability of being prime
4302 : * knowing P^-(n) > 16381 is at least 10%, try BPSW */
4303 29895 : if (!stop && p == 16381)
4304 : {
4305 0 : if (bit_accuracy_mul(lgefint(n), 0.0578 * M_LN2) < 10)
4306 0 : { nb0 = nb; stop = ifac_isprime(n); }
4307 : }
4308 29895 : if (stop)
4309 : {
4310 321 : if (!is_pm1(n)) STOREi(&nb, n, 1);
4311 321 : stackdummy(av, av2);
4312 321 : return aux_end(M,n,nb);
4313 : }
4314 : }
4315 : }
4316 36033 : stackdummy(av, av2);
4317 36033 : if (lim > maxp)
4318 : { /* second pass usually empty, outside fast trial division range */
4319 1 : av = avma; u_forprime_init(&T, maxp+1, lim); av2 = avma;
4320 882811 : while ((p = u_forprime_next(&T)))
4321 : {
4322 882811 : pari_sp av3 = avma;
4323 : int stop;
4324 882811 : long k = Z_lvalrem_stop(&n, p, &stop);
4325 882811 : if (k)
4326 : {
4327 1 : affii(n, N); n = N; set_avma(av3);
4328 1 : STOREu(&nb, p, k);
4329 : }
4330 882811 : if (stop)
4331 : {
4332 1 : if (!is_pm1(n)) STOREi(&nb, n, 1);
4333 1 : stackdummy(av, av2);
4334 1 : return aux_end(M,n,nb);
4335 : }
4336 : }
4337 0 : stackdummy(av, av2);
4338 : }
4339 : }
4340 36046 : if (special_primes(n, lim, &nb, primetab)) return aux_end(M,n, nb);
4341 : /* if nb > nb0 (includes nb0 = -1) we don't know that n is composite */
4342 35913 : if (all)
4343 : { /* smallfact: look for easy pure powers then stop. Cf Z_isanypower */
4344 : GEN x;
4345 27997 : long k, e = expu(lim);
4346 27997 : av = avma;
4347 26687 : k = e >= 10? Z_isanypower_nosmalldiv(n, e, &x)
4348 27997 : : Z_isanypower(n, &x);
4349 27997 : if (k > 1) { affii(x, n); nb0 = -1; } else if (k < 1) k = 1;
4350 27997 : if (pU)
4351 : {
4352 : GEN F;
4353 13155 : if (abscmpiu(n, lim) <= 0
4354 13155 : || cmpii(n, sqru(lim)) <= 0
4355 8823 : || ((e >= 14) &&
4356 7870 : (nb>nb0 && bit_accuracy(lgefint(n))<2048 && ifac_isprime(n))))
4357 13155 : { set_avma(av); STOREi(&nb, n, k); return aux_end(M,n, nb); }
4358 5943 : set_avma(av); F = aux_end(M, NULL, nb); /* don't destroy n */
4359 5943 : *pU = mkvec2(icopy(n), utoipos(k)); /* composite cofactor */
4360 5943 : gunclone(n); return F;
4361 : }
4362 14842 : set_avma(av); STOREi(&nb, n, k);
4363 14842 : if (DEBUGLEVEL >= 2) {
4364 0 : pari_warn(warner,
4365 0 : "IFAC: untested %ld-bit integer declared prime", expi(n)+1);
4366 0 : if (expi(n) <= 256) err_printf("\t%Ps\n", n);
4367 : }
4368 : }
4369 7916 : else if (nb > nb0 && ifac_isprime(n)) STOREi(&nb, n, 1);
4370 2569 : else nb += ifac_decomp(n, hint);
4371 22758 : return aux_end(M,n, nb);
4372 : }
4373 :
4374 : static GEN
4375 10324369 : ifactor(GEN n, ulong all, long hint)
4376 : {
4377 10324369 : long s = signe(n);
4378 10324369 : if (!s) retmkmat2(mkcol(gen_0), mkcol(gen_1));
4379 10324320 : return ifactor_sign(n, all, hint, s, NULL);
4380 : }
4381 :
4382 : int
4383 6477 : ifac_next(GEN *part, GEN *p, long *e)
4384 : {
4385 6477 : GEN here = ifac_main(part);
4386 6477 : if (here == gen_0) { *p = NULL; *e = 1; return 0; }
4387 6475 : if (!here) { *p = NULL; *e = 0; return 0; }
4388 4735 : *p = VALUE(here);
4389 4735 : *e = EXPON(here)[2];
4390 4735 : ifac_delete(here); return 1;
4391 : }
4392 :
4393 : /* see before ifac_crack for current semantics of 'hint' (factorint's 'flag') */
4394 : GEN
4395 10290 : factorint(GEN n, long flag)
4396 : {
4397 : GEN F;
4398 10290 : if ((F = check_arith_all(n,"factorint"))) return gcopy(F);
4399 10276 : return ifactor(n,0,flag);
4400 : }
4401 :
4402 : GEN
4403 55350 : Z_factor_limit(GEN n, ulong all)
4404 : {
4405 55350 : if (!all) all = GP_DATA->factorlimit + 1;
4406 55350 : return ifactor(n, all, decomp_default_hint);
4407 : }
4408 : GEN
4409 895453 : absZ_factor_limit_strict(GEN n, ulong all, GEN *pU)
4410 : {
4411 : GEN F, U;
4412 895453 : if (!signe(n))
4413 : {
4414 0 : if (pU) *pU = NULL;
4415 0 : retmkmat2(mkcol(gen_0), mkcol(gen_1));
4416 : }
4417 895453 : if (!all) all = GP_DATA->factorlimit + 1;
4418 895453 : F = ifactor_sign(n, all, decomp_default_hint, 1, &U);
4419 895494 : if (pU) *pU = U;
4420 895494 : return F;
4421 : }
4422 : GEN
4423 287685 : absZ_factor_limit(GEN n, ulong all)
4424 : {
4425 287685 : if (!signe(n)) retmkmat2(mkcol(gen_0), mkcol(gen_1));
4426 287685 : if (!all) all = GP_DATA->factorlimit + 1;
4427 287685 : return ifactor_sign(n, all, decomp_default_hint, 1, NULL);
4428 : }
4429 : GEN
4430 10258830 : Z_factor(GEN n)
4431 10258830 : { return ifactor(n,0,decomp_default_hint); }
4432 : GEN
4433 3768253 : absZ_factor(GEN n)
4434 : {
4435 3768253 : if (!signe(n)) retmkmat2(mkcol(gen_0), mkcol(gen_1));
4436 3768239 : return ifactor_sign(n, 0, decomp_default_hint, 1, NULL);
4437 : }
4438 : /* Factor until the unfactored part is smaller than limit. Return the
4439 : * factored part. Hence factorback(output) may be smaller than n */
4440 : GEN
4441 3045 : Z_factor_until(GEN n, GEN limit)
4442 : {
4443 3045 : pari_sp av = avma;
4444 3045 : long s = signe(n), eq;
4445 : GEN q, F, U;
4446 :
4447 3045 : if (!s) retmkmat2(mkcol(gen_0), mkcol(gen_1));
4448 3045 : F = ifactor_sign(n, tridiv_bound(n), decomp_default_hint, s, &U);
4449 3045 : if (!U) return F;
4450 1155 : q = gel(U,1); /* composite, q^eq = unfactored part */
4451 1155 : eq = itou(gel(U,2));
4452 1155 : if (cmpii(eq == 1? q: powiu(q, eq), limit) > 0)
4453 : { /* factor further */
4454 1022 : long l2 = expi(q)+1;
4455 : GEN P2, E2, F2, part;
4456 1022 : if (eq > 1) limit = sqrtnint(limit, eq);
4457 1022 : P2 = coltrunc_init(l2);
4458 1022 : E2 = coltrunc_init(l2); F2 = mkmat2(P2,E2);
4459 1022 : part = ifac_start(icopy(q), 0); /* ifac_next would destroy q */
4460 : for(;;)
4461 70 : {
4462 : long e;
4463 : GEN p;
4464 1092 : if (!ifac_next(&part,&p,&e)) break;
4465 1092 : vectrunc_append(P2, p);
4466 1092 : vectrunc_append(E2, utoipos(e * eq));
4467 1092 : q = diviiexact(q, powiu(p, e));
4468 1092 : if (cmpii(q, limit) <= 0) break;
4469 : }
4470 1022 : F2 = sort_factor(F2, (void*)&abscmpii, cmp_nodata);
4471 1022 : F = merge_factor(F, F2, (void*)&abscmpii, cmp_nodata);
4472 : }
4473 1155 : return gc_GEN(av, F);
4474 : }
4475 :
4476 : static void
4477 102257941 : matsmalltrunc_append(GEN m, ulong p, ulong e)
4478 : {
4479 102257941 : GEN P = gel(m,1), E = gel(m,2);
4480 102257941 : long l = lg(P);
4481 102257941 : P[l] = p; lg_increase(P);
4482 102255149 : E[l] = e; lg_increase(E);
4483 102250862 : }
4484 : static GEN
4485 40048504 : matsmalltrunc_init(long l)
4486 : {
4487 40048504 : GEN P = vecsmalltrunc_init(l);
4488 40032300 : GEN E = vecsmalltrunc_init(l); return mkvec2(P,E);
4489 : }
4490 :
4491 : /* return optimal N s.t. omega(b) <= N for all b <= x */
4492 : long
4493 71820 : maxomegau(ulong x)
4494 : { /* P=primes(15); for(i=1,15, print([i, vecprod(P[1..i])])) */
4495 71820 : if (x < 30030UL)/* rare trivial cases */
4496 : {
4497 37662 : if (x < 2UL) return 0;
4498 19406 : if (x < 6UL) return 1;
4499 13806 : if (x < 30UL) return 2;
4500 13099 : if (x < 210UL) return 3;
4501 12840 : if (x < 2310UL) return 4;
4502 11776 : return 5;
4503 : }
4504 34158 : if (x < 510510UL) return 6; /* most frequent case */
4505 18753 : if (x < 9699690UL) return 7;
4506 7 : if (x < 223092870UL) return 8;
4507 : #ifdef LONG_IS_64BIT
4508 6 : if (x < 6469693230UL) return 9;
4509 0 : if (x < 200560490130UL) return 10;
4510 0 : if (x < 7420738134810UL) return 11;
4511 0 : if (x < 304250263527210UL) return 12;
4512 0 : if (x < 13082761331670030UL) return 13;
4513 0 : if (x < 614889782588491410UL) return 14;
4514 0 : return 15;
4515 : #else
4516 1 : return 9;
4517 : #endif
4518 : }
4519 : /* return optimal N s.t. omega(b) <= N for all odd b <= x */
4520 : long
4521 2358 : maxomegaoddu(ulong x)
4522 : { /* P=primes(15+1); for(i=1,15, print([i, vecprod(P[2..i+1])])) */
4523 2358 : if (x < 255255UL)/* rare trivial cases */
4524 : {
4525 1415 : if (x < 3UL) return 0;
4526 1415 : if (x < 15UL) return 1;
4527 1415 : if (x < 105UL) return 2;
4528 1415 : if (x < 1155UL) return 3;
4529 1387 : if (x < 15015UL) return 4;
4530 1387 : return 5;
4531 : }
4532 943 : if (x < 4849845UL) return 6; /* most frequent case */
4533 0 : if (x < 111546435UL) return 7;
4534 0 : if (x < 3234846615UL) return 8;
4535 : #ifdef LONG_IS_64BIT
4536 0 : if (x < 100280245065UL) return 9;
4537 0 : if (x < 3710369067405UL) return 10;
4538 0 : if (x < 152125131763605UL) return 11;
4539 0 : if (x < 6541380665835015UL) return 12;
4540 0 : if (x < 307444891294245705UL) return 13;
4541 0 : if (x < 16294579238595022365UL) return 14;
4542 0 : return 15;
4543 : #else
4544 0 : return 9;
4545 : #endif
4546 : }
4547 :
4548 : /* If a <= c <= b , factoru(c) = L[c-a+1] */
4549 : GEN
4550 31967 : vecfactoru_i(ulong a, ulong b)
4551 : {
4552 31967 : ulong k, p, n = b-a+1, N = maxomegau(b) + 1;
4553 31967 : GEN v = const_vecsmall(n, 1);
4554 31967 : GEN L = cgetg(n+1, t_VEC);
4555 : forprime_t T;
4556 21405368 : for (k = 1; k <= n; k++) gel(L,k) = matsmalltrunc_init(N);
4557 31967 : u_forprime_init(&T, 2, usqrt(b));
4558 885825 : while ((p = u_forprime_next(&T)))
4559 : { /* p <= sqrt(b) */
4560 853778 : ulong pk = p, K = ulogint(b, p);
4561 2971853 : for (k = 1; k <= K; k++)
4562 : {
4563 2117995 : ulong j, t = a / pk, ap = t * pk;
4564 2117995 : if (ap < a) { ap += pk; t++; }
4565 : /* t = (j+a-1) \ pk */
4566 2117995 : t %= p;
4567 62676987 : for (j = ap-a+1; j <= n; j += pk)
4568 : {
4569 60558918 : if (t) { v[j] *= pk; matsmalltrunc_append(gel(L,j), p,k); }
4570 60558992 : if (++t == p) t = 0;
4571 : }
4572 2118069 : pk *= p;
4573 : }
4574 : }
4575 : /* complete factorisation of non-sqrt(b)-smooth numbers */
4576 21522638 : for (k = 1, N = a; k <= n; k++, N++)
4577 21491970 : if (uel(v,k) != N) matsmalltrunc_append(gel(L,k), N/uel(v,k),1UL);
4578 30668 : return L;
4579 : }
4580 : GEN
4581 0 : vecfactoru(ulong a, ulong b)
4582 : {
4583 0 : pari_sp av = avma;
4584 0 : return gc_GEN(av, vecfactoru_i(a,b));
4585 : }
4586 :
4587 : /* Assume a and b odd, return L s.t. L[k] = factoru(a + 2*(k-1))
4588 : * If a <= c <= b odd, factoru(c) = L[(c-a)>>1 + 1] */
4589 : GEN
4590 2358 : vecfactoroddu_i(ulong a, ulong b)
4591 : {
4592 2358 : ulong k, p, n = ((b-a)>>1) + 1, N = maxomegaoddu(b) + 1;
4593 2358 : GEN v = const_vecsmall(n, 1);
4594 2358 : GEN L = cgetg(n+1, t_VEC);
4595 : forprime_t T;
4596 :
4597 18757537 : for (k = 1; k <= n; k++) gel(L,k) = matsmalltrunc_init(N);
4598 2358 : u_forprime_init(&T, 3, usqrt(b));
4599 194438 : while ((p = u_forprime_next(&T)))
4600 : { /* p <= sqrt(b) */
4601 194789 : ulong pk = p, K = ulogint(b, p);
4602 660819 : for (k = 1; k <= K; k++)
4603 : {
4604 468739 : ulong j, t = (a / pk) | 1UL, ap = t * pk;
4605 : /* t and ap are odd, ap multiple of pk = p^k */
4606 468739 : if (ap < a) { ap += pk<<1; t+=2; }
4607 : /* c=t*p^k by steps of 2*p^k; factorization of c*=p^k if (t,p)=1 */
4608 468739 : t %= p;
4609 34781150 : for (j = ((ap-a)>>1)+1; j <= n; j += pk)
4610 : {
4611 34315181 : if (t) { v[j] *= pk; matsmalltrunc_append(gel(L,j), p,k); }
4612 34312411 : t += 2; if (t >= p) t -= p;
4613 : }
4614 465969 : pk *= p;
4615 : }
4616 : }
4617 : /* complete factorisation of non-sqrt(b)-smooth numbers */
4618 18874816 : for (k = 1, N = a; k <= n; k++, N+=2)
4619 18872438 : if (uel(v,k) != N) matsmalltrunc_append(gel(L,k), N/uel(v,k),1UL);
4620 2378 : return L;
4621 : }
4622 : GEN
4623 0 : vecfactoroddu(ulong a, ulong b)
4624 : {
4625 0 : pari_sp av = avma;
4626 0 : return gc_GEN(av, vecfactoroddu_i(a,b));
4627 : }
4628 :
4629 : /* If 0 <= a <= c <= b; L[c-a+1] = factoru(c)[,1] if c squarefree, else NULL */
4630 : GEN
4631 7014 : vecfactorsquarefreeu(ulong a, ulong b)
4632 : {
4633 7014 : ulong k, p, n = b-a+1, N = maxomegau(b) + 1;
4634 7014 : GEN v = const_vecsmall(n, 1);
4635 7014 : GEN L = cgetg(n+1, t_VEC);
4636 : forprime_t T;
4637 14007238 : for (k = 1; k <= n; k++) gel(L,k) = vecsmalltrunc_init(N);
4638 7014 : u_forprime_init(&T, 2, usqrt(b));
4639 838334 : while ((p = u_forprime_next(&T)))
4640 : { /* p <= sqrt(b), kill nonsquarefree */
4641 831320 : ulong j, pk = p*p, t = a / pk, ap = t * pk;
4642 831320 : if (ap < a) ap += pk;
4643 7160090 : for (j = ap-a+1; j <= n; j += pk) gel(L,j) = NULL;
4644 :
4645 831320 : t = a / p; ap = t * p;
4646 831320 : if (ap < a) { ap += p; t++; }
4647 30551556 : for (j = ap-a+1; j <= n; j += p, t++)
4648 29720236 : if (gel(L,j)) { v[j] *= p; vecsmalltrunc_append(gel(L,j), p); }
4649 : }
4650 : /* complete factorisation of non-sqrt(b)-smooth numbers */
4651 14007238 : for (k = 1, N = a; k <= n; k++, N++)
4652 14000224 : if (gel(L,k) && uel(v,k) != N) vecsmalltrunc_append(gel(L,k), N/uel(v,k));
4653 7014 : return L;
4654 : }
4655 : /* If 0 <= a <= c <= b; L[c-a+1] = factoru(c)[,1] if c squarefree and coprime
4656 : * to all the primes in sorted zv P, else NULL */
4657 : GEN
4658 32762 : vecfactorsquarefreeu_coprime(ulong a, ulong b, GEN P)
4659 : {
4660 32762 : ulong k, p, n = b-a+1, sqb = usqrt(b), N = maxomegau(b) + 1;
4661 32762 : GEN v = const_vecsmall(n, 1);
4662 32762 : GEN L = cgetg(n+1, t_VEC);
4663 : forprime_t T;
4664 92257294 : for (k = 1; k <= n; k++) gel(L,k) = vecsmalltrunc_init(N);
4665 32761 : u_forprime_init(&T, 2, sqb);
4666 3680820 : while ((p = u_forprime_next(&T)))
4667 : { /* p <= sqrt(b), kill nonsquarefree */
4668 3646260 : ulong j, t, ap, bad = zv_search(P, p), pk = bad ? p: p * p;
4669 3646612 : t = a / pk; ap = t * pk; if (ap < a) ap += pk;
4670 82002224 : for (j = ap-a+1; j <= n; j += pk) gel(L,j) = NULL;
4671 3646612 : if (bad) continue;
4672 :
4673 3584290 : t = a / p; ap = t * p;
4674 3584290 : if (ap < a) { ap += p; t++; }
4675 118484745 : for (j = ap-a+1; j <= n; j += p, t++)
4676 114899009 : if (gel(L,j)) { v[j] *= p; vecsmalltrunc_append(gel(L,j), p); }
4677 : }
4678 32761 : if (uel(P,lg(P)-1) <= sqb) P = NULL;
4679 : /* complete factorisation of non-sqrt(b)-smooth numbers */
4680 92496469 : for (k = 1, N = a; k <= n; k++, N++)
4681 92463708 : if (gel(L,k) && uel(v,k) != N)
4682 : {
4683 26202547 : ulong q = N / uel(v,k);
4684 26202547 : if (!P || !zv_search(P, q)) vecsmalltrunc_append(gel(L,k), q);
4685 : }
4686 32761 : return L;
4687 : }
4688 :
4689 : GEN
4690 49 : vecsquarefreeu(ulong a, ulong b)
4691 : {
4692 49 : ulong j, k, p, n = b-a+1;
4693 49 : GEN L = const_vecsmall(n, 1);
4694 : forprime_t T;
4695 49 : u_forprime_init(&T, 2, usqrt(b));
4696 462 : while ((p = u_forprime_next(&T)))
4697 : { /* p <= sqrt(b), kill nonsquarefree */
4698 413 : ulong pk = p*p, t = a / pk, ap = t * pk;
4699 413 : if (ap < a) { ap += pk; t++; }
4700 : /* t = (j+a-1) \ pk */
4701 21777 : for (j = ap-a+1; j <= n; j += pk, t++) L[j] = 0;
4702 : }
4703 48258 : for (k = j = 1; k <= n; k++)
4704 48209 : if (L[k]) L[j++] = a+k-1;
4705 49 : setlg(L,j); return L;
4706 : }
|