Line data Source code
1 : #line 2 "../src/kernel/none/halfgcd.c"
2 : /* Copyright (C) 2019 The PARI group.
3 :
4 : This file is part of the PARI/GP package.
5 :
6 : PARI/GP is free software; you can redistribute it and/or modify it under the
7 : terms of the GNU General Public License as published by the Free Software
8 : Foundation; either version 2 of the License, or (at your option) any later
9 : version. It is distributed in the hope that it will be useful, but WITHOUT
10 : ANY WARRANTY WHATSOEVER.
11 :
12 : Check the License for details. You should have received a copy of it, along
13 : with the package; see the file 'COPYING'. If not, write to the Free Software
14 : Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. */
15 :
16 : GEN
17 2338 : ZM2_sqr(GEN A)
18 : {
19 2338 : GEN a = gcoeff(A,1,1), b = gcoeff(A,1,2), a2 = sqri(a);
20 2338 : GEN c = gcoeff(A,2,1), d = gcoeff(A,2,2), d2 = sqri(d), t = addii(a,d);
21 2338 : if (equalii(b, c)) /* symetric, 3S + 1M */
22 : {
23 322 : GEN b2 = sqri(b), M = cgetg(3, t_MAT), tb = mulii(b, t);
24 322 : gel(M,1) = mkcol2(addii(a2, b2), tb);
25 322 : gel(M,2) = mkcol2(tb, addii(b2, d2)); return M;
26 : }
27 : else
28 : { /* general, 2S + 3M */
29 2016 : GEN bc = mulii(b, c);
30 2016 : retmkmat2(mkcol2(addii(bc, a2), mulii(c, t)),
31 : mkcol2(mulii(b, t), addii(bc, d2)));
32 : }
33 : }
34 :
35 : GEN
36 7286881 : ZM2_mul(GEN A, GEN B)
37 : {
38 7286881 : const long t = ZM2_MUL_LIMIT+2;
39 7286881 : GEN A11=gcoeff(A,1,1),A12=gcoeff(A,1,2), B11=gcoeff(B,1,1),B12=gcoeff(B,1,2);
40 7286881 : GEN A21=gcoeff(A,2,1),A22=gcoeff(A,2,2), B21=gcoeff(B,2,1),B22=gcoeff(B,2,2);
41 7286881 : if (lgefint(A11) < t || lgefint(B11) < t || lgefint(A22) < t || lgefint(B22) < t
42 128292 : || lgefint(A12) < t || lgefint(B12) < t || lgefint(A21) < t || lgefint(B21) < t)
43 : { /* 8M */
44 7161247 : GEN a = mulii(A11, B11), b = mulii(A12, B21);
45 7160578 : GEN c = mulii(A11, B12), d = mulii(A12, B22);
46 7160545 : GEN e = mulii(A21, B11), f = mulii(A22, B21);
47 7160599 : GEN g = mulii(A21, B12), h = mulii(A22, B22);
48 7160533 : retmkmat2(mkcol2(addii(a,b), addii(e,f)), mkcol2(addii(c,d), addii(g,h)));
49 : } else
50 : { /* Strassen: 7M */
51 125634 : GEN M1 = mulii(addii(A11,A22), addii(B11,B22));
52 125635 : GEN M2 = mulii(addii(A21,A22), B11);
53 125635 : GEN M3 = mulii(A11, subii(B12,B22));
54 125635 : GEN M4 = mulii(A22, subii(B21,B11));
55 125635 : GEN M5 = mulii(addii(A11,A12), B22);
56 125635 : GEN M6 = mulii(subii(A21,A11), addii(B11,B12));
57 125635 : GEN M7 = mulii(subii(A12,A22), addii(B21,B22));
58 125635 : GEN T1 = addii(M1,M4), T2 = subii(M7,M5);
59 125635 : GEN T3 = subii(M1,M2), T4 = addii(M3,M6);
60 125635 : retmkmat2(mkcol2(addii(T1,T2), addii(M2,M4)),
61 : mkcol2(addii(M3,M5), addii(T3,T4)));
62 : }
63 : }
64 :
65 : static GEN
66 867 : matid2(void)
67 : {
68 867 : retmkmat2(mkcol2(gen_1,gen_0),
69 : mkcol2(gen_0,gen_1));
70 : }
71 :
72 : /* Return M*[q,1;1,0] */
73 : static GEN
74 3061344 : mulq(GEN M, GEN q)
75 : {
76 3061344 : GEN u, v, res = cgetg(3, t_MAT);
77 3061321 : u = addii(mulii(gcoeff(M,1,1), q), gcoeff(M,1,2));
78 3061353 : v = addii(mulii(gcoeff(M,2,1), q), gcoeff(M,2,2));
79 3061350 : gel(res,1) = mkcol2(u, v);
80 3061339 : gel(res,2) = gel(M,1);
81 3061339 : return res;
82 : }
83 : static GEN
84 71 : mulqab(GEN M, GEN q, GEN *ap, GEN *bp)
85 : {
86 71 : GEN b = subii(*ap, mulii(*bp, q));
87 71 : *ap = *bp; *bp = b;
88 71 : return mulq(M,q);
89 : }
90 :
91 : /* Return M*[q,1;1,0]^-1 */
92 :
93 : static GEN
94 1284 : mulqi(GEN M, GEN q, GEN *ap, GEN *bp)
95 : {
96 : GEN u, v, res, a;
97 1284 : a = addii(mulii(*ap, q), *bp);
98 1284 : *bp = *ap; *ap = a;
99 1284 : res = cgetg(3, t_MAT);
100 1284 : u = subii(gcoeff(M,1,1),mulii(gcoeff(M,1,2), q));
101 1284 : v = subii(gcoeff(M,2,1),mulii(gcoeff(M,2,2), q));
102 1284 : gel(res,1) = gel(M,2);
103 1284 : gel(res,2) = mkcol2(u,v);
104 1284 : return res;
105 : }
106 :
107 : /* test whether n is a power of 2 */
108 : static long
109 22879013 : isint2n(GEN n)
110 : {
111 : GEN x;
112 22879013 : long lx = lgefint(n), i;
113 22879013 : if (lx == 2) return 0;
114 22879013 : x = int_MSW(n);
115 22879013 : if (*(ulong*)x != 1UL<<expu(*(ulong*)x) ) return 0;
116 542199 : for (i = 3; i < lx; i++)
117 : {
118 534814 : x = int_precW(x); if (*x) return 0;
119 : }
120 7385 : return 1;
121 : }
122 :
123 : static long
124 22879277 : uexpi(GEN a)
125 22879277 : { return expi(a)+!isint2n(a); }
126 :
127 : static GEN
128 123341 : FIXUP0(GEN M, GEN *a, GEN *b, long m)
129 : {
130 123341 : long cnt=0;
131 156456 : while (expi(*b) >= m)
132 : {
133 33115 : GEN r, q = dvmdii(*a, *b, &r);
134 33115 : *a = *b; *b = r;
135 33115 : M = mulq(M, q);
136 33115 : cnt++;
137 : };
138 123341 : if (cnt>6) pari_err_BUG("FIXUP0");
139 123341 : return M;
140 : }
141 :
142 : static long
143 6280956 : signdet(GEN Q)
144 : {
145 6280956 : long a = Mod4(gcoeff(Q,1,1)), b = Mod4(gcoeff(Q,1,2));
146 6280892 : long c = Mod4(gcoeff(Q,2,1)), d = Mod4(gcoeff(Q,2,2));
147 6282008 : return ((a*d-b*c)&3)==1 ? 1 : -1;
148 : }
149 :
150 : static GEN
151 6097935 : ZM_inv2(GEN M)
152 : {
153 6097935 : long e = signdet(M);
154 9556720 : if (e==1) return mkmat22(gcoeff(M,2,2),negi(gcoeff(M,1,2)),
155 3458113 : negi(gcoeff(M,2,1)),gcoeff(M,1,1));
156 2640631 : else return mkmat22(negi(gcoeff(M,2,2)),gcoeff(M,1,2),
157 2640650 : gcoeff(M,2,1),negi(gcoeff(M,1,1)));
158 : }
159 :
160 : static GEN
161 1284 : lastq(GEN Q)
162 : {
163 1284 : GEN p = gcoeff(Q,1,1), q = gcoeff(Q,1,2), s = gcoeff(Q,2,2);
164 1284 : if (signe(q)==0) pari_err_BUG("halfgcd");
165 1284 : if (signe(s)==0) return p;
166 1284 : if (equali1(q)) return subiu(p,1);
167 1284 : return divii(p, q);
168 : }
169 :
170 : static GEN
171 7820 : mulT(GEN Q, GEN *ap, GEN *bp)
172 : {
173 7820 : *ap = addii(*ap, *bp);
174 7820 : *bp = negi(*bp);
175 7820 : return mkmat2(gel(Q,1),
176 7819 : mkcol2(subii(gcoeff(Q,1,1), gcoeff(Q,1,2))
177 7820 : , subii(gcoeff(Q,2,1), gcoeff(Q,2,2))));
178 : }
179 :
180 : static GEN
181 183039 : FIXUP1(GEN M, GEN a, GEN b, long m, long t, GEN *ap, GEN *bp)
182 : {
183 183039 : GEN Q = gel(M,1), a0 = gel(M,2), b0 = gel(M,3);
184 183039 : GEN q, am = remi2n(a, m), bm = remi2n(b, m);
185 183236 : if (signdet(Q)==-1)
186 : {
187 121255 : *ap = subii(mulii(bm, gcoeff(Q,1,2)),mulii(am, gcoeff(Q,2,2)));
188 121156 : *bp = subii(mulii(am, gcoeff(Q,2,1)),mulii(bm, gcoeff(Q,1,1)));
189 121376 : *ap = addii(*ap, shifti(addii(a0, gcoeff(Q,2,2)), m));
190 121342 : *bp = addii(*bp, shifti(subii(b0, gcoeff(Q,2,1)), m));
191 120862 : if (signe(*bp) >= 0)
192 112959 : return Q;
193 7903 : if (expi(addii(*ap,*bp)) >= m+t)
194 7820 : return mulT(Q, ap ,bp);
195 83 : q = lastq(Q);
196 83 : Q = mulqi(Q, q, ap, bp);
197 83 : if (cmpiu(q, 2)>=0)
198 71 : return mulqab(Q, subiu(q,1), ap, bp);
199 : else
200 12 : return mulqi(Q, lastq(Q), ap, bp);
201 : }
202 : else
203 : {
204 61855 : *ap = subii(mulii(am, gcoeff(Q,2,2)),mulii(bm, gcoeff(Q,1,2)));
205 61855 : *bp = subii(mulii(bm, gcoeff(Q,1,1)),mulii(am, gcoeff(Q,2,1)));
206 61855 : *ap = addii(*ap, shifti(subii(a0, gcoeff(Q,2,2)), m));
207 61855 : *bp = addii(*bp, shifti(addii(b0, gcoeff(Q,2,1)), m));
208 61855 : if (expi(*ap) >= m+t)
209 60666 : return FIXUP0(Q, ap, bp, m+t);
210 : else
211 1189 : return signe(gcoeff(Q,1,2))==0? Q: mulqi(Q, lastq(Q), ap, bp);
212 : }
213 : }
214 :
215 : static long
216 22816701 : magic_threshold(GEN a)
217 22816701 : { return (3+uexpi(a))>>1; }
218 :
219 : static GEN
220 14796576 : HGCD_basecase(GEN y, GEN x)
221 : {
222 14796576 : pari_sp av = avma;
223 : GEN d, d1, q, r;
224 : GEN u, u1, v, v1;
225 : ulong xu, xu1, xv, xv1; /* Lehmer stage recurrence matrix */
226 : int lhmres; /* Lehmer stage return value */
227 :
228 14796576 : long m = magic_threshold(y);
229 :
230 : /* There is no special case for single-word numbers since this is
231 : * mainly meant to be used with large moduli. */
232 14796604 : if (cmpii(y,x) <= 0)
233 : {
234 97779 : d = x; d1 = y;
235 97779 : u = gen_1; u1 = gen_0;
236 97779 : v = gen_0; v1 = gen_1;
237 : } else
238 : {
239 14698784 : d = y; d1 = x;
240 14698784 : u = gen_0; u1 = gen_1;
241 14698784 : v = gen_1; v1 = gen_0;
242 : }
243 34199853 : while (lgefint(d) > 3 && expi(d1) >= m + BITS_IN_LONG + 1)
244 : {
245 : /* do a Lehmer-Jebelean round */
246 19714645 : lhmres = lgcdii((ulong *)d, (ulong *)d1, &xu, &xu1, &xv, &xv1, 0);
247 :
248 19721623 : if (lhmres)
249 : {
250 18699431 : if (lhmres == 1 || lhmres == -1)
251 : {
252 438837 : if (xv1 == 1)
253 : {
254 372522 : r = subii(d,d1); d = d1; d1 = r;
255 372523 : r = addii(u,u1); u = u1; u1 = r;
256 372399 : r = addii(v,v1); v = v1; v1 = r;
257 : }
258 : else
259 : {
260 66315 : r = subii(d, mului(xv1,d1)); d = d1; d1 = r;
261 66315 : r = addii(u, mului(xv1,u1)); u = u1; u1 = r;
262 66315 : r = addii(v, mului(xv1,v1)); v = v1; v1 = r;
263 : }
264 : }
265 : else
266 : {
267 18260594 : r = subii(muliu(d,xu), muliu(d1,xv));
268 18255407 : d1 = subii(muliu(d,xu1), muliu(d1,xv1)); d = r;
269 18256105 : r = addii(muliu(u,xu), muliu(u1,xv));
270 18254380 : u1 = addii(muliu(u,xu1), muliu(u1,xv1)); u = r;
271 18254337 : r = addii(muliu(v,xu), muliu(v1,xv));
272 18254247 : v1 = addii(muliu(v,xu1), muliu(v1,xv1)); v = r;
273 18257326 : if (lhmres&1) togglesign(d); else togglesign(d1);
274 : }
275 : } /* lhmres != 0 */
276 19718126 : if (expi(d1) < m) break;
277 :
278 19403899 : if (lhmres <= 0 && signe(d1))
279 : {
280 1077382 : q = dvmdii(d,d1,&r);
281 1077391 : d = d1; d1 = r;
282 1077391 : r = addii(u, mulii(q,u1)); u = u1; u1 = r;
283 1076974 : r = addii(v, mulii(q,v1)); v = v1; v1 = r;
284 : }
285 19403487 : if (gc_needed(av,1))
286 : {
287 0 : if(DEBUGMEM>1) pari_warn(warnmem,"ratlift");
288 0 : (void)gc_all(av, 6, &d, &d1, &u, &u1, &v, &v1);
289 : }
290 : }
291 84302968 : while (expi(d1) >= m)
292 : {
293 69506246 : GEN r, q = dvmdii(d,d1, &r);
294 69517168 : d = d1; d1 = r; swap(u,u1); swap(v,v1);
295 69517168 : u1 = addii(mulii(u, q), u1);
296 69506384 : v1 = addii(mulii(v, q), v1);
297 : }
298 14788630 : return gc_GEN(av, mkvec3(mkmat22(u1,u,v1,v), d, d1));
299 : }
300 :
301 : static GEN HGCD(GEN x, GEN y);
302 :
303 : /*
304 : Based on
305 : Klaus Thull and Chee K. Yap,
306 : A unified approach to HGCD algorithms for polynomials andintegers,
307 : 1990, Manuscript.
308 : URL: http://cs.nyu.edu/cs/faculty/yap/papers.
309 : */
310 :
311 : static GEN
312 120833 : HGCD_split(GEN a, GEN b)
313 : {
314 120833 : pari_sp av = avma;
315 120833 : long m = magic_threshold(a), t, l, k, tp;
316 : GEN a0, b0, ap, bp, c, d, c0, d0, cp, dp, R, S, T, q, r;
317 120688 : if (signe(b) < 0 || cmpii(a,b)<0) pari_err_BUG("HGCD_split");
318 120710 : if (expi(b) < m)
319 462 : return gc_GEN(av, mkvec3(matid2(), a, b));
320 120186 : a0 = addiu(shifti(a, -m), 1);
321 120288 : if (cmpiu(a0,7) <= 0)
322 : {
323 0 : R = FIXUP0(matid2(), &a, &b, m);
324 0 : return gc_GEN(av, mkvec3(R, a, b));
325 : }
326 120305 : b0 = shifti(b,-m);
327 120546 : t = magic_threshold(a0);
328 120264 : R = FIXUP1(HGCD(a0,b0),a, b, m, t, &ap, &bp);
329 120030 : if (expi(bp) < m)
330 57243 : return gc_GEN(av, mkvec3(R, ap, bp));
331 62676 : q = dvmdii(ap, bp, &r);
332 62676 : c = bp; d = r;
333 62676 : if (cmpiu(shifti(c,-m),6) <= 0)
334 : {
335 21 : R = FIXUP0(mulq(R, q), &c, &d, m);
336 21 : return gc_GEN(av, mkvec3(R, c, d));
337 : }
338 62655 : l = uexpi(c);
339 62655 : k = 2*m-l-1; if (k<0) pari_err_BUG("halfgcd");
340 62655 : c0 = addiu(shifti(c, -k), 1); if (cmpiu(c0,8)<0) pari_err_BUG("halfgcd");
341 62655 : d0 = shifti(d, -k);
342 62655 : tp = magic_threshold(c0);
343 62655 : S = FIXUP1(HGCD(c0,d0), c, d, k, tp, &cp, &dp);
344 62654 : if (!(expi(cp)>=m+1 && m+1 > expi(dp))) pari_err_BUG("halfgcd");
345 62654 : T = FIXUP0(ZM2_mul(mulq(R, q), S), &cp, &dp, m);
346 62655 : return gc_GEN(av, mkvec3(T, cp, dp));
347 : }
348 :
349 : static GEN
350 14917179 : HGCD(GEN x, GEN y)
351 : {
352 14917179 : if (lgefint(y)-2 < HALFGCD_LIMIT)
353 14796551 : return HGCD_basecase(x, y);
354 : else
355 120628 : return HGCD_split(x, y);
356 : }
357 :
358 : static GEN
359 28900711 : HGCD0(GEN x, GEN y)
360 : {
361 28900711 : if (signe(y) >= 0 && cmpii(x, y) >= 0)
362 14730394 : return HGCD(x, y);
363 14170312 : if (cmpii(x, y) < 0)
364 : {
365 11800431 : GEN M = HGCD0(y, x), Q = gel(M,1);
366 11799246 : return mkvec3(mkmat22(gcoeff(Q,2,1),gcoeff(Q,2,2),gcoeff(Q,1,1),gcoeff(Q,1,2)),
367 11800746 : gel(M,2),gel(M,3));
368 : } /* Now y <= x*/
369 2369995 : if (signe(x) <= 0)
370 : { /* y <= x <=0 */
371 3973 : GEN M = HGCD(negi(y), negi(x)), Q = gel(M,1);
372 3973 : return mkvec3(mkmat22(negi(gcoeff(Q,2,1)),negi(gcoeff(Q,2,2)),
373 3973 : negi(gcoeff(Q,1,1)),negi(gcoeff(Q,1,2))),
374 3973 : gel(M,2),gel(M,3));
375 : }
376 : else /* y <= 0 <=x */
377 : {
378 2366022 : GEN M = HGCD0(x, negi(y)), Q = gel(M,1);
379 2366022 : return mkvec3(mkmat22(gcoeff(Q,1,1),gcoeff(Q,1,2),negi(gcoeff(Q,2,1)),negi(gcoeff(Q,2,2))),
380 2366022 : gel(M,2),gel(M,3));
381 : }
382 : }
383 :
384 : GEN
385 6098136 : halfgcdii(GEN A, GEN B)
386 : {
387 6098136 : pari_sp av = avma;
388 6098136 : GEN M, Q, a, b, m = abscmpii(A, B)>0 ? A: B;
389 6098172 : M = HGCD0(A,B); Q = gel(M,1); a = gel(M,2); b = gel(M,3);
390 9062179 : while (signe(b) && abscmpii(sqri(b), m) >= 0)
391 : {
392 2965201 : GEN r, q = dvmdii(a, b, &r);
393 2965179 : a = b; b = r;
394 2965179 : Q = mulq(Q, q);
395 : }
396 6097340 : return gc_GEN(av, mkvec2(ZM_inv2(Q),mkcol2(a,b)));
397 : }
|