Line  | Count  | Source (jump to first uncovered line)  | 
1  |  | /* Compute {up,n}^(-1) mod B^n. | 
2  |  |  | 
3  |  |    Contributed to the GNU project by Torbjorn Granlund.  | 
4  |  |  | 
5  |  |    THE FUNCTIONS IN THIS FILE ARE INTERNAL WITH MUTABLE INTERFACES.  IT IS ONLY  | 
6  |  |    SAFE TO REACH THEM THROUGH DOCUMENTED INTERFACES.  IN FACT, IT IS ALMOST  | 
7  |  |    GUARANTEED THAT THEY WILL CHANGE OR DISAPPEAR IN A FUTURE GMP RELEASE.  | 
8  |  |  | 
9  |  | Copyright (C) 2004-2007, 2009, 2012, 2017, 2021 Free Software Foundation, Inc.  | 
10  |  |  | 
11  |  | This file is part of the GNU MP Library.  | 
12  |  |  | 
13  |  | The GNU MP Library is free software; you can redistribute it and/or modify  | 
14  |  | it under the terms of either:  | 
15  |  |  | 
16  |  |   * the GNU Lesser General Public License as published by the Free  | 
17  |  |     Software Foundation; either version 3 of the License, or (at your  | 
18  |  |     option) any later version.  | 
19  |  |  | 
20  |  | or  | 
21  |  |  | 
22  |  |   * the GNU General Public License as published by the Free Software  | 
23  |  |     Foundation; either version 2 of the License, or (at your option) any  | 
24  |  |     later version.  | 
25  |  |  | 
26  |  | or both in parallel, as here.  | 
27  |  |  | 
28  |  | The GNU MP Library is distributed in the hope that it will be useful, but  | 
29  |  | WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY  | 
30  |  | or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License  | 
31  |  | for more details.  | 
32  |  |  | 
33  |  | You should have received copies of the GNU General Public License and the  | 
34  |  | GNU Lesser General Public License along with the GNU MP Library.  If not,  | 
35  |  | see https://www.gnu.org/licenses/.  */  | 
36  |  |  | 
37  |  | #include "gmp-impl.h"  | 
38  |  |  | 
39  |  |  | 
40  |  | /*  | 
41  |  |   r[k+1] = r[k] - r[k] * (u*r[k] - 1)  | 
42  |  |   r[k+1] = r[k] + r[k] - r[k]*(u*r[k])  | 
43  |  | */  | 
44  |  |  | 
45  |  | #if TUNE_PROGRAM_BUILD  | 
46  |  | #define NPOWS \  | 
47  |  |  ((sizeof(mp_size_t) > 6 ? 48 : 8*sizeof(mp_size_t)))  | 
48  |  | #else  | 
49  |  | #define NPOWS \  | 
50  |  |  ((sizeof(mp_size_t) > 6 ? 48 : 8*sizeof(mp_size_t)) - LOG2C (BINV_NEWTON_THRESHOLD))  | 
51  |  | #endif  | 
52  |  |  | 
53  |  | mp_size_t  | 
54  |  | mpn_binvert_itch (mp_size_t n)  | 
55  | 0  | { | 
56  | 0  |   mp_size_t itch_local = mpn_mulmod_bnm1_next_size (n);  | 
57  | 0  |   mp_size_t itch_out = mpn_mulmod_bnm1_itch (itch_local, n, (n + 1) >> 1);  | 
58  | 0  |   return itch_local + itch_out;  | 
59  | 0  | }  | 
60  |  |  | 
61  |  | void  | 
62  |  | mpn_binvert (mp_ptr rp, mp_srcptr up, mp_size_t n, mp_ptr scratch)  | 
63  | 0  | { | 
64  | 0  |   mp_ptr xp;  | 
65  | 0  |   mp_size_t rn, newrn;  | 
66  | 0  |   mp_size_t sizes[NPOWS], *sizp;  | 
67  | 0  |   mp_limb_t di;  | 
68  |  |  | 
69  |  |   /* Compute the computation precisions from highest to lowest, leaving the  | 
70  |  |      base case size in 'rn'.  */  | 
71  | 0  |   sizp = sizes;  | 
72  | 0  |   for (rn = n; ABOVE_THRESHOLD (rn, BINV_NEWTON_THRESHOLD); rn = (rn + 1) >> 1)  | 
73  | 0  |     *sizp++ = rn;  | 
74  |  | 
  | 
75  | 0  |   xp = scratch;  | 
76  |  |  | 
77  |  |   /* Compute a base value of rn limbs.  */  | 
78  | 0  |   MPN_ZERO (xp, rn);  | 
79  | 0  |   xp[0] = 1;  | 
80  | 0  |   binvert_limb (di, up[0]);  | 
81  | 0  |   if (BELOW_THRESHOLD (rn, DC_BDIV_Q_THRESHOLD))  | 
82  | 0  |     mpn_sbpi1_bdiv_q (rp, xp, rn, up, rn, -di);  | 
83  | 0  |   else  | 
84  | 0  |     mpn_dcpi1_bdiv_q (rp, xp, rn, up, rn, -di);  | 
85  |  | 
  | 
86  | 0  |   mpn_neg (rp, rp, rn);  | 
87  |  |  | 
88  |  |   /* Use Newton iterations to get the desired precision.  */  | 
89  | 0  |   for (; rn < n; rn = newrn)  | 
90  | 0  |     { | 
91  | 0  |       mp_size_t m;  | 
92  | 0  |       newrn = *--sizp;  | 
93  |  |  | 
94  |  |       /* X <- UR. */  | 
95  | 0  |       m = mpn_mulmod_bnm1_next_size (newrn);  | 
96  | 0  |       mpn_mulmod_bnm1 (xp, m, up, newrn, rp, rn, xp + m);  | 
97  |  |       /* Only the values in the range xp + rn .. xp + newrn - 1 are  | 
98  |  |    used by the _mullo_n below.  | 
99  |  |    Since m >= newrn, we do not need the following. */  | 
100  |  |       /* mpn_sub_1 (xp + m, xp, rn - (m - newrn), 1); */  | 
101  |  |  | 
102  |  |       /* R = R(X/B^rn) */  | 
103  | 0  |       mpn_mullo_n (rp + rn, rp, xp + rn, newrn - rn);  | 
104  | 0  |       mpn_neg (rp + rn, rp + rn, newrn - rn);  | 
105  | 0  |     }  | 
106  | 0  | }  |