Coverage Report

Created: 2024-06-28 06:19

/src/gmp-6.2.1/mpn/tdiv_qr.c
Line
Count
Source (jump to first uncovered line)
1
/* mpn_tdiv_qr -- Divide the numerator (np,nn) by the denominator (dp,dn) and
2
   write the nn-dn+1 quotient limbs at qp and the dn remainder limbs at rp.  If
3
   qxn is non-zero, generate that many fraction limbs and append them after the
4
   other quotient limbs, and update the remainder accordingly.  The input
5
   operands are unaffected.
6
7
   Preconditions:
8
   1. The most significant limb of the divisor must be non-zero.
9
   2. nn >= dn, even if qxn is non-zero.  (??? relax this ???)
10
11
   The time complexity of this is O(qn*qn+M(dn,qn)), where M(m,n) is the time
12
   complexity of multiplication.
13
14
Copyright 1997, 2000-2002, 2005, 2009, 2015 Free Software Foundation, Inc.
15
16
This file is part of the GNU MP Library.
17
18
The GNU MP Library is free software; you can redistribute it and/or modify
19
it under the terms of either:
20
21
  * the GNU Lesser General Public License as published by the Free
22
    Software Foundation; either version 3 of the License, or (at your
23
    option) any later version.
24
25
or
26
27
  * the GNU General Public License as published by the Free Software
28
    Foundation; either version 2 of the License, or (at your option) any
29
    later version.
30
31
or both in parallel, as here.
32
33
The GNU MP Library is distributed in the hope that it will be useful, but
34
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
35
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
36
for more details.
37
38
You should have received copies of the GNU General Public License and the
39
GNU Lesser General Public License along with the GNU MP Library.  If not,
40
see https://www.gnu.org/licenses/.  */
41
42
#include "gmp-impl.h"
43
#include "longlong.h"
44
45
46
void
47
mpn_tdiv_qr (mp_ptr qp, mp_ptr rp, mp_size_t qxn,
48
       mp_srcptr np, mp_size_t nn, mp_srcptr dp, mp_size_t dn)
49
24.2k
{
50
24.2k
  ASSERT_ALWAYS (qxn == 0);
51
52
24.2k
  ASSERT (nn >= 0);
53
24.2k
  ASSERT (dn >= 0);
54
24.2k
  ASSERT (dn == 0 || dp[dn - 1] != 0);
55
24.2k
  ASSERT (! MPN_OVERLAP_P (qp, nn - dn + 1 + qxn, np, nn));
56
24.2k
  ASSERT (! MPN_OVERLAP_P (qp, nn - dn + 1 + qxn, dp, dn));
57
58
24.2k
  switch (dn)
59
24.2k
    {
60
0
    case 0:
61
0
      DIVIDE_BY_ZERO;
62
63
1.08k
    case 1:
64
1.08k
      {
65
1.08k
  rp[0] = mpn_divrem_1 (qp, (mp_size_t) 0, np, nn, dp[0]);
66
1.08k
  return;
67
0
      }
68
69
420
    case 2:
70
420
      {
71
420
  mp_ptr n2p;
72
420
  mp_limb_t qhl, cy;
73
420
  TMP_DECL;
74
420
  TMP_MARK;
75
420
  if ((dp[1] & GMP_NUMB_HIGHBIT) == 0)
76
389
    {
77
389
      int cnt;
78
389
      mp_limb_t d2p[2];
79
389
      count_leading_zeros (cnt, dp[1]);
80
389
      cnt -= GMP_NAIL_BITS;
81
389
      d2p[1] = (dp[1] << cnt) | (dp[0] >> (GMP_NUMB_BITS - cnt));
82
389
      d2p[0] = (dp[0] << cnt) & GMP_NUMB_MASK;
83
389
      n2p = TMP_ALLOC_LIMBS (nn + 1);
84
389
      cy = mpn_lshift (n2p, np, nn, cnt);
85
389
      n2p[nn] = cy;
86
389
      qhl = mpn_divrem_2 (qp, 0L, n2p, nn + (cy != 0), d2p);
87
389
      if (cy == 0)
88
125
        qp[nn - 2] = qhl; /* always store nn-2+1 quotient limbs */
89
389
      rp[0] = (n2p[0] >> cnt)
90
389
        | ((n2p[1] << (GMP_NUMB_BITS - cnt)) & GMP_NUMB_MASK);
91
389
      rp[1] = (n2p[1] >> cnt);
92
389
    }
93
31
  else
94
31
    {
95
31
      n2p = TMP_ALLOC_LIMBS (nn);
96
31
      MPN_COPY (n2p, np, nn);
97
31
      qhl = mpn_divrem_2 (qp, 0L, n2p, nn, dp);
98
31
      qp[nn - 2] = qhl; /* always store nn-2+1 quotient limbs */
99
31
      rp[0] = n2p[0];
100
31
      rp[1] = n2p[1];
101
31
    }
102
420
  TMP_FREE;
103
420
  return;
104
420
      }
105
106
22.7k
    default:
107
22.7k
      {
108
22.7k
  int adjust;
109
22.7k
  gmp_pi1_t dinv;
110
22.7k
  TMP_DECL;
111
22.7k
  TMP_MARK;
112
22.7k
  adjust = np[nn - 1] >= dp[dn - 1];  /* conservative tests for quotient size */
113
22.7k
  if (nn + adjust >= 2 * dn)
114
17.1k
    {
115
17.1k
      mp_ptr n2p, d2p;
116
17.1k
      mp_limb_t cy;
117
17.1k
      int cnt;
118
119
17.1k
      qp[nn - dn] = 0;        /* zero high quotient limb */
120
17.1k
      if ((dp[dn - 1] & GMP_NUMB_HIGHBIT) == 0) /* normalize divisor */
121
16.6k
        {
122
16.6k
    count_leading_zeros (cnt, dp[dn - 1]);
123
16.6k
    cnt -= GMP_NAIL_BITS;
124
16.6k
    d2p = TMP_ALLOC_LIMBS (dn);
125
16.6k
    mpn_lshift (d2p, dp, dn, cnt);
126
16.6k
    n2p = TMP_ALLOC_LIMBS (nn + 1);
127
16.6k
    cy = mpn_lshift (n2p, np, nn, cnt);
128
16.6k
    n2p[nn] = cy;
129
16.6k
    nn += adjust;
130
16.6k
        }
131
458
      else
132
458
        {
133
458
    cnt = 0;
134
458
    d2p = (mp_ptr) dp;
135
458
    n2p = TMP_ALLOC_LIMBS (nn + 1);
136
458
    MPN_COPY (n2p, np, nn);
137
458
    n2p[nn] = 0;
138
458
    nn += adjust;
139
458
        }
140
141
17.1k
      invert_pi1 (dinv, d2p[dn - 1], d2p[dn - 2]);
142
17.1k
      if (BELOW_THRESHOLD (dn, DC_DIV_QR_THRESHOLD))
143
16.0k
        mpn_sbpi1_div_qr (qp, n2p, nn, d2p, dn, dinv.inv32);
144
1.11k
      else if (BELOW_THRESHOLD (dn, MUPI_DIV_QR_THRESHOLD) ||   /* fast condition */
145
1.11k
         BELOW_THRESHOLD (nn, 2 * MU_DIV_QR_THRESHOLD) || /* fast condition */
146
1.11k
         (double) (2 * (MU_DIV_QR_THRESHOLD - MUPI_DIV_QR_THRESHOLD)) * dn /* slow... */
147
0
         + (double) MUPI_DIV_QR_THRESHOLD * nn > (double) dn * nn)    /* ...condition */
148
1.11k
        mpn_dcpi1_div_qr (qp, n2p, nn, d2p, dn, &dinv);
149
0
      else
150
0
        {
151
0
    mp_size_t itch = mpn_mu_div_qr_itch (nn, dn, 0);
152
0
    mp_ptr scratch = TMP_ALLOC_LIMBS (itch);
153
0
    mpn_mu_div_qr (qp, rp, n2p, nn, d2p, dn, scratch);
154
0
    n2p = rp;
155
0
        }
156
157
17.1k
      if (cnt != 0)
158
16.6k
        mpn_rshift (rp, n2p, dn, cnt);
159
458
      else
160
458
        MPN_COPY (rp, n2p, dn);
161
17.1k
      TMP_FREE;
162
17.1k
      return;
163
17.1k
    }
164
165
  /* When we come here, the numerator/partial remainder is less
166
     than twice the size of the denominator.  */
167
168
5.62k
    {
169
      /* Problem:
170
171
         Divide a numerator N with nn limbs by a denominator D with dn
172
         limbs forming a quotient of qn=nn-dn+1 limbs.  When qn is small
173
         compared to dn, conventional division algorithms perform poorly.
174
         We want an algorithm that has an expected running time that is
175
         dependent only on qn.
176
177
         Algorithm (very informally stated):
178
179
         1) Divide the 2 x qn most significant limbs from the numerator
180
      by the qn most significant limbs from the denominator.  Call
181
      the result qest.  This is either the correct quotient, but
182
      might be 1 or 2 too large.  Compute the remainder from the
183
      division.  (This step is implemented by an mpn_divrem call.)
184
185
         2) Is the most significant limb from the remainder < p, where p
186
      is the product of the most significant limb from the quotient
187
      and the next(d)?  (Next(d) denotes the next ignored limb from
188
      the denominator.)  If it is, decrement qest, and adjust the
189
      remainder accordingly.
190
191
         3) Is the remainder >= qest?  If it is, qest is the desired
192
      quotient.  The algorithm terminates.
193
194
         4) Subtract qest x next(d) from the remainder.  If there is
195
      borrow out, decrement qest, and adjust the remainder
196
      accordingly.
197
198
         5) Skip one word from the denominator (i.e., let next(d) denote
199
      the next less significant limb.  */
200
201
5.62k
      mp_size_t qn;
202
5.62k
      mp_ptr n2p, d2p;
203
5.62k
      mp_ptr tp;
204
5.62k
      mp_limb_t cy;
205
5.62k
      mp_size_t in, rn;
206
5.62k
      mp_limb_t quotient_too_large;
207
5.62k
      unsigned int cnt;
208
209
5.62k
      qn = nn - dn;
210
5.62k
      qp[qn] = 0;       /* zero high quotient limb */
211
5.62k
      qn += adjust;     /* qn cannot become bigger */
212
213
5.62k
      if (qn == 0)
214
13
        {
215
13
    MPN_COPY (rp, np, dn);
216
13
    TMP_FREE;
217
13
    return;
218
13
        }
219
220
5.61k
      in = dn - qn;   /* (at least partially) ignored # of limbs in ops */
221
      /* Normalize denominator by shifting it to the left such that its
222
         most significant bit is set.  Then shift the numerator the same
223
         amount, to mathematically preserve quotient.  */
224
5.61k
      if ((dp[dn - 1] & GMP_NUMB_HIGHBIT) == 0)
225
4.92k
        {
226
4.92k
    count_leading_zeros (cnt, dp[dn - 1]);
227
4.92k
    cnt -= GMP_NAIL_BITS;
228
229
4.92k
    d2p = TMP_ALLOC_LIMBS (qn);
230
4.92k
    mpn_lshift (d2p, dp + in, qn, cnt);
231
4.92k
    d2p[0] |= dp[in - 1] >> (GMP_NUMB_BITS - cnt);
232
233
4.92k
    n2p = TMP_ALLOC_LIMBS (2 * qn + 1);
234
4.92k
    cy = mpn_lshift (n2p, np + nn - 2 * qn, 2 * qn, cnt);
235
4.92k
    if (adjust)
236
2.35k
      {
237
2.35k
        n2p[2 * qn] = cy;
238
2.35k
        n2p++;
239
2.35k
      }
240
2.56k
    else
241
2.56k
      {
242
2.56k
        n2p[0] |= np[nn - 2 * qn - 1] >> (GMP_NUMB_BITS - cnt);
243
2.56k
      }
244
4.92k
        }
245
689
      else
246
689
        {
247
689
    cnt = 0;
248
689
    d2p = (mp_ptr) dp + in;
249
250
689
    n2p = TMP_ALLOC_LIMBS (2 * qn + 1);
251
689
    MPN_COPY (n2p, np + nn - 2 * qn, 2 * qn);
252
689
    if (adjust)
253
18
      {
254
18
        n2p[2 * qn] = 0;
255
18
        n2p++;
256
18
      }
257
689
        }
258
259
      /* Get an approximate quotient using the extracted operands.  */
260
5.61k
      if (qn == 1)
261
1.11k
        {
262
1.11k
    mp_limb_t q0, r0;
263
1.11k
    udiv_qrnnd (q0, r0, n2p[1], n2p[0] << GMP_NAIL_BITS, d2p[0] << GMP_NAIL_BITS);
264
1.11k
    n2p[0] = r0 >> GMP_NAIL_BITS;
265
1.11k
    qp[0] = q0;
266
1.11k
        }
267
4.49k
      else if (qn == 2)
268
2.02k
        mpn_divrem_2 (qp, 0L, n2p, 4L, d2p); /* FIXME: obsolete function */
269
2.46k
      else
270
2.46k
        {
271
2.46k
    invert_pi1 (dinv, d2p[qn - 1], d2p[qn - 2]);
272
2.46k
    if (BELOW_THRESHOLD (qn, DC_DIV_QR_THRESHOLD))
273
2.28k
      mpn_sbpi1_div_qr (qp, n2p, 2 * qn, d2p, qn, dinv.inv32);
274
180
    else if (BELOW_THRESHOLD (qn, MU_DIV_QR_THRESHOLD))
275
180
      mpn_dcpi1_div_qr (qp, n2p, 2 * qn, d2p, qn, &dinv);
276
0
    else
277
0
      {
278
0
        mp_size_t itch = mpn_mu_div_qr_itch (2 * qn, qn, 0);
279
0
        mp_ptr scratch = TMP_ALLOC_LIMBS (itch);
280
0
        mp_ptr r2p = rp;
281
0
        if (np == r2p) /* If N and R share space, put ... */
282
0
          r2p += nn - qn; /* intermediate remainder at N's upper end. */
283
0
        mpn_mu_div_qr (qp, r2p, n2p, 2 * qn, d2p, qn, scratch);
284
0
        MPN_COPY (n2p, r2p, qn);
285
0
      }
286
2.46k
        }
287
288
5.61k
      rn = qn;
289
      /* Multiply the first ignored divisor limb by the most significant
290
         quotient limb.  If that product is > the partial remainder's
291
         most significant limb, we know the quotient is too large.  This
292
         test quickly catches most cases where the quotient is too large;
293
         it catches all cases where the quotient is 2 too large.  */
294
5.61k
      {
295
5.61k
        mp_limb_t dl, x;
296
5.61k
        mp_limb_t h, dummy;
297
298
5.61k
        if (in - 2 < 0)
299
333
    dl = 0;
300
5.27k
        else
301
5.27k
    dl = dp[in - 2];
302
303
5.61k
#if GMP_NAIL_BITS == 0
304
5.61k
        x = (dp[in - 1] << cnt) | ((dl >> 1) >> ((~cnt) % GMP_LIMB_BITS));
305
#else
306
        x = (dp[in - 1] << cnt) & GMP_NUMB_MASK;
307
        if (cnt != 0)
308
    x |= dl >> (GMP_NUMB_BITS - cnt);
309
#endif
310
5.61k
        umul_ppmm (h, dummy, x, qp[qn - 1] << GMP_NAIL_BITS);
311
312
5.61k
        if (n2p[qn - 1] < h)
313
334
    {
314
334
      mp_limb_t cy;
315
316
334
      mpn_decr_u (qp, (mp_limb_t) 1);
317
334
      cy = mpn_add_n (n2p, n2p, d2p, qn);
318
334
      if (cy)
319
64
        {
320
          /* The partial remainder is safely large.  */
321
64
          n2p[qn] = cy;
322
64
          ++rn;
323
64
        }
324
334
    }
325
5.61k
      }
326
327
5.61k
      quotient_too_large = 0;
328
5.61k
      if (cnt != 0)
329
4.92k
        {
330
4.92k
    mp_limb_t cy1, cy2;
331
332
    /* Append partially used numerator limb to partial remainder.  */
333
4.92k
    cy1 = mpn_lshift (n2p, n2p, rn, GMP_NUMB_BITS - cnt);
334
4.92k
    n2p[0] |= np[in - 1] & (GMP_NUMB_MASK >> cnt);
335
336
    /* Update partial remainder with partially used divisor limb.  */
337
4.92k
    cy2 = mpn_submul_1 (n2p, qp, qn, dp[in - 1] & (GMP_NUMB_MASK >> cnt));
338
4.92k
    if (qn != rn)
339
51
      {
340
51
        ASSERT_ALWAYS (n2p[qn] >= cy2);
341
51
        n2p[qn] -= cy2;
342
51
      }
343
4.87k
    else
344
4.87k
      {
345
4.87k
        n2p[qn] = cy1 - cy2; /* & GMP_NUMB_MASK; */
346
347
4.87k
        quotient_too_large = (cy1 < cy2);
348
4.87k
        ++rn;
349
4.87k
      }
350
4.92k
    --in;
351
4.92k
        }
352
      /* True: partial remainder now is neutral, i.e., it is not shifted up.  */
353
354
5.61k
      tp = TMP_ALLOC_LIMBS (dn);
355
356
5.61k
      if (in < qn)
357
789
        {
358
789
    if (in == 0)
359
236
      {
360
236
        MPN_COPY (rp, n2p, rn);
361
236
        ASSERT_ALWAYS (rn == dn);
362
236
        goto foo;
363
236
      }
364
553
    mpn_mul (tp, qp, qn, dp, in);
365
553
        }
366
4.82k
      else
367
4.82k
        mpn_mul (tp, dp, in, qp, qn);
368
369
5.37k
      cy = mpn_sub (n2p, n2p, rn, tp + in, qn);
370
5.37k
      MPN_COPY (rp + in, n2p, dn - in);
371
5.37k
      quotient_too_large |= cy;
372
5.37k
      cy = mpn_sub_n (rp, np, tp, in);
373
5.37k
      cy = mpn_sub_1 (rp + in, rp + in, rn, cy);
374
5.37k
      quotient_too_large |= cy;
375
5.61k
    foo:
376
5.61k
      if (quotient_too_large)
377
403
        {
378
403
    mpn_decr_u (qp, (mp_limb_t) 1);
379
403
    mpn_add_n (rp, rp, dp, dn);
380
403
        }
381
5.61k
    }
382
5.61k
  TMP_FREE;
383
5.61k
  return;
384
5.37k
      }
385
24.2k
    }
386
24.2k
}