Blame mpn/generic/sbpi1_bdiv_q.c

Packit 5c3484
/* mpn_sbpi1_bdiv_q -- schoolbook Hensel division with precomputed inverse,
Packit 5c3484
   returning quotient only.
Packit 5c3484
Packit 5c3484
   Contributed to the GNU project by Niels Möller.
Packit 5c3484
Packit 5c3484
   THE FUNCTIONS IN THIS FILE ARE INTERNAL FUNCTIONS WITH MUTABLE INTERFACES.
Packit 5c3484
   IT IS ONLY SAFE TO REACH THEM THROUGH DOCUMENTED INTERFACES.  IN FACT, IT IS
Packit 5c3484
   ALMOST GUARANTEED THAT THEY'LL CHANGE OR DISAPPEAR IN A FUTURE GMP RELEASE.
Packit 5c3484
Packit 5c3484
Copyright 2005, 2006, 2009, 2011, 2012 Free Software Foundation, Inc.
Packit 5c3484
Packit 5c3484
This file is part of the GNU MP Library.
Packit 5c3484
Packit 5c3484
The GNU MP Library is free software; you can redistribute it and/or modify
Packit 5c3484
it under the terms of either:
Packit 5c3484
Packit 5c3484
  * the GNU Lesser General Public License as published by the Free
Packit 5c3484
    Software Foundation; either version 3 of the License, or (at your
Packit 5c3484
    option) any later version.
Packit 5c3484
Packit 5c3484
or
Packit 5c3484
Packit 5c3484
  * the GNU General Public License as published by the Free Software
Packit 5c3484
    Foundation; either version 2 of the License, or (at your option) any
Packit 5c3484
    later version.
Packit 5c3484
Packit 5c3484
or both in parallel, as here.
Packit 5c3484
Packit 5c3484
The GNU MP Library is distributed in the hope that it will be useful, but
Packit 5c3484
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
Packit 5c3484
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
Packit 5c3484
for more details.
Packit 5c3484
Packit 5c3484
You should have received copies of the GNU General Public License and the
Packit 5c3484
GNU Lesser General Public License along with the GNU MP Library.  If not,
Packit 5c3484
see https://www.gnu.org/licenses/.  */
Packit 5c3484
Packit 5c3484
#include "gmp.h"
Packit 5c3484
#include "gmp-impl.h"
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Computes Q = N / D mod B^nn, destroys N.
Packit 5c3484
Packit 5c3484
   D must be odd. dinv is (-D)^-1 mod B.
Packit 5c3484
Packit 5c3484
Packit 5c3484
   The straightforward way to compute Q is to cancel one limb at a time, using
Packit 5c3484
Packit 5c3484
     qp[i] = D^{-1} * np[i] (mod B)
Packit 5c3484
     N -= B^i * qp[i] * D
Packit 5c3484
Packit 5c3484
   But we prefer addition to subtraction, since mpn_addmul_1 is often faster
Packit 5c3484
   than mpn_submul_1.  Q = - N / D can be computed by iterating
Packit 5c3484
Packit 5c3484
     qp[i] = (-D)^{-1} * np[i] (mod B)
Packit 5c3484
     N += B^i * qp[i] * D
Packit 5c3484
Packit 5c3484
   And then we flip the sign, -Q = (not Q) + 1. */
Packit 5c3484
Packit 5c3484
void
Packit 5c3484
mpn_sbpi1_bdiv_q (mp_ptr qp,
Packit 5c3484
		  mp_ptr np, mp_size_t nn,
Packit 5c3484
		  mp_srcptr dp, mp_size_t dn,
Packit 5c3484
		  mp_limb_t dinv)
Packit 5c3484
{
Packit 5c3484
  mp_size_t i;
Packit 5c3484
  mp_limb_t cy, q;
Packit 5c3484
Packit 5c3484
  ASSERT (dn > 0);
Packit 5c3484
  ASSERT (nn >= dn);
Packit 5c3484
  ASSERT ((dp[0] & 1) != 0);
Packit 5c3484
  /* FIXME: Add ASSERTs for allowable overlapping; i.e., that qp = np is OK,
Packit 5c3484
     but some over N/Q overlaps will not work.  */
Packit 5c3484
Packit 5c3484
  for (i = nn - dn; i > 0; i--)
Packit 5c3484
    {
Packit 5c3484
      q = dinv * np[0];
Packit 5c3484
      cy = mpn_addmul_1 (np, dp, dn, q);
Packit 5c3484
      mpn_add_1 (np + dn, np + dn, i, cy);
Packit 5c3484
      ASSERT (np[0] == 0);
Packit 5c3484
      qp[0] = ~q;
Packit 5c3484
      qp++;
Packit 5c3484
      np++;
Packit 5c3484
    }
Packit 5c3484
Packit 5c3484
  for (i = dn; i > 1; i--)
Packit 5c3484
    {
Packit 5c3484
      q = dinv * np[0];
Packit 5c3484
      mpn_addmul_1 (np, dp, i, q);
Packit 5c3484
      ASSERT (np[0] == 0);
Packit 5c3484
      qp[0] = ~q;
Packit 5c3484
      qp++;
Packit 5c3484
      np++;
Packit 5c3484
    }
Packit 5c3484
Packit 5c3484
  /* Final limb */
Packit 5c3484
  q = dinv * np[0];
Packit 5c3484
  qp[0] = ~q;
Packit 5c3484
  mpn_add_1 (qp - nn + 1, qp - nn + 1, nn, 1);
Packit 5c3484
}