Blame mpn/generic/sbpi1_bdiv_qr.c

/* mpn_sbpi1_bdiv_qr -- schoolbook Hensel division with precomputed inverse,
   returning quotient and remainder.

   Contributed to the GNU project by Niels Möller.

   THE FUNCTIONS IN THIS FILE ARE INTERNAL FUNCTIONS WITH MUTABLE INTERFACES.
   IT IS ONLY SAFE TO REACH THEM THROUGH DOCUMENTED INTERFACES.  IN FACT, IT IS
   ALMOST GUARANTEED THAT THEY'LL CHANGE OR DISAPPEAR IN A FUTURE GMP RELEASE.

Copyright 2006, 2009, 2011, 2012 Free Software Foundation, Inc.

This file is part of the GNU MP Library.

The GNU MP Library is free software; you can redistribute it and/or modify
it under the terms of either:

  * the GNU Lesser General Public License as published by the Free
    Software Foundation; either version 3 of the License, or (at your
    option) any later version.

or

  * the GNU General Public License as published by the Free Software
    Foundation; either version 2 of the License, or (at your option) any
    later version.

or both in parallel, as here.

The GNU MP Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received copies of the GNU General Public License and the
GNU Lesser General Public License along with the GNU MP Library.  If not,
see https://www.gnu.org/licenses/.  */

#include "gmp.h"
Packit 5c3484
#include "gmp-impl.h"
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Computes a binary quotient of size qn = nn - dn.
Packit 5c3484
   Output:
Packit 5c3484
Packit 5c3484
      Q = N * D^{-1} mod B^qn,
Packit 5c3484
Packit 5c3484
      R = (N - Q * D) * B^(-qn)
Packit 5c3484
Packit 5c3484
   Stores the dn least significant limbs of R at {np + nn - dn, dn},
Packit 5c3484
   and returns the borrow from the subtraction N - Q*D.
Packit 5c3484
Packit 5c3484
   D must be odd. dinv is (-D)^-1 mod B. */
Packit 5c3484
Packit 5c3484
mp_limb_t
Packit 5c3484
mpn_sbpi1_bdiv_qr (mp_ptr qp,
Packit 5c3484
		   mp_ptr np, mp_size_t nn,
Packit 5c3484
		   mp_srcptr dp, mp_size_t dn, mp_limb_t dinv)
Packit 5c3484
{
Packit 5c3484
  mp_size_t qn;
Packit 5c3484
  mp_size_t i;
Packit 5c3484
  mp_limb_t rh;
Packit 5c3484
  mp_limb_t ql;
Packit 5c3484
Packit 5c3484
  ASSERT (dn > 0);
Packit 5c3484
  ASSERT (nn > dn);
Packit 5c3484
  ASSERT ((dp[0] & 1) != 0);
Packit 5c3484
  /* FIXME: Add ASSERTs for allowable overlapping; i.e., that qp = np is OK,
Packit 5c3484
     but some over N/Q overlaps will not work.  */
Packit 5c3484
Packit 5c3484
  qn = nn - dn;
Packit 5c3484
Packit 5c3484
  rh = 0;
Packit 5c3484
Packit 5c3484
  /* To complete the negation, this value is added to q. */
Packit 5c3484
  ql = 1;
Packit 5c3484
  while (qn > dn)
Packit 5c3484
    {
Packit 5c3484
      for (i = 0; i < dn; i++)
Packit 5c3484
	{
Packit 5c3484
	  mp_limb_t q;
Packit 5c3484
Packit 5c3484
	  q = dinv * np[i];
Packit 5c3484
	  np[i] = mpn_addmul_1 (np + i, dp, dn, q);
Packit 5c3484
	  qp[i] = ~q;
Packit 5c3484
	}
Packit 5c3484
      rh += mpn_add (np + dn, np + dn, qn, np, dn);
Packit 5c3484
      ql = mpn_add_1 (qp, qp, dn, ql);
Packit 5c3484
Packit 5c3484
      qp += dn; qn -= dn;
Packit 5c3484
      np += dn; nn -= dn;
Packit 5c3484
    }
Packit 5c3484
Packit 5c3484
  for (i = 0; i < qn; i++)
Packit 5c3484
    {
Packit 5c3484
      mp_limb_t q;
Packit 5c3484
Packit 5c3484
      q = dinv * np[i];
Packit 5c3484
      np[i] = mpn_addmul_1 (np + i, dp, dn, q);
Packit 5c3484
      qp[i] = ~q;
Packit 5c3484
    }
Packit 5c3484
Packit 5c3484
  rh += mpn_add_n (np + dn, np + dn, np, qn);
Packit 5c3484
  ql = mpn_add_1 (qp, qp, qn, ql);
Packit 5c3484
Packit 5c3484
  if (UNLIKELY (ql > 0))
Packit 5c3484
    {
Packit 5c3484
      /* q == 0 */
Packit 5c3484
      ASSERT (rh == 0);
Packit 5c3484
      return 0;
Packit 5c3484
    }
Packit 5c3484
  else
Packit 5c3484
    {
Packit 5c3484
      mp_limb_t cy;
Packit 5c3484
Packit 5c3484
      cy = mpn_sub_n (np + qn, np + qn, dp, dn);
Packit 5c3484
      ASSERT (cy >= rh);
Packit 5c3484
      return cy - rh;
Packit 5c3484
    }
Packit 5c3484
}