Blame mpn/generic/remove.c

Packit 5c3484
/* mpn_remove -- divide out all multiples of odd mpn number from another mpn
Packit 5c3484
   number.
Packit 5c3484
Packit 5c3484
   Contributed to the GNU project by Torbjorn Granlund.
Packit 5c3484
Packit 5c3484
   THE FUNCTION IN THIS FILE IS INTERNAL WITH A MUTABLE INTERFACE.  IT IS ONLY
Packit 5c3484
   SAFE TO REACH IT THROUGH DOCUMENTED INTERFACES.  IN FACT, IT IS ALMOST
Packit 5c3484
   GUARANTEED THAT IT WILL CHANGE OR DISAPPEAR IN A FUTURE GMP RELEASE.
Packit 5c3484
Packit 5c3484
Copyright 2009, 2012-2014 Free Software Foundation, Inc.
Packit 5c3484
Packit 5c3484
This file is part of the GNU MP Library.
Packit 5c3484
Packit 5c3484
The GNU MP Library is free software; you can redistribute it and/or modify
Packit 5c3484
it under the terms of either:
Packit 5c3484
Packit 5c3484
  * the GNU Lesser General Public License as published by the Free
Packit 5c3484
    Software Foundation; either version 3 of the License, or (at your
Packit 5c3484
    option) any later version.
Packit 5c3484
Packit 5c3484
or
Packit 5c3484
Packit 5c3484
  * the GNU General Public License as published by the Free Software
Packit 5c3484
    Foundation; either version 2 of the License, or (at your option) any
Packit 5c3484
    later version.
Packit 5c3484
Packit 5c3484
or both in parallel, as here.
Packit 5c3484
Packit 5c3484
The GNU MP Library is distributed in the hope that it will be useful, but
Packit 5c3484
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
Packit 5c3484
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
Packit 5c3484
for more details.
Packit 5c3484
Packit 5c3484
You should have received copies of the GNU General Public License and the
Packit 5c3484
GNU Lesser General Public License along with the GNU MP Library.  If not,
Packit 5c3484
see https://www.gnu.org/licenses/.  */
Packit 5c3484
Packit 5c3484
#include "gmp.h"
Packit 5c3484
#include "gmp-impl.h"
Packit 5c3484
Packit 5c3484
/* LOG dimensions the tables of stored powers (pwpsp/pwpsn) in mpn_remove and
   is the slack added to its powers-of-V allocation.  It equals the limb width
   in bits, except that it is never larger than 50.  */
#if GMP_LIMB_BITS <= 50
#define LOG GMP_LIMB_BITS
#else
#define LOG 50
#endif
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Input: U = {up,un}, V = {vp,vn} must be odd, cap
Packit 5c3484
   Output: W = {wp,*wn}; allocation need is exactly *wn
Packit 5c3484
Packit 5c3484
   Set W = U / V^k, where k is the largest integer <= cap such that the
Packit 5c3484
   division yields an integer.
Packit 5c3484
Packit 5c3484
   FIXME: We currently allow any operand overlap.  This is quite non mpn-ish
Packit 5c3484
   and might be changed, since it costs significant temporary space.
Packit 5c3484
   * If we require W to have space for un + 1 limbs, we could save qp or qp2
Packit 5c3484
     (but we will still need to copy things into wp 50% of the time).
Packit 5c3484
   * If we allow ourselves to clobber U, we could save the other of qp and qp2,
Packit 5c3484
     and the initial COPY (but also here we would need un + 1 limbs).
Packit 5c3484
*/
Packit 5c3484
Packit 5c3484
/* FIXME: We need to wrap mpn_bdiv_qr due to the itch interface.  This need
Packit 5c3484
   indicates a flaw in the current itch mechanism: Which operands not greater
Packit 5c3484
   than un,un will incur the worst itch?  We need a parallel foo_maxitch set
Packit 5c3484
   of functions.  */
Packit 5c3484
static void
Packit 5c3484
mpn_bdiv_qr_wrap (mp_ptr qp, mp_ptr rp,
Packit 5c3484
		  mp_srcptr np, mp_size_t nn,
Packit 5c3484
		  mp_srcptr dp, mp_size_t dn)
Packit 5c3484
{
Packit 5c3484
  mp_ptr scratch_out;
Packit 5c3484
  TMP_DECL;
Packit 5c3484
Packit 5c3484
  TMP_MARK;
Packit 5c3484
  scratch_out = TMP_ALLOC_LIMBS (mpn_bdiv_qr_itch (nn, dn));
Packit 5c3484
  mpn_bdiv_qr (qp, rp, np, nn, dp, dn, scratch_out);
Packit 5c3484
Packit 5c3484
  TMP_FREE;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
mp_bitcnt_t
Packit 5c3484
mpn_remove (mp_ptr wp, mp_size_t *wn,
Packit 5c3484
	    mp_srcptr up, mp_size_t un, mp_srcptr vp, mp_size_t vn,
Packit 5c3484
	    mp_bitcnt_t cap)
Packit 5c3484
{
Packit 5c3484
  mp_srcptr pwpsp[LOG];
Packit 5c3484
  mp_size_t pwpsn[LOG];
Packit 5c3484
  mp_size_t npowers;
Packit 5c3484
  mp_ptr tp, qp, np, qp2;
Packit 5c3484
  mp_srcptr pp;
Packit 5c3484
  mp_size_t pn, nn, qn, i;
Packit 5c3484
  mp_bitcnt_t pwr;
Packit 5c3484
  TMP_DECL;
Packit 5c3484
Packit 5c3484
  ASSERT (un > 0);
Packit 5c3484
  ASSERT (vn > 0);
Packit 5c3484
  ASSERT (vp[0] % 2 != 0);	/* 2-adic division wants odd numbers */
Packit 5c3484
  ASSERT (vn > 1 || vp[0] > 1);	/* else we would loop indefinitely */
Packit 5c3484
Packit 5c3484
  TMP_MARK;
Packit 5c3484
Packit 5c3484
  TMP_ALLOC_LIMBS_3 (qp, un + 1,	/* quotient, alternating */
Packit 5c3484
		     qp2, un + 1,	/* quotient, alternating */
Packit 5c3484
		     tp, (un + 1 + vn) / 2); /* remainder */
Packit 5c3484
  pp = vp;
Packit 5c3484
  pn = vn;
Packit 5c3484
Packit 5c3484
  MPN_COPY (qp, up, un);
Packit 5c3484
  qn = un;
Packit 5c3484
Packit 5c3484
  npowers = 0;
Packit 5c3484
  while (qn >= pn)
Packit 5c3484
    {
Packit 5c3484
      qp[qn] = 0;
Packit 5c3484
      mpn_bdiv_qr_wrap (qp2, tp, qp, qn + 1, pp, pn);
Packit 5c3484
      if (!mpn_zero_p (tp, pn))
Packit 5c3484
	break;			/* could not divide by V^npowers */
Packit 5c3484
Packit 5c3484
      MP_PTR_SWAP (qp, qp2);
Packit 5c3484
      qn = qn - pn;
Packit 5c3484
      qn += qp[qn] != 0;
Packit 5c3484
Packit 5c3484
      pwpsp[npowers] = pp;
Packit 5c3484
      pwpsn[npowers] = pn;
Packit 5c3484
      ++npowers;
Packit 5c3484
Packit 5c3484
      if (((mp_bitcnt_t) 2 << npowers) - 1 > cap)
Packit 5c3484
	break;
Packit 5c3484
Packit 5c3484
      nn = 2 * pn - 1;		/* next power will be at least this large */
Packit 5c3484
      if (nn > qn)
Packit 5c3484
	break;			/* next power would be overlarge */
Packit 5c3484
Packit 5c3484
      if (npowers == 1)		/* Alloc once, but only if it's needed */
Packit 5c3484
	np = TMP_ALLOC_LIMBS (qn + LOG);	/* powers of V */
Packit 5c3484
      else
Packit 5c3484
	np += pn;
Packit 5c3484
Packit 5c3484
      mpn_sqr (np, pp, pn);
Packit 5c3484
      pn = nn + (np[nn] != 0);
Packit 5c3484
      pp = np;
Packit 5c3484
    }
Packit 5c3484
Packit 5c3484
  pwr = ((mp_bitcnt_t) 1 << npowers) - 1;
Packit 5c3484
Packit 5c3484
  for (i = npowers; --i >= 0;)
Packit 5c3484
    {
Packit 5c3484
      pn = pwpsn[i];
Packit 5c3484
      if (qn < pn)
Packit 5c3484
	continue;
Packit 5c3484
Packit 5c3484
      if (pwr + ((mp_bitcnt_t) 1 << i) > cap)
Packit 5c3484
	continue;		/* V^i would bring us past cap */
Packit 5c3484
Packit 5c3484
      qp[qn] = 0;
Packit 5c3484
      mpn_bdiv_qr_wrap (qp2, tp, qp, qn + 1, pwpsp[i], pn);
Packit 5c3484
      if (!mpn_zero_p (tp, pn))
Packit 5c3484
	continue;		/* could not divide by V^i */
Packit 5c3484
Packit 5c3484
      MP_PTR_SWAP (qp, qp2);
Packit 5c3484
      qn = qn - pn;
Packit 5c3484
      qn += qp[qn] != 0;
Packit 5c3484
Packit 5c3484
      pwr += (mp_bitcnt_t) 1 << i;
Packit 5c3484
    }
Packit 5c3484
Packit 5c3484
  MPN_COPY (wp, qp, qn);
Packit 5c3484
  *wn = qn;
Packit 5c3484
Packit 5c3484
  TMP_FREE;
Packit 5c3484
Packit 5c3484
  return pwr;
Packit 5c3484
}