mpn/generic/tdiv_qr.c - gmp - Git at Google

 /* mpn_tdiv_qr -- Divide the numerator (np,nn) by the denominator (dp,dn) and
    write the nn-dn+1 quotient limbs at qp and the dn remainder limbs at rp.  If
    qxn is non-zero, generate that many fraction limbs and append them after the
    other quotient limbs, and update the remainder accordingly.  The input
    operands are unaffected.

    Preconditions:
    1. The most significant limb of the divisor must be non-zero.
    2. nn >= dn, even if qxn is non-zero.  (??? relax this ???)

    The time complexity of this is O(qn*qn+M(dn,qn)), where M(m,n) is the time
    complexity of multiplication.

 Copyright 1997, 2000-2002, 2005, 2009, 2015 Free Software Foundation, Inc.

 This file is part of the GNU MP Library.

 The GNU MP Library is free software; you can redistribute it and/or modify
 it under the terms of either:

   * the GNU Lesser General Public License as published by the Free
     Software Foundation; either version 3 of the License, or (at your
     option) any later version.

 or

   * the GNU General Public License as published by the Free Software
     Foundation; either version 2 of the License, or (at your option) any
     later version.

 or both in parallel, as here.

 The GNU MP Library is distributed in the hope that it will be useful, but
 WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
 or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 for more details.

 You should have received copies of the GNU General Public License and the
 GNU Lesser General Public License along with the GNU MP Library.  If not,
 see https://www.gnu.org/licenses/.  */

 #include "gmp-impl.h"
 #include "longlong.h"


 void
 mpn_tdiv_qr (mp_ptr qp, mp_ptr rp, mp_size_t qxn,
 	     mp_srcptr np, mp_size_t nn, mp_srcptr dp, mp_size_t dn)
 {
   ASSERT_ALWAYS (qxn == 0);

   ASSERT (nn >= 0);
   ASSERT (dn >= 0);
   ASSERT (dn == 0 || dp[dn - 1] != 0);
   ASSERT (! MPN_OVERLAP_P (qp, nn - dn + 1 + qxn, np, nn));
   ASSERT (! MPN_OVERLAP_P (qp, nn - dn + 1 + qxn, dp, dn));

   switch (dn)
     {
     case 0:
       DIVIDE_BY_ZERO;

     case 1:
       {
 	rp[0] = mpn_divrem_1 (qp, (mp_size_t) 0, np, nn, dp[0]);
 	return;
       }

     case 2:
       {
 	mp_ptr n2p;
 	mp_limb_t qhl, cy;
 	TMP_DECL;
 	TMP_MARK;
 	if ((dp[1] & GMP_NUMB_HIGHBIT) == 0)
 	  {
 	    int cnt;
 	    mp_limb_t d2p[2];
 	    count_leading_zeros (cnt, dp[1]);
 	    cnt -= GMP_NAIL_BITS;
 	    d2p[1] = (dp[1] << cnt) | (dp[0] >> (GMP_NUMB_BITS - cnt));
 	    d2p[0] = (dp[0] << cnt) & GMP_NUMB_MASK;
 	    n2p = TMP_ALLOC_LIMBS (nn + 1);
 	    cy = mpn_lshift (n2p, np, nn, cnt);
 	    n2p[nn] = cy;
 	    qhl = mpn_divrem_2 (qp, 0L, n2p, nn + (cy != 0), d2p);
 	    if (cy == 0)
 	      qp[nn - 2] = qhl;	/* always store nn-2+1 quotient limbs */
 	    rp[0] = (n2p[0] >> cnt)
 	      | ((n2p[1] << (GMP_NUMB_BITS - cnt)) & GMP_NUMB_MASK);
 	    rp[1] = (n2p[1] >> cnt);
 	  }
 	else
 	  {
 	    n2p = TMP_ALLOC_LIMBS (nn);
 	    MPN_COPY (n2p, np, nn);
 	    qhl = mpn_divrem_2 (qp, 0L, n2p, nn, dp);
 	    qp[nn - 2] = qhl;	/* always store nn-2+1 quotient limbs */
 	    rp[0] = n2p[0];
 	    rp[1] = n2p[1];
 	  }
 	TMP_FREE;
 	return;
       }

     default:
       {
 	int adjust;
 	gmp_pi1_t dinv;
 	TMP_DECL;
 	TMP_MARK;
 	adjust = np[nn - 1] >= dp[dn - 1];	/* conservative tests for quotient size */
 	if (nn + adjust >= 2 * dn)
 	  {
 	    mp_ptr n2p, d2p;
 	    mp_limb_t cy;
 	    int cnt;

 	    qp[nn - dn] = 0;			  /* zero high quotient limb */
 	    if ((dp[dn - 1] & GMP_NUMB_HIGHBIT) == 0) /* normalize divisor */
 	      {
 		count_leading_zeros (cnt, dp[dn - 1]);
 		cnt -= GMP_NAIL_BITS;
 		d2p = TMP_ALLOC_LIMBS (dn);
 		mpn_lshift (d2p, dp, dn, cnt);
 		n2p = TMP_ALLOC_LIMBS (nn + 1);
 		cy = mpn_lshift (n2p, np, nn, cnt);
 		n2p[nn] = cy;
 		nn += adjust;
 	      }
 	    else
 	      {
 		cnt = 0;
 		d2p = (mp_ptr) dp;
 		n2p = TMP_ALLOC_LIMBS (nn + 1);
 		MPN_COPY (n2p, np, nn);
 		n2p[nn] = 0;
 		nn += adjust;
 	      }

 	    invert_pi1 (dinv, d2p[dn - 1], d2p[dn - 2]);
 	    if (BELOW_THRESHOLD (dn, DC_DIV_QR_THRESHOLD))
 	      mpn_sbpi1_div_qr (qp, n2p, nn, d2p, dn, dinv.inv32);
 	    else if (BELOW_THRESHOLD (dn, MUPI_DIV_QR_THRESHOLD) ||   /* fast condition */
 		     BELOW_THRESHOLD (nn, 2 * MU_DIV_QR_THRESHOLD) || /* fast condition */
 		     (double) (2 * (MU_DIV_QR_THRESHOLD - MUPI_DIV_QR_THRESHOLD)) * dn /* slow... */
 		     + (double) MUPI_DIV_QR_THRESHOLD * nn > (double) dn * nn)    /* ...condition */
 	      mpn_dcpi1_div_qr (qp, n2p, nn, d2p, dn, &dinv);
 	    else
 	      {
 		mp_size_t itch = mpn_mu_div_qr_itch (nn, dn, 0);
 		mp_ptr scratch = TMP_ALLOC_LIMBS (itch);
 		mpn_mu_div_qr (qp, rp, n2p, nn, d2p, dn, scratch);
 		n2p = rp;
 	      }

 	    if (cnt != 0)
 	      mpn_rshift (rp, n2p, dn, cnt);
 	    else
 	      MPN_COPY (rp, n2p, dn);
 	    TMP_FREE;
 	    return;
 	  }

 	/* When we come here, the numerator/partial remainder is less
 	   than twice the size of the denominator.  */

 	  {
 	    /* Problem:

 	       Divide a numerator N with nn limbs by a denominator D with dn
 	       limbs forming a quotient of qn=nn-dn+1 limbs.  When qn is small
 	       compared to dn, conventional division algorithms perform poorly.
 	       We want an algorithm that has an expected running time that is
 	       dependent only on qn.

 	       Algorithm (very informally stated):

 	       1) Divide the 2 x qn most significant limbs from the numerator
 		  by the qn most significant limbs from the denominator.  Call
 		  the result qest.  This is either the correct quotient, but
 		  might be 1 or 2 too large.  Compute the remainder from the
 		  division.  (This step is implemented by an mpn_divrem call.)

 	       2) Is the most significant limb from the remainder < p, where p
 		  is the product of the most significant limb from the quotient
 		  and the next(d)?  (Next(d) denotes the next ignored limb from
 		  the denominator.)  If it is, decrement qest, and adjust the
 		  remainder accordingly.

 	       3) Is the remainder >= qest?  If it is, qest is the desired
 		  quotient.  The algorithm terminates.

 	       4) Subtract qest x next(d) from the remainder.  If there is
 		  borrow out, decrement qest, and adjust the remainder
 		  accordingly.

 	       5) Skip one word from the denominator (i.e., let next(d) denote
 		  the next less significant limb.  */

 	    mp_size_t qn;
 	    mp_ptr n2p, d2p;
 	    mp_ptr tp;
 	    mp_limb_t cy;
 	    mp_size_t in, rn;
 	    mp_limb_t quotient_too_large;
 	    unsigned int cnt;

 	    qn = nn - dn;
 	    qp[qn] = 0;				/* zero high quotient limb */
 	    qn += adjust;			/* qn cannot become bigger */

 	    if (qn == 0)
 	      {
 		MPN_COPY (rp, np, dn);
 		TMP_FREE;
 		return;
 	      }

 	    in = dn - qn;		/* (at least partially) ignored # of limbs in ops */
 	    /* Normalize denominator by shifting it to the left such that its
 	       most significant bit is set.  Then shift the numerator the same
 	       amount, to mathematically preserve quotient.  */
 	    if ((dp[dn - 1] & GMP_NUMB_HIGHBIT) == 0)
 	      {
 		count_leading_zeros (cnt, dp[dn - 1]);
 		cnt -= GMP_NAIL_BITS;

 		d2p = TMP_ALLOC_LIMBS (qn);
 		mpn_lshift (d2p, dp + in, qn, cnt);
 		d2p[0] |= dp[in - 1] >> (GMP_NUMB_BITS - cnt);

 		n2p = TMP_ALLOC_LIMBS (2 * qn + 1);
 		cy = mpn_lshift (n2p, np + nn - 2 * qn, 2 * qn, cnt);
 		if (adjust)
 		  {
 		    n2p[2 * qn] = cy;
 		    n2p++;
 		  }
 		else
 		  {
 		    n2p[0] |= np[nn - 2 * qn - 1] >> (GMP_NUMB_BITS - cnt);
 		  }
 	      }
 	    else
 	      {
 		cnt = 0;
 		d2p = (mp_ptr) dp + in;

 		n2p = TMP_ALLOC_LIMBS (2 * qn + 1);
 		MPN_COPY (n2p, np + nn - 2 * qn, 2 * qn);
 		if (adjust)
 		  {
 		    n2p[2 * qn] = 0;
 		    n2p++;
 		  }
 	      }

 	    /* Get an approximate quotient using the extracted operands.  */
 	    if (qn == 1)
 	      {
 		mp_limb_t q0, r0;
 		udiv_qrnnd (q0, r0, n2p[1], n2p[0] << GMP_NAIL_BITS, d2p[0] << GMP_NAIL_BITS);
 		n2p[0] = r0 >> GMP_NAIL_BITS;
 		qp[0] = q0;
 	      }
 	    else if (qn == 2)
 	      mpn_divrem_2 (qp, 0L, n2p, 4L, d2p); /* FIXME: obsolete function */
 	    else
 	      {
 		invert_pi1 (dinv, d2p[qn - 1], d2p[qn - 2]);
 		if (BELOW_THRESHOLD (qn, DC_DIV_QR_THRESHOLD))
 		  mpn_sbpi1_div_qr (qp, n2p, 2 * qn, d2p, qn, dinv.inv32);
 		else if (BELOW_THRESHOLD (qn, MU_DIV_QR_THRESHOLD))
 		  mpn_dcpi1_div_qr (qp, n2p, 2 * qn, d2p, qn, &dinv);
 		else
 		  {
 		    mp_size_t itch = mpn_mu_div_qr_itch (2 * qn, qn, 0);
 		    mp_ptr scratch = TMP_ALLOC_LIMBS (itch);
 		    mp_ptr r2p = rp;
 		    if (np == r2p)	/* If N and R share space, put ... */
 		      r2p += nn - qn;	/* intermediate remainder at N's upper end. */
 		    mpn_mu_div_qr (qp, r2p, n2p, 2 * qn, d2p, qn, scratch);
 		    MPN_COPY (n2p, r2p, qn);
 		  }
 	      }

 	    rn = qn;
 	    /* Multiply the first ignored divisor limb by the most significant
 	       quotient limb.  If that product is > the partial remainder's
 	       most significant limb, we know the quotient is too large.  This
 	       test quickly catches most cases where the quotient is too large;
 	       it catches all cases where the quotient is 2 too large.  */
 	    {
 	      mp_limb_t dl, x;
 	      mp_limb_t h, dummy;

 	      if (in - 2 < 0)
 		dl = 0;
 	      else
 		dl = dp[in - 2];

 #if GMP_NAIL_BITS == 0
 	      x = (dp[in - 1] << cnt) | ((dl >> 1) >> ((~cnt) % GMP_LIMB_BITS));
 #else
 	      x = (dp[in - 1] << cnt) & GMP_NUMB_MASK;
 	      if (cnt != 0)
 		x |= dl >> (GMP_NUMB_BITS - cnt);
 #endif
 	      umul_ppmm (h, dummy, x, qp[qn - 1] << GMP_NAIL_BITS);

 	      if (n2p[qn - 1] < h)
 		{
 		  mp_limb_t cy;

 		  mpn_decr_u (qp, (mp_limb_t) 1);
 		  cy = mpn_add_n (n2p, n2p, d2p, qn);
 		  if (cy)
 		    {
 		      /* The partial remainder is safely large.  */
 		      n2p[qn] = cy;
 		      ++rn;
 		    }
 		}
 	    }

 	    quotient_too_large = 0;
 	    if (cnt != 0)
 	      {
 		mp_limb_t cy1, cy2;

 		/* Append partially used numerator limb to partial remainder.  */
 		cy1 = mpn_lshift (n2p, n2p, rn, GMP_NUMB_BITS - cnt);
 		n2p[0] |= np[in - 1] & (GMP_NUMB_MASK >> cnt);

 		/* Update partial remainder with partially used divisor limb.  */
 		cy2 = mpn_submul_1 (n2p, qp, qn, dp[in - 1] & (GMP_NUMB_MASK >> cnt));
 		if (qn != rn)
 		  {
 		    ASSERT_ALWAYS (n2p[qn] >= cy2);
 		    n2p[qn] -= cy2;
 		  }
 		else
 		  {
 		    n2p[qn] = cy1 - cy2; /* & GMP_NUMB_MASK; */

 		    quotient_too_large = (cy1 < cy2);
 		    ++rn;
 		  }
 		--in;
 	      }
 	    /* True: partial remainder now is neutral, i.e., it is not shifted up.  */

 	    tp = TMP_ALLOC_LIMBS (dn);

 	    if (in < qn)
 	      {
 		if (in == 0)
 		  {
 		    MPN_COPY (rp, n2p, rn);
 		    ASSERT_ALWAYS (rn == dn);
 		    goto foo;
 		  }
 		mpn_mul (tp, qp, qn, dp, in);
 	      }
 	    else
 	      mpn_mul (tp, dp, in, qp, qn);

 	    cy = mpn_sub (n2p, n2p, rn, tp + in, qn);
 	    MPN_COPY (rp + in, n2p, dn - in);
 	    quotient_too_large |= cy;
 	    cy = mpn_sub_n (rp, np, tp, in);
 	    cy = mpn_sub_1 (rp + in, rp + in, rn, cy);
 	    quotient_too_large |= cy;
 	  foo:
 	    if (quotient_too_large)
 	      {
 		mpn_decr_u (qp, (mp_limb_t) 1);
 		mpn_add_n (rp, rp, dp, dn);
 	      }
 	  }
 	TMP_FREE;
 	return;
       }
     }
 }
	/* mpn_tdiv_qr -- Divide the numerator (np,nn) by the denominator (dp,dn) and
	write the nn-dn+1 quotient limbs at qp and the dn remainder limbs at rp. If
	qxn is non-zero, generate that many fraction limbs and append them after the
	other quotient limbs, and update the remainder accordingly. The input
	operands are unaffected.

	Preconditions:
	1. The most significant limb of the divisor must be non-zero.
	2. nn >= dn, even if qxn is non-zero. (??? relax this ???)

	The time complexity of this is O(qn*qn+M(dn,qn)), where M(m,n) is the time
	complexity of multiplication.

	Copyright 1997, 2000-2002, 2005, 2009, 2015 Free Software Foundation, Inc.

	This file is part of the GNU MP Library.

	The GNU MP Library is free software; you can redistribute it and/or modify
	it under the terms of either:

	* the GNU Lesser General Public License as published by the Free
	Software Foundation; either version 3 of the License, or (at your
	option) any later version.

	or

	* the GNU General Public License as published by the Free Software
	Foundation; either version 2 of the License, or (at your option) any
	later version.

	or both in parallel, as here.

	The GNU MP Library is distributed in the hope that it will be useful, but
	WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
	or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
	for more details.

	You should have received copies of the GNU General Public License and the
	GNU Lesser General Public License along with the GNU MP Library. If not,
	see https://www.gnu.org/licenses/. */

	#include "gmp-impl.h"
	#include "longlong.h"


	void
	mpn_tdiv_qr (mp_ptr qp, mp_ptr rp, mp_size_t qxn,
	mp_srcptr np, mp_size_t nn, mp_srcptr dp, mp_size_t dn)
	{
	ASSERT_ALWAYS (qxn == 0);

	ASSERT (nn >= 0);
	ASSERT (dn >= 0);
	ASSERT (dn == 0 \|\| dp[dn - 1] != 0);
	ASSERT (! MPN_OVERLAP_P (qp, nn - dn + 1 + qxn, np, nn));
	ASSERT (! MPN_OVERLAP_P (qp, nn - dn + 1 + qxn, dp, dn));

	switch (dn)
	{
	case 0:
	DIVIDE_BY_ZERO;

	case 1:
	{
	rp[0] = mpn_divrem_1 (qp, (mp_size_t) 0, np, nn, dp[0]);
	return;
	}

	case 2:
	{
	mp_ptr n2p;
	mp_limb_t qhl, cy;
	TMP_DECL;
	TMP_MARK;
	if ((dp[1] & GMP_NUMB_HIGHBIT) == 0)
	{
	int cnt;
	mp_limb_t d2p[2];
	count_leading_zeros (cnt, dp[1]);
	cnt -= GMP_NAIL_BITS;
	d2p[1] = (dp[1] << cnt) \| (dp[0] >> (GMP_NUMB_BITS - cnt));
	d2p[0] = (dp[0] << cnt) & GMP_NUMB_MASK;
	n2p = TMP_ALLOC_LIMBS (nn + 1);
	cy = mpn_lshift (n2p, np, nn, cnt);
	n2p[nn] = cy;
	qhl = mpn_divrem_2 (qp, 0L, n2p, nn + (cy != 0), d2p);
	if (cy == 0)
	qp[nn - 2] = qhl; /* always store nn-2+1 quotient limbs */
	rp[0] = (n2p[0] >> cnt)
	\| ((n2p[1] << (GMP_NUMB_BITS - cnt)) & GMP_NUMB_MASK);
	rp[1] = (n2p[1] >> cnt);
	}
	else
	{
	n2p = TMP_ALLOC_LIMBS (nn);
	MPN_COPY (n2p, np, nn);
	qhl = mpn_divrem_2 (qp, 0L, n2p, nn, dp);
	qp[nn - 2] = qhl; /* always store nn-2+1 quotient limbs */
	rp[0] = n2p[0];
	rp[1] = n2p[1];
	}
	TMP_FREE;
	return;
	}

	default:
	{
	int adjust;
	gmp_pi1_t dinv;
	TMP_DECL;
	TMP_MARK;
	adjust = np[nn - 1] >= dp[dn - 1]; /* conservative tests for quotient size */
	if (nn + adjust >= 2 * dn)
	{
	mp_ptr n2p, d2p;
	mp_limb_t cy;
	int cnt;

	qp[nn - dn] = 0; /* zero high quotient limb */
	if ((dp[dn - 1] & GMP_NUMB_HIGHBIT) == 0) /* normalize divisor */
	{
	count_leading_zeros (cnt, dp[dn - 1]);
	cnt -= GMP_NAIL_BITS;
	d2p = TMP_ALLOC_LIMBS (dn);
	mpn_lshift (d2p, dp, dn, cnt);
	n2p = TMP_ALLOC_LIMBS (nn + 1);
	cy = mpn_lshift (n2p, np, nn, cnt);
	n2p[nn] = cy;
	nn += adjust;
	}
	else
	{
	cnt = 0;
	d2p = (mp_ptr) dp;
	n2p = TMP_ALLOC_LIMBS (nn + 1);
	MPN_COPY (n2p, np, nn);
	n2p[nn] = 0;
	nn += adjust;
	}

	invert_pi1 (dinv, d2p[dn - 1], d2p[dn - 2]);
	if (BELOW_THRESHOLD (dn, DC_DIV_QR_THRESHOLD))
	mpn_sbpi1_div_qr (qp, n2p, nn, d2p, dn, dinv.inv32);
	else if (BELOW_THRESHOLD (dn, MUPI_DIV_QR_THRESHOLD) \|\| /* fast condition */
	BELOW_THRESHOLD (nn, 2 * MU_DIV_QR_THRESHOLD) \|\| /* fast condition */
	(double) (2 * (MU_DIV_QR_THRESHOLD - MUPI_DIV_QR_THRESHOLD)) * dn /* slow... */
	+ (double) MUPI_DIV_QR_THRESHOLD * nn > (double) dn * nn) /* ...condition */
	mpn_dcpi1_div_qr (qp, n2p, nn, d2p, dn, &dinv);
	else
	{
	mp_size_t itch = mpn_mu_div_qr_itch (nn, dn, 0);
	mp_ptr scratch = TMP_ALLOC_LIMBS (itch);
	mpn_mu_div_qr (qp, rp, n2p, nn, d2p, dn, scratch);
	n2p = rp;
	}

	if (cnt != 0)
	mpn_rshift (rp, n2p, dn, cnt);
	else
	MPN_COPY (rp, n2p, dn);
	TMP_FREE;
	return;
	}

	/* When we come here, the numerator/partial remainder is less
	than twice the size of the denominator. */

	{
	/* Problem:

	Divide a numerator N with nn limbs by a denominator D with dn
	limbs forming a quotient of qn=nn-dn+1 limbs. When qn is small
	compared to dn, conventional division algorithms perform poorly.
	We want an algorithm that has an expected running time that is
	dependent only on qn.

	Algorithm (very informally stated):

	1) Divide the 2 x qn most significant limbs from the numerator
	by the qn most significant limbs from the denominator. Call
	the result qest. This is either the correct quotient, but
	might be 1 or 2 too large. Compute the remainder from the
	division. (This step is implemented by an mpn_divrem call.)

	2) Is the most significant limb from the remainder < p, where p
	is the product of the most significant limb from the quotient
	and the next(d)? (Next(d) denotes the next ignored limb from
	the denominator.) If it is, decrement qest, and adjust the
	remainder accordingly.

	3) Is the remainder >= qest? If it is, qest is the desired
	quotient. The algorithm terminates.

	4) Subtract qest x next(d) from the remainder. If there is
	borrow out, decrement qest, and adjust the remainder
	accordingly.

	5) Skip one word from the denominator (i.e., let next(d) denote
	the next less significant limb. */

	mp_size_t qn;
	mp_ptr n2p, d2p;
	mp_ptr tp;
	mp_limb_t cy;
	mp_size_t in, rn;
	mp_limb_t quotient_too_large;
	unsigned int cnt;

	qn = nn - dn;
	qp[qn] = 0; /* zero high quotient limb */
	qn += adjust; /* qn cannot become bigger */

	if (qn == 0)
	{
	MPN_COPY (rp, np, dn);
	TMP_FREE;
	return;
	}

	in = dn - qn; /* (at least partially) ignored # of limbs in ops */
	/* Normalize denominator by shifting it to the left such that its
	most significant bit is set. Then shift the numerator the same
	amount, to mathematically preserve quotient. */
	if ((dp[dn - 1] & GMP_NUMB_HIGHBIT) == 0)
	{
	count_leading_zeros (cnt, dp[dn - 1]);
	cnt -= GMP_NAIL_BITS;

	d2p = TMP_ALLOC_LIMBS (qn);
	mpn_lshift (d2p, dp + in, qn, cnt);
	d2p[0] \|= dp[in - 1] >> (GMP_NUMB_BITS - cnt);

	n2p = TMP_ALLOC_LIMBS (2 * qn + 1);
	cy = mpn_lshift (n2p, np + nn - 2 * qn, 2 * qn, cnt);
	if (adjust)
	{
	n2p[2 * qn] = cy;
	n2p++;
	}
	else
	{
	n2p[0] \|= np[nn - 2 * qn - 1] >> (GMP_NUMB_BITS - cnt);
	}
	}
	else
	{
	cnt = 0;
	d2p = (mp_ptr) dp + in;

	n2p = TMP_ALLOC_LIMBS (2 * qn + 1);
	MPN_COPY (n2p, np + nn - 2 * qn, 2 * qn);
	if (adjust)
	{
	n2p[2 * qn] = 0;
	n2p++;
	}
	}

	/* Get an approximate quotient using the extracted operands. */
	if (qn == 1)
	{
	mp_limb_t q0, r0;
	udiv_qrnnd (q0, r0, n2p[1], n2p[0] << GMP_NAIL_BITS, d2p[0] << GMP_NAIL_BITS);
	n2p[0] = r0 >> GMP_NAIL_BITS;
	qp[0] = q0;
	}
	else if (qn == 2)
	mpn_divrem_2 (qp, 0L, n2p, 4L, d2p); /* FIXME: obsolete function */
	else
	{
	invert_pi1 (dinv, d2p[qn - 1], d2p[qn - 2]);
	if (BELOW_THRESHOLD (qn, DC_DIV_QR_THRESHOLD))
	mpn_sbpi1_div_qr (qp, n2p, 2 * qn, d2p, qn, dinv.inv32);
	else if (BELOW_THRESHOLD (qn, MU_DIV_QR_THRESHOLD))
	mpn_dcpi1_div_qr (qp, n2p, 2 * qn, d2p, qn, &dinv);
	else
	{
	mp_size_t itch = mpn_mu_div_qr_itch (2 * qn, qn, 0);
	mp_ptr scratch = TMP_ALLOC_LIMBS (itch);
	mp_ptr r2p = rp;
	if (np == r2p) /* If N and R share space, put ... */
	r2p += nn - qn; /* intermediate remainder at N's upper end. */
	mpn_mu_div_qr (qp, r2p, n2p, 2 * qn, d2p, qn, scratch);
	MPN_COPY (n2p, r2p, qn);
	}
	}

	rn = qn;
	/* Multiply the first ignored divisor limb by the most significant
	quotient limb. If that product is > the partial remainder's
	most significant limb, we know the quotient is too large. This
	test quickly catches most cases where the quotient is too large;
	it catches all cases where the quotient is 2 too large. */
	{
	mp_limb_t dl, x;
	mp_limb_t h, dummy;

	if (in - 2 < 0)
	dl = 0;
	else
	dl = dp[in - 2];

	#if GMP_NAIL_BITS == 0
	x = (dp[in - 1] << cnt) \| ((dl >> 1) >> ((~cnt) % GMP_LIMB_BITS));
	#else
	x = (dp[in - 1] << cnt) & GMP_NUMB_MASK;
	if (cnt != 0)
	x \|= dl >> (GMP_NUMB_BITS - cnt);
	#endif
	umul_ppmm (h, dummy, x, qp[qn - 1] << GMP_NAIL_BITS);

	if (n2p[qn - 1] < h)
	{
	mp_limb_t cy;

	mpn_decr_u (qp, (mp_limb_t) 1);
	cy = mpn_add_n (n2p, n2p, d2p, qn);
	if (cy)
	{
	/* The partial remainder is safely large. */
	n2p[qn] = cy;
	++rn;
	}
	}
	}

	quotient_too_large = 0;
	if (cnt != 0)
	{
	mp_limb_t cy1, cy2;

	/* Append partially used numerator limb to partial remainder. */
	cy1 = mpn_lshift (n2p, n2p, rn, GMP_NUMB_BITS - cnt);
	n2p[0] \|= np[in - 1] & (GMP_NUMB_MASK >> cnt);

	/* Update partial remainder with partially used divisor limb. */
	cy2 = mpn_submul_1 (n2p, qp, qn, dp[in - 1] & (GMP_NUMB_MASK >> cnt));
	if (qn != rn)
	{
	ASSERT_ALWAYS (n2p[qn] >= cy2);
	n2p[qn] -= cy2;
	}
	else
	{
	n2p[qn] = cy1 - cy2; /* & GMP_NUMB_MASK; */

	quotient_too_large = (cy1 < cy2);
	++rn;
	}
	--in;
	}
	/* True: partial remainder now is neutral, i.e., it is not shifted up. */

	tp = TMP_ALLOC_LIMBS (dn);

	if (in < qn)
	{
	if (in == 0)
	{
	MPN_COPY (rp, n2p, rn);
	ASSERT_ALWAYS (rn == dn);
	goto foo;
	}
	mpn_mul (tp, qp, qn, dp, in);
	}
	else
	mpn_mul (tp, dp, in, qp, qn);

	cy = mpn_sub (n2p, n2p, rn, tp + in, qn);
	MPN_COPY (rp + in, n2p, dn - in);
	quotient_too_large \|= cy;
	cy = mpn_sub_n (rp, np, tp, in);
	cy = mpn_sub_1 (rp + in, rp + in, rn, cy);
	quotient_too_large \|= cy;
	foo:
	if (quotient_too_large)
	{
	mpn_decr_u (qp, (mp_limb_t) 1);
	mpn_add_n (rp, rp, dp, dn);
	}
	}
	TMP_FREE;
	return;
	}
	}
	}