[src/div.c] use an approximate quotient in mpfr_div_1()

git-svn-id: svn://scm.gforge.inria.fr/svn/mpfr/trunk@11108 280ebfd0-de03-0410-8827-d642c229c3f4
author: zimmerma <zimmerma@280ebfd0-de03-0410-8827-d642c229c3f4> 2016-12-30 13:16:21 +0000
committer: zimmerma <zimmerma@280ebfd0-de03-0410-8827-d642c229c3f4> 2016-12-30 13:16:21 +0000
commit: b0869ce6a6b21e9a9569381f9b383250b4298a63 (patch)
tree: 21c46d88e5fd2f619090f3a46120c1a9ff0bd221 /src/div.c
parent: 62b800b3f0e0a6ca0bfc21c088a056a76f9ddd28 (diff)
download: mpfr-b0869ce6a6b21e9a9569381f9b383250b4298a63.tar.gz
1 files changed, 28 insertions, 6 deletions
diff --git a/src/div.c b/src/div.c
index 1314d6910..f2351df97 100644
--- a/src/div.c
+++ b/src/div.c
@@ -45,13 +45,35 @@ mpfr_div_1 (mpfr_ptr q, mpfr_srcptr u, mpfr_srcptr v, mpfr_rnd_t rnd_mode)
   mp_limb_t q0, rb, sb, mask = MPFR_LIMB_MASK(sh);
   int extra;
 
-  extra = (u0 >= v0);
-  __udiv_qrnd_preinv (q0, sb, (extra) ? u0 - v0 : u0, v0);
-  qx += extra;
-  rb = q0 & (MPFR_LIMB_ONE << (sh + extra - 1));
-  sb |= (q0 ^ rb) & mask;
-  qp[0] = (((mp_limb_t) extra << (GMP_NUMB_BITS - 1)) | (q0 >> extra)) & ~mask;
+  if ((extra = (u0 >= v0)))
+    u0 -= v0;
+
+#if GMP_NUMB_BITS == 64 /* __gmpfr_invert_limb only exists for 64-bit for now */
+  /* first try with an approximate quotient */
+  mp_limb_t inv = __gmpfr_invert_limb (v0);
+  umul_ppmm (q0, sb, u0, inv);
+  q0 = (q0 + u0) >> extra;
+  /* before the >> extra shift, q0 + u0 does not exceed the true quotient
+     floor(u'0*2^GMP_NUMB_BITS/v0), with error at most 1, which means the rational
+     quotient q satisfies q0 + u0 <= q < q0 + u0 + 2. We can round correctly except
+     when the last sh-1 bits of q0 are now 000..000 or 111..111. */
+  if (MPFR_LIKELY(((q0 + 1) & (mask >> 1)) > 1))
+    {
+      rb = q0 & (MPFR_LIMB_ONE << (sh - 1));
+      sb = 1; /* result cannot be exact when we can round with an approximation */
+    }
+  else /* compute exact quotient and remainder */
+#endif
+    {
+      __udiv_qrnd_preinv (q0, sb, u0, v0);
+      sb |= q0 & extra;
+      q0 >>= extra;
+      rb = q0 & (MPFR_LIMB_ONE << (sh - 1));
+      sb |= q0 & (mask >> 1);
+    }
 
+  qp[0] = (MPFR_LIMB_HIGHBIT | q0) & ~mask;
+  qx += extra;
   MPFR_SIGN(q) = MPFR_MULT_SIGN (MPFR_SIGN (u), MPFR_SIGN (v));
 
   /* rounding */
author	zimmerma <zimmerma@280ebfd0-de03-0410-8827-d642c229c3f4>	2016-12-30 13:16:21 +0000
committer	zimmerma <zimmerma@280ebfd0-de03-0410-8827-d642c229c3f4>	2016-12-30 13:16:21 +0000
commit	b0869ce6a6b21e9a9569381f9b383250b4298a63 (patch)
tree	21c46d88e5fd2f619090f3a46120c1a9ff0bd221 /src/div.c
parent	62b800b3f0e0a6ca0bfc21c088a056a76f9ddd28 (diff)
download	mpfr-b0869ce6a6b21e9a9569381f9b383250b4298a63.tar.gz