1 files changed, 68 insertions, 55 deletions
diff --git a/mpfr/sqrt.c b/mpfr/sqrt.c
index 8489581bd..839f769bd 100644
--- a/mpfr/sqrt.c
+++ b/mpfr/sqrt.c
@@ -1,20 +1,20 @@
 /* mpfr_sqrt -- square root of a floating-point number
 
-Copyright (C) 1999, 2001 Free Software Foundation.
+Copyright (C) 1999, 2001 Free Software Foundation, Inc.
 
 This file is part of the MPFR Library.
 
 The MPFR Library is free software; you can redistribute it and/or modify
-it under the terms of the GNU Library General Public License as published by
-the Free Software Foundation; either version 2 of the License, or (at your
+it under the terms of the GNU Lesser General Public License as published by
+the Free Software Foundation; either version 2.1 of the License, or (at your
 option) any later version.
 
 The MPFR Library is distributed in the hope that it will be useful, but
 WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
-or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Library General Public
+or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
 License for more details.
 
-You should have received a copy of the GNU Library General Public License
+You should have received a copy of the GNU Lesser General Public License
 along with the MPFR Library; see the file COPYING.LIB.  If not, write to
 the Free Software Foundation, Inc., 59 Temple Place - Suite 330, Boston,
 MA 02111-1307, USA. */
@@ -29,14 +29,7 @@ MA 02111-1307, USA. */
 /* #define DEBUG */
 
 int
-#if __STDC__
 mpfr_sqrt (mpfr_ptr r, mpfr_srcptr u, mp_rnd_t rnd_mode)
-#else
-mpfr_sqrt (r, u, rnd_mode)
-     mpfr_ptr r;
-     mpfr_srcptr u;
-     mp_rnd_t rnd_mode;
-#endif
 {
   mp_ptr up, rp, tmp, remp;
   mp_size_t usize, rrsize;
@@ -44,25 +37,25 @@ mpfr_sqrt (r, u, rnd_mode)
   mp_size_t prec, err;
   mp_limb_t q_limb;
   long rw, nw, k; 
-  int exact = 0, t;
+  int inexact = 0, t;
   unsigned long cc = 0; 
   char can_round = 0; 
   TMP_DECL(marker0);
 
   if (MPFR_IS_NAN(u)) {
     MPFR_SET_NAN(r);
-    return 1;
+    return 1; /* NaN is always inexact */
   }
 
   if (MPFR_SIGN(u) < 0) {
     if (MPFR_IS_INF(u) || MPFR_NOTZERO(u)) {
       MPFR_SET_NAN(r);
-      return 1;
+      return 1; /* NaN is always inexact */
     }
     else { /* sqrt(-0) = -0 */
       MPFR_SET_ZERO(r);
       if (MPFR_SIGN(r) > 0) MPFR_CHANGE_SIGN(r);
-      return 0;
+      return 0; /* zero is exact */
     }
   }
 
@@ -72,7 +65,7 @@ mpfr_sqrt (r, u, rnd_mode)
   if (MPFR_IS_INF(u)) 
     { 
       MPFR_SET_INF(r);
-      return 1;
+      return 0; /* infinity is exact */
     }
 
   MPFR_CLEAR_INF(r);
@@ -84,11 +77,10 @@ mpfr_sqrt (r, u, rnd_mode)
       MPFR_EXP(r) = 0;
       rsize = (prec-1)/BITS_PER_MP_LIMB + 1;
       MPN_ZERO(MPFR_MANT(r), rsize);
-      return 0;
+      return 0; /* zero is exact */
     }
 
   up = MPFR_MANT(u);
-
   usize = (MPFR_PREC(u) - 1)/BITS_PER_MP_LIMB + 1; 
 
 #ifdef DEBUG
@@ -121,7 +113,7 @@ mpfr_sqrt (r, u, rnd_mode)
 	{
 	  up = TMP_ALLOC((usize + 1)*BYTES_PER_MP_LIMB);
 	  if (mpn_rshift(up + 1, MPFR_MANT(u), usize, 1))
-	    up [0] = ((mp_limb_t) 1) << (BITS_PER_MP_LIMB - 1); 
+	    up [0] = MP_LIMB_T_HIGHBIT;
 	  else up[0] = 0; 
 	  usize++; 
 	}
@@ -164,14 +156,15 @@ mpfr_sqrt (r, u, rnd_mode)
       q_limb = mpn_sqrtrem (rp, remp, tmp, rsize);
 
 #ifdef DEBUG
-      printf("The result is : \n"); 
-      printf("sqrt : "); 
-      for(k = rrsize - 1; k >= 0; k--) { printf("%lu ", rp[k]); }
-      printf("(q_limb = %lu)\n", q_limb); 
+      printf ("The result is : \n"); 
+      printf ("sqrt : "); 
+      for (k = rrsize - 1; k >= 0; k--)
+	printf ("%lu ", rp[k]);
+      printf ("(inexact = %lu)\n", q_limb); 
 #endif
       
-      can_round = (mpfr_can_round_raw(rp, rrsize, 1, err, 
-				      GMP_RNDZ, rnd_mode, MPFR_PREC(r))); 
+      can_round = mpfr_can_round_raw(rp, rrsize, 1, err, 
+				     GMP_RNDZ, rnd_mode, MPFR_PREC(r));
 
       /* If we used all the limbs of both the dividend and the divisor, 
 	 then we have the correct RNDZ rounding */
@@ -186,67 +179,87 @@ mpfr_sqrt (r, u, rnd_mode)
     }
   while (!can_round && (rsize < 2*usize) 
 	 && (rsize += 2) && (rrsize ++)); 
-
+#ifdef DEBUG
+  printf ("can_round = %d\n", can_round);
+#endif
 
   /* This part may be deplaced upper to avoid a few mpfr_can_round_raw */
   /* when the square root is exact. It is however very unprobable that */
   /* it would improve the behaviour of the present code on average.    */
 
-  if (!q_limb) /* possibly exact */
+  if (!q_limb) /* the sqrtrem call was exact, possible exact square root */
     {
       /* if we have taken into account the whole of up */
       for (k = usize - rsize - 1; k >= 0; k ++)
 	if (up[k]) break; 
       
-      if (k < 0) { exact = 1; goto fin; }
+      if (k < 0)
+	goto fin; /* exact square root ==> inexact = 0 */
     }
 
   if (can_round) 
     {
-      cc = mpfr_round_raw(rp, rp, err, 0, MPFR_PREC(r), rnd_mode);  
+      cc = mpfr_round_raw (rp, rp, err, 0, MPFR_PREC(r), rnd_mode, &inexact);
+      if (!inexact) /* exact high part: inexact flag depends from remainder */
+	inexact = -q_limb;
       rrsize = (MPFR_PREC(r) - 1)/BITS_PER_MP_LIMB + 1; 
     }
   else
     /* Use the return value of sqrtrem to decide of the rounding         */
     /* Note that at this point the sqrt has been computed                */
-    /* EXACTLY. If rounding = GMP_RNDZ, do nothing [comes from           */
-    /* the fact that the exact square root can end with a bunch of ones, */
-    /* and in that case we indeed cannot round if we do not know that    */
-    /* the computation was exact.                                        */
+    /* EXACTLY.                                                          */
     switch (rnd_mode)
       {
       case GMP_RNDZ : 
-      case GMP_RNDD : break; 
+      case GMP_RNDD :
+	inexact = -1; /* result is truncated */
+	break; 
 
       case GMP_RNDN : 
 	/* Not in the situation ...0 111111 */
 	rw = (MPFR_PREC(r) + 1) & (BITS_PER_MP_LIMB - 1);
-	if (rw) { rw = BITS_PER_MP_LIMB - rw; nw = 0; } else nw = 1; 
+	if (rw)
+	  {
+	    rw = BITS_PER_MP_LIMB - rw;
+	    nw = 0;
+	  }
+	else
+	  nw = 1; 
 	if ((rp[nw] >> rw) & 1 &&                     /* Not 0111111111 */
 	    (q_limb ||                                /* Nonzero remainder */
 	    (rw ? (rp[nw] >> (rw + 1)) & 1 : 
 	     (rp[nw] >> (BITS_PER_MP_LIMB - 1)) & 1))) /* or even rounding */ 
-	  cc = mpn_add_1(rp + nw, rp + nw, rrsize, ((mp_limb_t)1) << rw); 
+	  {
+	    cc = mpn_add_1 (rp + nw, rp + nw, rrsize, MP_LIMB_T_ONE << rw);
+	    inexact = 1;
+	  }
+	else
+	  inexact = -1;
 	break;
  
-      case GMP_RNDU : 
-	if (q_limb)
-	  {
-	    t = MPFR_PREC(r) & (BITS_PER_MP_LIMB - 1); 
-	    if (t) 
-	      {
-		cc = mpn_add_1(rp, rp, rrsize, 1 << (BITS_PER_MP_LIMB - t)); 
-	      }
-	    else
-	      cc = mpn_add_1 (rp, rp, rrsize, 1); 
-	  }	      
+      case GMP_RNDU:
+	/* we should arrive here only when the result is inexact,
+	   i.e. either q_limb > 0 (the remainder from mpn_sqrtrem is non-zero)
+	   or up[0..usize-rsize-1] is non zero, thus we have to add one
+	   ulp, and inexact = 1 */
+	inexact = 1;
+	t = MPFR_PREC(r) & (BITS_PER_MP_LIMB - 1);
+	rsize = (MPFR_PREC(r) - 1)/BITS_PER_MP_LIMB + 1;
+	if (t) 
+	    cc = mpn_add_1 (rp + rrsize - rsize, rp + rrsize - rsize, rsize,
+			    MP_LIMB_T_ONE << (BITS_PER_MP_LIMB - t));
+	else
+	    cc = mpn_add_1 (rp + rrsize - rsize, rp + rrsize - rsize, rsize,
+			    MP_LIMB_T_ONE);
       }
 
-  if (cc) {
-    mpn_rshift(rp, rp, rrsize, 1);
-    rp[rrsize-1] |= (mp_limb_t) 1 << (BITS_PER_MP_LIMB-1);
-    MPFR_EXP(r)++; 
-  }
+  if (cc)
+    {
+      /* Is a shift necessary here? Isn't the result 1.0000...? */
+      mpn_rshift (rp, rp, rrsize, 1);
+      rp[rrsize-1] |= MP_LIMB_T_HIGHBIT;
+      MPFR_EXP(r)++; 
+    }
 
  fin:
   rsize = rrsize; 
@@ -254,11 +267,11 @@ mpfr_sqrt (r, u, rnd_mode)
   MPN_COPY(MPFR_MANT(r), rp + rsize - rrsize, rrsize); 
 
   if (MPFR_PREC(r) & (BITS_PER_MP_LIMB - 1))
-    MPFR_MANT(r) [0] &= ~(((mp_limb_t)1 << (BITS_PER_MP_LIMB - 
+    MPFR_MANT(r) [0] &= ~((MP_LIMB_T_ONE << (BITS_PER_MP_LIMB - 
 				   (MPFR_PREC(r) & (BITS_PER_MP_LIMB - 1)))) - 1) ; 
   
   TMP_FREE (marker);
   }
   TMP_FREE(marker0);
-  return exact;
+  return inexact;
 }