diff options
author | zimmerma <zimmerma@211d60ee-9f03-0410-a15a-8952a2c7a4e4> | 2012-03-06 18:37:49 +0000 |
---|---|---|
committer | zimmerma <zimmerma@211d60ee-9f03-0410-a15a-8952a2c7a4e4> | 2012-03-06 18:37:49 +0000 |
commit | b1af57b47281797329f7d3298585a60750e287f9 (patch) | |
tree | 690fc53498f056b2c2fb598c2242bb28465ab1d6 | |
parent | 2e55720e7dc4cb801e1047c137eef2e9c2cbe672 (diff) | |
download | mpc-b1af57b47281797329f7d3298585a60750e287f9.tar.gz |
[sqr.c] in the case of underflow in Karatsuba, fall back to mpfr_fsss
git-svn-id: svn://scm.gforge.inria.fr/svn/mpc/trunk@1138 211d60ee-9f03-0410-a15a-8952a2c7a4e4
-rw-r--r-- | src/sqr.c | 15 |
1 files changed, 11 insertions, 4 deletions
@@ -248,7 +248,9 @@ mpc_sqr (mpc_ptr rop, mpc_srcptr op, mpc_rnd_t rnd) } else { - /* Karatsuba squaring */ + /* Karatsuba squaring: we compute the real part as (x+y)*(x-y) and the + imaginary part as 2*x*y, with a total of 2M instead of 2S+1M for the + naive algorithm, which computes x^2-y^2 and 2*y*y */ mpfr_init (u); mpfr_init (v); @@ -266,7 +268,7 @@ mpc_sqr (mpc_ptr rop, mpc_srcptr op, mpc_rnd_t rnd) /* The error is bounded above by 1 ulp. */ /* We first let inexact be 1 if the real part is not computed */ /* exactly and determine the sign later. */ - inexact = ROUND_AWAY (mpfr_add (u, x, mpc_imagref (op), MPFR_RNDA), u) + inexact = ROUND_AWAY (mpfr_add (u, x, mpc_imagref (op), MPFR_RNDA), u) | ROUND_AWAY (mpfr_sub (v, x, mpc_imagref (op), MPFR_RNDA), v); /* compute the real part as u*v, rounded away */ @@ -284,8 +286,12 @@ mpc_sqr (mpc_ptr rop, mpc_srcptr op, mpc_rnd_t rnd) /* checks that no overflow nor underflow occurs: since u*v > 0 and we round up, an overflow will give +Inf, but an underflow will give 0.5*2^emin */ - MPC_ASSERT (mpfr_get_exp (u) != emin); - if (mpfr_inf_p (u)) + if (mpfr_get_exp (u) == emin) /* underflow */ + { + inex_re = mpfr_fsss (rop->re, x, op->im, MPC_RND_RE (rnd)); + goto end_of_real_part; + } + else if (mpfr_inf_p (u)) { /* let mpc_realref(rop) be a "correctly rounded overflow" */ inex_re = mpfr_set_ui_2exp (mpc_realref (rop), 1, emax, MPC_RND_RE (rnd)); @@ -345,6 +351,7 @@ mpc_sqr (mpc_ptr rop, mpc_srcptr op, mpc_rnd_t rnd) } while (!ok); + end_of_real_part: mpfr_clear (u); mpfr_clear (v); } |