[algorithms.tex] added error analysis for pow_ui

git-svn-id: svn://scm.gforge.inria.fr/svn/mpc/trunk@740 211d60ee-9f03-0410-a15a-8952a2c7a4e4
author: zimmerma <zimmerma@211d60ee-9f03-0410-a15a-8952a2c7a4e4> 2010-03-11 12:22:32 +0000
committer: zimmerma <zimmerma@211d60ee-9f03-0410-a15a-8952a2c7a4e4> 2010-03-11 12:22:32 +0000
commit: 04d32f58c2f36c536123b16a31f236b9846ef591 (patch)
tree: 89469e96c31357c81e1c46c83f162c1b906f57d2 /doc
parent: 4d51e71b251fdbfb4a23ddc4fe8398192944a2d1 (diff)
download: mpc-04d32f58c2f36c536123b16a31f236b9846ef591.tar.gz
2 files changed, 42 insertions, 0 deletions
diff --git a/doc/algorithms.bib b/doc/algorithms.bib
index 8f9d236..50bcaeb 100644
--- a/doc/algorithms.bib
+++ b/doc/algorithms.bib
@@ -37,3 +37,16 @@
   title =        {The {MPFR} {L}ibrary: {A}lgorithms {A}nd {P}roofs},
   note =         {\url{http://www.mpfr.org/algorithms.pdf}},
 }
+
+@Article{Percival03,
+  author = 	 "Colin Percival",
+  title = 	 "Rapid multiplication modulo the sum and difference of
+		  highly composite numbers",
+  journal =	 MC,
+  year =	 2003,
+  volume =	 72,
+  number =	 241,
+  pages =	 "387--395",
+  comment =	 "Includes good error analysis for FFT but proof is
+		  incorrect (result is OK)"
+}
diff --git a/doc/algorithms.tex b/doc/algorithms.tex
index 141c11e..27c27eb 100644
--- a/doc/algorithms.tex
+++ b/doc/algorithms.tex
@@ -1600,6 +1600,35 @@ the determined cases:
 where $\sigma_2$ (resp $\rho_1$, $\rho_2$) is the sign of $x_2$ (resp. $y_1$,
 $y_2$) and with the convention $0^0=+1$.
 
+\subsection {\texttt {mpc\_pow\_ui}}
+
+In the case of a non-negative integer exponent $n$, it might be faster to use
+binary exponentiation to compute $x^n$. This corresponds to a sequence of
+values $v_0 = x$, $v_1 \approx x^2$, \ldots, $v_k \approx x^n$,
+where $k$ is bounded
+by the length of $n$ in binary minus 1, plus the number of set bits in the
+binary representation of $n$ (except the leading one), or simply
+$k \leq 2 \lfloor \log_2 n \rfloor$.
+Each iteration computes either $v_{i+1} = \circ(v_i^2)$, or $v_{i+1} = \circ(x v_i)$.
+Since each such product is correctly rounded, if we work with precision $p$,
+the relative error on the real and imaginary parts of $v_{i+1}$ is bounded
+by $2^{-p}$ for rounding to nearest (with respect to $v_i^2$ or $x v_i$).
+It follows that the relative error in rounding $v_{i+1}$ is bounded by a
+complex value of norm $2^{-p}$. Indeed, if $\tilde{u} = u (1 + \theta_u)$
+and $\tilde{v} = v (1 + \theta_v)$ with $|\theta_u|, |\theta_v| \leq 2^{-p}$,
+then
+\[ \frac{\tilde{u} + i \tilde{v}}{u+iv} = 
+   \frac{u (1 + \theta_u) + i v (1 + \theta_v)}{u+iv} =
+   1 + \theta_z, \]
+where $|\theta_z|^2 = (u^2 \theta_u^2 + v^2 \theta_v^2)/(u^2+v^2) \leq
+2^{-2p}$.
+It is easy to see (for example by induction) that, if $v_i = x^{\ell}$,
+it accumulates exactly $\ell-1$ rounding errors. Thus we can write
+$v_k = x^n (1 + \theta)^{n-1}$, where $\theta$ is a complex number of norm
+at most $2^{-p}$. From this we deduce a bound on the absolute error on the
+real and imaginary parts of $v_k$, for example
+$|x|^n (|1 + 2^{-p}|^{n-1} - 1)$.
+
 \bibliographystyle{acm}
 \bibliography{algorithms}
author	zimmerma <zimmerma@211d60ee-9f03-0410-a15a-8952a2c7a4e4>	2010-03-11 12:22:32 +0000
committer	zimmerma <zimmerma@211d60ee-9f03-0410-a15a-8952a2c7a4e4>	2010-03-11 12:22:32 +0000
commit	04d32f58c2f36c536123b16a31f236b9846ef591 (patch)
tree	89469e96c31357c81e1c46c83f162c1b906f57d2 /doc
parent	4d51e71b251fdbfb4a23ddc4fe8398192944a2d1 (diff)
download	mpc-04d32f58c2f36c536123b16a31f236b9846ef591.tar.gz