summaryrefslogtreecommitdiff
path: root/m4
diff options
context:
space:
mode:
authorBruno Haible <bruno@clisp.org>2011-10-17 23:51:21 +0200
committerBruno Haible <bruno@clisp.org>2011-11-06 02:36:24 +0100
commite657a45c9599559dead7bbadb320764d7362d209 (patch)
tree361b178bd7b1866ae19f819db53877eb7d626127 /m4
parentb8d5f042e8a565bab1d73a5d7f56db342ae51451 (diff)
downloadgnulib-e657a45c9599559dead7bbadb320764d7362d209.tar.gz
New module 'fmaf'.
* lib/math.in.h (fmaf): New declaration. * lib/fmaf.c: New file. * m4/fmaf.m4: New file. * m4/math_h.m4 (gl_MATH_H): Test whethern fmaf is declared. (gl_MATH_H_DEFAULTS): Initialize GNULIB_FMAF, HAVE_FMAF, REPLACE_FMAF. * modules/math (Makefile.am): Substitute GNULIB_FMAF, HAVE_FMAF, REPLACE_FMAF. * modules/fmaf: New file. * doc/posix-functions/fmaf.texi: Mention the new module and the various bugs.
Diffstat (limited to 'm4')
-rw-r--r--m4/fmaf.m4167
-rw-r--r--m4/math_h.m47
2 files changed, 172 insertions, 2 deletions
diff --git a/m4/fmaf.m4 b/m4/fmaf.m4
new file mode 100644
index 0000000000..9d6eb37958
--- /dev/null
+++ b/m4/fmaf.m4
@@ -0,0 +1,167 @@
+# fmaf.m4 serial 1
+dnl Copyright (C) 2011 Free Software Foundation, Inc.
+dnl This file is free software; the Free Software Foundation
+dnl gives unlimited permission to copy and/or distribute it,
+dnl with or without modifications, as long as this notice is preserved.
+
+AC_DEFUN([gl_FUNC_FMAF],
+[
+ AC_REQUIRE([gl_MATH_H_DEFAULTS])
+
+ dnl Determine FMAF_LIBM.
+ gl_MATHFUNC([fmaf], [float], [(float, float, float)])
+ if test $gl_cv_func_fmaf_no_libm = yes \
+ || test $gl_cv_func_fmaf_in_libm = yes; then
+ gl_FUNC_FMAF_WORKS
+ case "$gl_cv_func_fmaf_works" in
+ *no) REPLACE_FMAF=1 ;;
+ esac
+ else
+ HAVE_FMAF=0
+ fi
+ if test $HAVE_FMAF = 0 || test $REPLACE_FMAF = 1; then
+ dnl Find libraries needed to link lib/fmaf.c.
+ AC_REQUIRE([gl_FUNC_FREXPF])
+ AC_REQUIRE([gl_FUNC_LDEXPF])
+ AC_REQUIRE([gl_FUNC_FEGETROUND])
+ FMAF_LIBM=
+ dnl Append $FREXPF_LIBM to FMAF_LIBM, avoiding gratuitous duplicates.
+ case " $FMAF_LIBM " in
+ *" $FREXPF_LIBM "*) ;;
+ *) FMAF_LIBM="$FMAF_LIBM $FREXPF_LIBM" ;;
+ esac
+ dnl Append $LDEXPF_LIBM to FMAF_LIBM, avoiding gratuitous duplicates.
+ case " $FMAF_LIBM " in
+ *" $LDEXPF_LIBM "*) ;;
+ *) FMAF_LIBM="$FMAF_LIBM $LDEXPF_LIBM" ;;
+ esac
+ dnl Append $FEGETROUND_LIBM to FMAF_LIBM, avoiding gratuitous duplicates.
+ case " $FMAF_LIBM " in
+ *" $FEGETROUND_LIBM "*) ;;
+ *) FMAF_LIBM="$FMAF_LIBM $FEGETROUND_LIBM" ;;
+ esac
+ fi
+ AC_SUBST([FMAF_LIBM])
+])
+
+dnl Test whether fmaf() has any of the 7 known bugs of glibc 2.11.3 on x86_64.
+AC_DEFUN([gl_FUNC_FMAF_WORKS],
+[
+ AC_REQUIRE([AC_PROG_CC])
+ AC_REQUIRE([AC_CANONICAL_HOST]) dnl for cross-compiles
+ AC_REQUIRE([gl_FUNC_LDEXPF])
+ save_LIBS="$LIBS"
+ LIBS="$LIBS $FMAF_LIBM $LDEXPF_LIBM"
+ AC_CACHE_CHECK([whether fmaf works], [gl_cv_func_fmaf_works],
+ [
+ AC_RUN_IFELSE(
+ [AC_LANG_SOURCE([[
+#include <float.h>
+#include <math.h>
+float p0 = 0.0f;
+int main()
+{
+ int failed_tests = 0;
+ /* These tests fail with glibc 2.11.3 on x86_64. */
+ {
+ volatile float x = 1.5f; /* 3 * 2^-1 */
+ volatile float y = x;
+ volatile float z = ldexpf (1.0f, FLT_MANT_DIG + 1); /* 2^25 */
+ /* x * y + z with infinite precision: 2^25 + 9 * 2^-2.
+ Lies between (2^23 + 0) * 2^2 and (2^23 + 1) * 2^2
+ and is closer to (2^23 + 1) * 2^2, therefore the rounding
+ must round up and produce (2^23 + 1) * 2^2. */
+ volatile float expected = z + 4.0f;
+ volatile float result = fmaf (x, y, z);
+ if (result != expected)
+ failed_tests |= 1;
+ }
+ {
+ volatile float x = 1.25f; /* 2^0 + 2^-2 */
+ volatile float y = - x;
+ volatile float z = ldexpf (1.0f, FLT_MANT_DIG + 1); /* 2^25 */
+ /* x * y + z with infinite precision: 2^25 - 2^0 - 2^-1 - 2^-4.
+ Lies between (2^24 - 1) * 2^1 and 2^24 * 2^1
+ and is closer to (2^24 - 1) * 2^1, therefore the rounding
+ must round down and produce (2^24 - 1) * 2^1. */
+ volatile float expected = (ldexpf (1.0f, FLT_MANT_DIG) - 1.0f) * 2.0f;
+ volatile float result = fmaf (x, y, z);
+ if (result != expected)
+ failed_tests |= 2;
+ }
+ {
+ volatile float x = 1.0f + ldexpf (1.0f, 1 - FLT_MANT_DIG); /* 2^0 + 2^-23 */
+ volatile float y = x;
+ volatile float z = 4.0f; /* 2^2 */
+ /* x * y + z with infinite precision: 2^2 + 2^0 + 2^-22 + 2^-46.
+ Lies between (2^23 + 2^21) * 2^-21 and (2^23 + 2^21 + 1) * 2^-21
+ and is closer to (2^23 + 2^21 + 1) * 2^-21, therefore the rounding
+ must round up and produce (2^23 + 2^21 + 1) * 2^-21. */
+ volatile float expected = 4.0f + 1.0f + ldexpf (1.0f, 3 - FLT_MANT_DIG);
+ volatile float result = fmaf (x, y, z);
+ if (result != expected)
+ failed_tests |= 4;
+ }
+ {
+ volatile float x = 1.0f + ldexpf (1.0f, 1 - FLT_MANT_DIG); /* 2^0 + 2^-23 */
+ volatile float y = - x;
+ volatile float z = 8.0f; /* 2^3 */
+ /* x * y + z with infinite precision: 2^2 + 2^1 + 2^0 - 2^-22 - 2^-46.
+ Lies between (2^23 + 2^22 + 2^21 - 1) * 2^-21 and
+ (2^23 + 2^22 + 2^21) * 2^-21 and is closer to
+ (2^23 + 2^22 + 2^21 - 1) * 2^-21, therefore the rounding
+ must round down and produce (2^23 + 2^22 + 2^21 - 1) * 2^-21. */
+ volatile float expected = 7.0f - ldexpf (1.0f, 3 - FLT_MANT_DIG);
+ volatile float result = fmaf (x, y, z);
+ if (result != expected)
+ failed_tests |= 8;
+ }
+ {
+ volatile float x = 1.25f; /* 2^0 + 2^-2 */
+ volatile float y = - 0.75f; /* - 2^0 + 2^-2 */
+ volatile float z = ldexpf (1.0f, FLT_MANT_DIG); /* 2^24 */
+ /* x * y + z with infinite precision: 2^24 - 2^0 + 2^-4.
+ Lies between (2^24 - 2^0) and 2^24 and is closer to (2^24 - 2^0),
+ therefore the rounding must round down and produce (2^24 - 2^0). */
+ volatile float expected = ldexpf (1.0f, FLT_MANT_DIG) - 1.0f;
+ volatile float result = fmaf (x, y, z);
+ if (result != expected)
+ failed_tests |= 16;
+ }
+ if ((FLT_MANT_DIG % 2) == 0)
+ {
+ volatile float x = 1.0f + ldexpf (1.0f, - FLT_MANT_DIG / 2); /* 2^0 + 2^-12 */
+ volatile float y = x;
+ volatile float z = ldexpf (1.0f, FLT_MIN_EXP - FLT_MANT_DIG); /* 2^-149 */
+ /* x * y + z with infinite precision: 2^0 + 2^-11 + 2^-24 + 2^-149.
+ Lies between (2^23 + 2^12 + 0) * 2^-23 and (2^23 + 2^12 + 1) * 2^-23
+ and is closer to (2^23 + 2^12 + 1) * 2^-23, therefore the rounding
+ must round up and produce (2^23 + 2^12 + 1) * 2^-23. */
+ volatile float expected =
+ 1.0f + ldexpf (1.0f, 1 - FLT_MANT_DIG / 2) + ldexpf (1.0f, 1 - FLT_MANT_DIG);
+ volatile float result = fmaf (x, y, z);
+ if (result != expected)
+ failed_tests |= 32;
+ }
+ {
+ float minus_inf = -1.0f / p0;
+ volatile float x = ldexpf (1.0f, FLT_MAX_EXP - 1);
+ volatile float y = ldexpf (1.0f, FLT_MAX_EXP - 1);
+ volatile float z = minus_inf;
+ volatile float result = fmaf (x, y, z);
+ if (!(result == minus_inf))
+ failed_tests |= 64;
+ }
+ return failed_tests;
+}]])],
+ [gl_cv_func_fmaf_works=yes],
+ [gl_cv_func_fmaf_works=no],
+ [dnl Guess no, even on glibc systems.
+ gl_cv_func_fmaf_works="guessing no"
+ ])
+ ])
+ LIBS="$save_LIBS"
+])
+
+# Prerequisites of lib/fmaf.c.
+AC_DEFUN([gl_PREREQ_FMAF], [:])
diff --git a/m4/math_h.m4 b/m4/math_h.m4
index 878aaff3a1..8c65173033 100644
--- a/m4/math_h.m4
+++ b/m4/math_h.m4
@@ -1,4 +1,4 @@
-# math_h.m4 serial 54
+# math_h.m4 serial 55
dnl Copyright (C) 2007-2011 Free Software Foundation, Inc.
dnl This file is free software; the Free Software Foundation
dnl gives unlimited permission to copy and/or distribute it,
@@ -41,7 +41,7 @@ AC_DEFUN([gl_MATH_H],
gl_WARN_ON_USE_PREPARE([[#include <math.h>]],
[acosf acosl asinf asinl atanf atanl
ceilf ceill copysign copysignf copysignl cosf cosl coshf
- expf expl fabsf floorf floorl fma fmodf frexpf frexpl
+ expf expl fabsf floorf floorl fma fmaf fmodf frexpf frexpl
ldexpf ldexpl logb logf logl log10f modff powf
rint rintf rintl round roundf roundl sinf sinl sinhf sqrtf sqrtl
tanf tanl tanhf trunc truncf truncl])
@@ -81,6 +81,7 @@ AC_DEFUN([gl_MATH_H_DEFAULTS],
GNULIB_FLOORF=0; AC_SUBST([GNULIB_FLOORF])
GNULIB_FLOORL=0; AC_SUBST([GNULIB_FLOORL])
GNULIB_FMA=0; AC_SUBST([GNULIB_FMA])
+ GNULIB_FMAF=0; AC_SUBST([GNULIB_FMAF])
GNULIB_FMODF=0; AC_SUBST([GNULIB_FMODF])
GNULIB_FREXPF=0; AC_SUBST([GNULIB_FREXPF])
GNULIB_FREXP=0; AC_SUBST([GNULIB_FREXP])
@@ -135,6 +136,7 @@ AC_DEFUN([gl_MATH_H_DEFAULTS],
HAVE_EXPL=1; AC_SUBST([HAVE_EXPL])
HAVE_FABSF=1; AC_SUBST([HAVE_FABSF])
HAVE_FMA=1; AC_SUBST([HAVE_FMA])
+ HAVE_FMAF=1; AC_SUBST([HAVE_FMAF])
HAVE_FMODF=1; AC_SUBST([HAVE_FMODF])
HAVE_FREXPF=1; AC_SUBST([HAVE_FREXPF])
HAVE_ISNANF=1; AC_SUBST([HAVE_ISNANF])
@@ -186,6 +188,7 @@ AC_DEFUN([gl_MATH_H_DEFAULTS],
REPLACE_FLOORF=0; AC_SUBST([REPLACE_FLOORF])
REPLACE_FLOORL=0; AC_SUBST([REPLACE_FLOORL])
REPLACE_FMA=0; AC_SUBST([REPLACE_FMA])
+ REPLACE_FMAF=0; AC_SUBST([REPLACE_FMAF])
REPLACE_FREXPF=0; AC_SUBST([REPLACE_FREXPF])
REPLACE_FREXP=0; AC_SUBST([REPLACE_FREXP])
REPLACE_FREXPL=0; AC_SUBST([REPLACE_FREXPL])