New module 'fmaf'.

* lib/math.in.h (fmaf): New declaration. * lib/fmaf.c: New file. * m4/fmaf.m4: New file. * m4/math_h.m4 (gl_MATH_H): Test whethern fmaf is declared. (gl_MATH_H_DEFAULTS): Initialize GNULIB_FMAF, HAVE_FMAF, REPLACE_FMAF. * modules/math (Makefile.am): Substitute GNULIB_FMAF, HAVE_FMAF, REPLACE_FMAF. * modules/fmaf: New file. * doc/posix-functions/fmaf.texi: Mention the new module and the various bugs.
author: Bruno Haible <bruno@clisp.org> 2011-10-17 23:51:21 +0200
committer: Bruno Haible <bruno@clisp.org> 2011-11-06 02:36:24 +0100
commit: e657a45c9599559dead7bbadb320764d7362d209 (patch)
tree: 361b178bd7b1866ae19f819db53877eb7d626127 /m4
parent: b8d5f042e8a565bab1d73a5d7f56db342ae51451 (diff)
download: gnulib-e657a45c9599559dead7bbadb320764d7362d209.tar.gz
2 files changed, 172 insertions, 2 deletions
diff --git a/m4/fmaf.m4 b/m4/fmaf.m4
new file mode 100644
index 0000000000..9d6eb37958
--- /dev/null
+++ b/m4/fmaf.m4
@@ -0,0 +1,167 @@
+# fmaf.m4 serial 1
+dnl Copyright (C) 2011 Free Software Foundation, Inc.
+dnl This file is free software; the Free Software Foundation
+dnl gives unlimited permission to copy and/or distribute it,
+dnl with or without modifications, as long as this notice is preserved.
+
+AC_DEFUN([gl_FUNC_FMAF],
+[
+  AC_REQUIRE([gl_MATH_H_DEFAULTS])
+
+  dnl Determine FMAF_LIBM.
+  gl_MATHFUNC([fmaf], [float], [(float, float, float)])
+  if test $gl_cv_func_fmaf_no_libm = yes \
+     || test $gl_cv_func_fmaf_in_libm = yes; then
+    gl_FUNC_FMAF_WORKS
+    case "$gl_cv_func_fmaf_works" in
+      *no) REPLACE_FMAF=1 ;;
+    esac
+  else
+    HAVE_FMAF=0
+  fi
+  if test $HAVE_FMAF = 0 || test $REPLACE_FMAF = 1; then
+    dnl Find libraries needed to link lib/fmaf.c.
+    AC_REQUIRE([gl_FUNC_FREXPF])
+    AC_REQUIRE([gl_FUNC_LDEXPF])
+    AC_REQUIRE([gl_FUNC_FEGETROUND])
+    FMAF_LIBM=
+    dnl Append $FREXPF_LIBM to FMAF_LIBM, avoiding gratuitous duplicates.
+    case " $FMAF_LIBM " in
+      *" $FREXPF_LIBM "*) ;;
+      *) FMAF_LIBM="$FMAF_LIBM $FREXPF_LIBM" ;;
+    esac
+    dnl Append $LDEXPF_LIBM to FMAF_LIBM, avoiding gratuitous duplicates.
+    case " $FMAF_LIBM " in
+      *" $LDEXPF_LIBM "*) ;;
+      *) FMAF_LIBM="$FMAF_LIBM $LDEXPF_LIBM" ;;
+    esac
+    dnl Append $FEGETROUND_LIBM to FMAF_LIBM, avoiding gratuitous duplicates.
+    case " $FMAF_LIBM " in
+      *" $FEGETROUND_LIBM "*) ;;
+      *) FMAF_LIBM="$FMAF_LIBM $FEGETROUND_LIBM" ;;
+    esac
+  fi
+  AC_SUBST([FMAF_LIBM])
+])
+
+dnl Test whether fmaf() has any of the 7 known bugs of glibc 2.11.3 on x86_64.
+AC_DEFUN([gl_FUNC_FMAF_WORKS],
+[
+  AC_REQUIRE([AC_PROG_CC])
+  AC_REQUIRE([AC_CANONICAL_HOST]) dnl for cross-compiles
+  AC_REQUIRE([gl_FUNC_LDEXPF])
+  save_LIBS="$LIBS"
+  LIBS="$LIBS $FMAF_LIBM $LDEXPF_LIBM"
+  AC_CACHE_CHECK([whether fmaf works], [gl_cv_func_fmaf_works],
+    [
+      AC_RUN_IFELSE(
+        [AC_LANG_SOURCE([[
+#include <float.h>
+#include <math.h>
+float p0 = 0.0f;
+int main()
+{
+  int failed_tests = 0;
+  /* These tests fail with glibc 2.11.3 on x86_64.  */
+  {
+    volatile float x = 1.5f; /* 3 * 2^-1 */
+    volatile float y = x;
+    volatile float z = ldexpf (1.0f, FLT_MANT_DIG + 1); /* 2^25 */
+    /* x * y + z with infinite precision: 2^25 + 9 * 2^-2.
+       Lies between (2^23 + 0) * 2^2 and (2^23 + 1) * 2^2
+       and is closer to (2^23 + 1) * 2^2, therefore the rounding
+       must round up and produce (2^23 + 1) * 2^2.  */
+    volatile float expected = z + 4.0f;
+    volatile float result = fmaf (x, y, z);
+    if (result != expected)
+      failed_tests |= 1;
+  }
+  {
+    volatile float x = 1.25f; /* 2^0 + 2^-2 */
+    volatile float y = - x;
+    volatile float z = ldexpf (1.0f, FLT_MANT_DIG + 1); /* 2^25 */
+    /* x * y + z with infinite precision: 2^25 - 2^0 - 2^-1 - 2^-4.
+       Lies between (2^24 - 1) * 2^1 and 2^24 * 2^1
+       and is closer to (2^24 - 1) * 2^1, therefore the rounding
+       must round down and produce (2^24 - 1) * 2^1.  */
+    volatile float expected = (ldexpf (1.0f, FLT_MANT_DIG) - 1.0f) * 2.0f;
+    volatile float result = fmaf (x, y, z);
+    if (result != expected)
+      failed_tests |= 2;
+  }
+  {
+    volatile float x = 1.0f + ldexpf (1.0f, 1 - FLT_MANT_DIG); /* 2^0 + 2^-23 */
+    volatile float y = x;
+    volatile float z = 4.0f; /* 2^2 */
+    /* x * y + z with infinite precision: 2^2 + 2^0 + 2^-22 + 2^-46.
+       Lies between (2^23 + 2^21) * 2^-21 and (2^23 + 2^21 + 1) * 2^-21
+       and is closer to (2^23 + 2^21 + 1) * 2^-21, therefore the rounding
+       must round up and produce (2^23 + 2^21 + 1) * 2^-21.  */
+    volatile float expected = 4.0f + 1.0f + ldexpf (1.0f, 3 - FLT_MANT_DIG);
+    volatile float result = fmaf (x, y, z);
+    if (result != expected)
+      failed_tests |= 4;
+  }
+  {
+    volatile float x = 1.0f + ldexpf (1.0f, 1 - FLT_MANT_DIG); /* 2^0 + 2^-23 */
+    volatile float y = - x;
+    volatile float z = 8.0f; /* 2^3 */
+    /* x * y + z with infinite precision: 2^2 + 2^1 + 2^0 - 2^-22 - 2^-46.
+       Lies between (2^23 + 2^22 + 2^21 - 1) * 2^-21 and
+       (2^23 + 2^22 + 2^21) * 2^-21 and is closer to
+       (2^23 + 2^22 + 2^21 - 1) * 2^-21, therefore the rounding
+       must round down and produce (2^23 + 2^22 + 2^21 - 1) * 2^-21.  */
+    volatile float expected = 7.0f - ldexpf (1.0f, 3 - FLT_MANT_DIG);
+    volatile float result = fmaf (x, y, z);
+    if (result != expected)
+      failed_tests |= 8;
+  }
+  {
+    volatile float x = 1.25f; /* 2^0 + 2^-2 */
+    volatile float y = - 0.75f; /* - 2^0 + 2^-2 */
+    volatile float z = ldexpf (1.0f, FLT_MANT_DIG); /* 2^24 */
+    /* x * y + z with infinite precision: 2^24 - 2^0 + 2^-4.
+       Lies between (2^24 - 2^0) and 2^24 and is closer to (2^24 - 2^0),
+       therefore the rounding must round down and produce (2^24 - 2^0).  */
+    volatile float expected = ldexpf (1.0f, FLT_MANT_DIG) - 1.0f;
+    volatile float result = fmaf (x, y, z);
+    if (result != expected)
+      failed_tests |= 16;
+  }
+  if ((FLT_MANT_DIG % 2) == 0)
+    {
+      volatile float x = 1.0f + ldexpf (1.0f, - FLT_MANT_DIG / 2); /* 2^0 + 2^-12 */
+      volatile float y = x;
+      volatile float z = ldexpf (1.0f, FLT_MIN_EXP - FLT_MANT_DIG); /* 2^-149 */
+      /* x * y + z with infinite precision: 2^0 + 2^-11 + 2^-24 + 2^-149.
+         Lies between (2^23 + 2^12 + 0) * 2^-23 and (2^23 + 2^12 + 1) * 2^-23
+         and is closer to (2^23 + 2^12 + 1) * 2^-23, therefore the rounding
+         must round up and produce (2^23 + 2^12 + 1) * 2^-23.  */
+      volatile float expected =
+        1.0f + ldexpf (1.0f, 1 - FLT_MANT_DIG / 2) + ldexpf (1.0f, 1 - FLT_MANT_DIG);
+      volatile float result = fmaf (x, y, z);
+      if (result != expected)
+        failed_tests |= 32;
+    }
+  {
+    float minus_inf = -1.0f / p0;
+    volatile float x = ldexpf (1.0f, FLT_MAX_EXP - 1);
+    volatile float y = ldexpf (1.0f, FLT_MAX_EXP - 1);
+    volatile float z = minus_inf;
+    volatile float result = fmaf (x, y, z);
+    if (!(result == minus_inf))
+      failed_tests |= 64;
+  }
+  return failed_tests;
+}]])],
+        [gl_cv_func_fmaf_works=yes],
+        [gl_cv_func_fmaf_works=no],
+        [dnl Guess no, even on glibc systems.
+         gl_cv_func_fmaf_works="guessing no"
+        ])
+    ])
+  LIBS="$save_LIBS"
+])
+
+# Prerequisites of lib/fmaf.c.
+AC_DEFUN([gl_PREREQ_FMAF], [:])
diff --git a/m4/math_h.m4 b/m4/math_h.m4
index 878aaff3a1..8c65173033 100644
--- a/m4/math_h.m4
+++ b/m4/math_h.m4
@@ -1,4 +1,4 @@
-# math_h.m4 serial 54
+# math_h.m4 serial 55
 dnl Copyright (C) 2007-2011 Free Software Foundation, Inc.
 dnl This file is free software; the Free Software Foundation
 dnl gives unlimited permission to copy and/or distribute it,
@@ -41,7 +41,7 @@ AC_DEFUN([gl_MATH_H],
   gl_WARN_ON_USE_PREPARE([[#include <math.h>]],
     [acosf acosl asinf asinl atanf atanl
      ceilf ceill copysign copysignf copysignl cosf cosl coshf
-     expf expl fabsf floorf floorl fma fmodf frexpf frexpl
+     expf expl fabsf floorf floorl fma fmaf fmodf frexpf frexpl
      ldexpf ldexpl logb logf logl log10f modff powf
      rint rintf rintl round roundf roundl sinf sinl sinhf sqrtf sqrtl
      tanf tanl tanhf trunc truncf truncl])
@@ -81,6 +81,7 @@ AC_DEFUN([gl_MATH_H_DEFAULTS],
   GNULIB_FLOORF=0;    AC_SUBST([GNULIB_FLOORF])
   GNULIB_FLOORL=0;    AC_SUBST([GNULIB_FLOORL])
   GNULIB_FMA=0;       AC_SUBST([GNULIB_FMA])
+  GNULIB_FMAF=0;      AC_SUBST([GNULIB_FMAF])
   GNULIB_FMODF=0;     AC_SUBST([GNULIB_FMODF])
   GNULIB_FREXPF=0;    AC_SUBST([GNULIB_FREXPF])
   GNULIB_FREXP=0;     AC_SUBST([GNULIB_FREXP])
@@ -135,6 +136,7 @@ AC_DEFUN([gl_MATH_H_DEFAULTS],
   HAVE_EXPL=1;                 AC_SUBST([HAVE_EXPL])
   HAVE_FABSF=1;                AC_SUBST([HAVE_FABSF])
   HAVE_FMA=1;                  AC_SUBST([HAVE_FMA])
+  HAVE_FMAF=1;                 AC_SUBST([HAVE_FMAF])
   HAVE_FMODF=1;                AC_SUBST([HAVE_FMODF])
   HAVE_FREXPF=1;               AC_SUBST([HAVE_FREXPF])
   HAVE_ISNANF=1;               AC_SUBST([HAVE_ISNANF])
@@ -186,6 +188,7 @@ AC_DEFUN([gl_MATH_H_DEFAULTS],
   REPLACE_FLOORF=0;            AC_SUBST([REPLACE_FLOORF])
   REPLACE_FLOORL=0;            AC_SUBST([REPLACE_FLOORL])
   REPLACE_FMA=0;               AC_SUBST([REPLACE_FMA])
+  REPLACE_FMAF=0;              AC_SUBST([REPLACE_FMAF])
   REPLACE_FREXPF=0;            AC_SUBST([REPLACE_FREXPF])
   REPLACE_FREXP=0;             AC_SUBST([REPLACE_FREXP])
   REPLACE_FREXPL=0;            AC_SUBST([REPLACE_FREXPL])
author	Bruno Haible <bruno@clisp.org>	2011-10-17 23:51:21 +0200
committer	Bruno Haible <bruno@clisp.org>	2011-11-06 02:36:24 +0100
commit	e657a45c9599559dead7bbadb320764d7362d209 (patch)
tree	361b178bd7b1866ae19f819db53877eb7d626127 /m4
parent	b8d5f042e8a565bab1d73a5d7f56db342ae51451 (diff)
download	gnulib-e657a45c9599559dead7bbadb320764d7362d209.tar.gz