about summary refs log tree commit diff
diff options
context:
space:
mode:
authorUlrich Drepper <drepper@gmail.com>2011-10-24 22:11:21 -0400
committerUlrich Drepper <drepper@gmail.com>2011-10-24 22:11:21 -0400
commit202c9deb15ee43bcbe70b36fa9bae050b8633c27 (patch)
treeda6f340b0a0475b22c0ec7664f2dfea47aaad153
parent485683c35f020bd8b926e9673adb9b748380e8ce (diff)
downloadglibc-202c9deb15ee43bcbe70b36fa9bae050b8633c27.tar.gz
glibc-202c9deb15ee43bcbe70b36fa9bae050b8633c27.tar.xz
glibc-202c9deb15ee43bcbe70b36fa9bae050b8633c27.zip
Better DLA_FMS
It's better to use __builtin_fma if it works.  Use it for gcc 4.6 and
higher.  Move the x86-64 dla.h to the correct place.
-rw-r--r--ChangeLog6
-rw-r--r--sysdeps/x86_64/fpu/dla.h (renamed from sysdeps/x86_64/dla.h)9
2 files changed, 12 insertions, 3 deletions
diff --git a/ChangeLog b/ChangeLog
index 108d9a96c3..992ad4cb2a 100644
--- a/ChangeLog
+++ b/ChangeLog
@@ -1,7 +1,9 @@
 2011-10-24  Ulrich Drepper  <drepper@gmail.com>
 
-	* sysdeps/x86_64/dla.h (DLA_FMS): Some compilers fail to inline
-	__builtin_fma in some situations.  Have to use an asm.
+	* sysdeps/x86_64/dla.h: Move to ...
+	* sysdeps/x86_64/fpu/dla.h: ...here.
+	(DLA_FMS): Some compilers fail to inline __builtin_fma in some
+	situations.  Use __builtin_fma only for gcc 4.6 and up.
 
 	* config.make.in: Add have-mfma4 entry.
 	* configure.in: Substitute libc_cv_cc_fma4.
diff --git a/sysdeps/x86_64/dla.h b/sysdeps/x86_64/fpu/dla.h
index 6fe8f740f3..fa2d52bbf0 100644
--- a/sysdeps/x86_64/dla.h
+++ b/sysdeps/x86_64/fpu/dla.h
@@ -1,10 +1,17 @@
+#include <features.h>
+
 #ifdef __FMA4__
-# define DLA_FMS(x,y,z) \
+# if __GNUC_PREREQ (4, 6)
+#  define DLA_FMS(x,y,z) \
+  __builtin_fma (x, y, -(z))
+# else
+#  define DLA_FMS(x,y,z) \
   ({ double __z;							      \
      asm ("vfmsubsd %3, %2, %1, %0"					      \
 	  : "=x" (__z)							      \
 	  : "x" ((double) (x)), "xm" ((double) (y)) , "x" ((double) (z)));    \
     __z; })
+# endif
 #endif
 
 #include "sysdeps/ieee754/dbl-64/dla.h"