bug #1674: workaround clang fast-math aggressive optimizations

2025-08-12 03:39:01 +08:00 · 2019-02-22 15:48:53 +01:00 · 2019-02-22 15:48:53 +01:00 · 1c09ee8541
commit 1c09ee8541
parent 7e3084bb6f
1 changed files with 13 additions and 0 deletions
--- a/Eigen/src/Core/arch/Default/GenericPacketMathFunctions.h
+++ b/Eigen/src/Core/arch/Default/GenericPacketMathFunctions.h
@ -324,6 +324,14 @@ __attribute__((optimize("-fno-unsafe-math-optimizations")))
 #endif
 Packet psincos_float(const Packet& _x)
 {
 // Workaround -ffast-math aggressive optimizations
 // See bug 1674
 #if EIGEN_COMP_CLANG && defined(EIGEN_VECTORIZE_SSE)
 #define EIGEN_SINCOS_DONT_OPT(X) __asm__  ("" : "+x" (X));
 #else
 #define EIGEN_SINCOS_DONT_OPT(X)
 #endif
  typedef typename unpacket_traits<Packet>::integer_packet PacketI;
  const Packet  cst_2oPI            = pset1<Packet>(0.636619746685028076171875f); // 2/PI
@ -338,6 +346,7 @@ Packet psincos_float(const Packet& _x)
  // Rounding trick:
  Packet y_round = padd(y, cst_rounding_magic);
  EIGEN_SINCOS_DONT_OPT(y_round)
  PacketI y_int = preinterpret<PacketI>(y_round); // last 23 digits represent integer (if abs(x)<2^24)
  y = psub(y_round, cst_rounding_magic); // nearest integer to x*4/pi
@ -359,7 +368,9 @@ Packet psincos_float(const Packet& _x)
  // and 2 ULP up to:
  const float huge_th = ComputeSine ? 25966.f : 18838.f;
  x = pmadd(y, pset1<Packet>(-1.5703125), x); // = 0xbfc90000
  EIGEN_SINCOS_DONT_OPT(x)
  x = pmadd(y, pset1<Packet>(-0.000483989715576171875), x); // = 0xb9fdc000
  EIGEN_SINCOS_DONT_OPT(x)
  x = pmadd(y, pset1<Packet>(1.62865035235881805419921875e-07), x); // = 0x342ee000
  x = pmadd(y, pset1<Packet>(5.5644315544167710640977020375430583953857421875e-11), x); // = 0x2e74b9ee
@ -436,6 +447,8 @@ Packet psincos_float(const Packet& _x)
  // Update the sign and filter huge inputs
  return pxor(y, sign_bit);
 #undef EIGEN_SINCOS_DONT_OPT
 }
 template<typename Packet>