Update ConfigureVectorization.h so that the optimized fp16 conversion routines are not enabled when compiling with CUDA.

2025-08-13 12:19:12 +08:00 · 2019-11-06 22:40:38 +00:00 · 2019-11-06 22:40:38 +00:00 · c1a67cb5af
commit c1a67cb5af
parent cc3d0e6a40
1 changed file with 1 addition and 1 deletion
--- a/Eigen/src/Core/util/ConfigureVectorization.h
+++ b/Eigen/src/Core/util/ConfigureVectorization.h
@@ -372,7 +372,7 @@
  #endif
 #endif
-#if defined(__F16C__) && (!defined(EIGEN_COMP_CLANG) || EIGEN_COMP_CLANG>=380)
+#if defined(__F16C__) && (!defined(EIGEN_GPUCC) && (!defined(EIGEN_COMP_CLANG) || EIGEN_COMP_CLANG>=380))
  // We can use the optimized fp16 to float and float to fp16 conversion routines
  #define EIGEN_HAS_FP16_C