Update ConfigureVectorization.h so that the optimized fp16 conversion routines are not enabled when compiling with CUDA.

This commit is contained in:
Anshul Jaiswal 2019-11-06 22:40:38 +00:00
parent cc3d0e6a40
commit c1a67cb5af

View File

@@ -372,7 +372,7 @@
 #endif
 #endif
-#if defined(__F16C__) && (!defined(EIGEN_COMP_CLANG) || EIGEN_COMP_CLANG>=380)
+#if defined(__F16C__) && (!defined(EIGEN_GPUCC) && (!defined(EIGEN_COMP_CLANG) || EIGEN_COMP_CLANG>=380))
 // We can use the optimized fp16 to float and float to fp16 conversion routines
 #define EIGEN_HAS_FP16_C