Add a workaround so that the correct header providing the FP16C intrinsics is included when compiling with clang.

This commit is contained in:
Rasmus Munk Larsen 2019-06-05 13:36:37 -07:00
parent c1b0aea653
commit f715f6e816

View File

@ -375,6 +375,13 @@
// Feature detection for hardware half-precision (fp16) <-> float conversion.
// EIGEN_HAS_FP16_C is defined when __F16C__ is defined and EIGEN_COMP_CLANG is
// either not defined or at least 380 (presumably clang 3.8 -- TODO confirm the
// version encoding against the definition of EIGEN_COMP_CLANG).
// NOTE(review): the check uses defined(EIGEN_COMP_CLANG). If that macro is
// defined (e.g. as 0) for non-clang compilers too, this condition is false on
// those compilers and FP16C support is never enabled there -- verify.
#if defined(__F16C__) && (!defined(EIGEN_COMP_CLANG) || EIGEN_COMP_CLANG>=380)
// We can use the optimized fp16 to float and float to fp16 conversion routines
#define EIGEN_HAS_FP16_C
// NOTE(review): this also tests definedness rather than value, so the include
// below applies to every compiler for which EIGEN_COMP_CLANG is defined, not
// only to clang -- confirm this is intended.
#if defined(EIGEN_COMP_CLANG)
// Workaround for clang: The FP16C intrinsics for clang are included by
// immintrin.h, as opposed to emmintrin.h as suggested by Intel:
// https://software.intel.com/sites/landingpage/IntrinsicsGuide/#othertechs=FP16C&expand=1711
#include <immintrin.h>
#endif  // defined(EIGEN_COMP_CLANG)
#endif  // __F16C__ available and compiler version supported
#if defined EIGEN_CUDACC