Fixed another compilation problem with TensorIntDiv.h

2025-08-13 20:26:03 +08:00 · 2015-02-26 11:14:23 -08:00 · 2015-02-26 11:14:23 -08:00 · f074bb4b5f
commit f074bb4b5f
parent 57154fdb32
1 changed files with 4 additions and 4 deletions
--- a/unsupported/Eigen/CXX11/src/Tensor/TensorIntDiv.h
+++ b/unsupported/Eigen/CXX11/src/Tensor/TensorIntDiv.h
@@ -33,17 +33,17 @@ namespace {
  template <typename T>
  EIGEN_DEVICE_FUNC EIGEN_ALWAYS_INLINE int count_leading_zeros(const T val)
  {
-#ifndef __CUDA_ARCH__
+#ifdef __CUDA_ARCH__
-    return __builtin_clz(static_cast<uint32_t>(val));
+    return __clz(val);
 #elif EIGEN_COMP_MSVC
    DWORD leading_zero = 0;
    _BitScanReverse( &leading_zero, value);
    return 31 - leading_zero;
 #else
-    return __clz(val);
+    return __builtin_clz(static_cast<uint32_t>(val));
 #endif
  }
-};
+}
 template <typename T>
 struct TensorIntDivisor {