Merged eigen/eigen into default

2025-07-01 18:55:11 +08:00 · 2016-11-01 15:37:00 -07:00 · 2016-11-01 15:37:00 -07:00 · 0a6ae41555
commit 0a6ae41555
parent b730952414 7a0e96b80d
8 changed files with 38 additions and 35 deletions
--- a/Eigen/src/Core/arch/CUDA/PacketMathHalf.h
+++ b/Eigen/src/Core/arch/CUDA/PacketMathHalf.h
@ -15,7 +15,7 @@ namespace Eigen {
 namespace internal {
 // Most of the following operations require arch >= 3.0
-#if defined(EIGEN_HAS_CUDA_FP16) && defined(__CUDA_ARCH__) && __CUDA_ARCH__ >= 300
+#if defined(EIGEN_HAS_CUDA_FP16) && defined(__CUDACC__) && defined(__CUDA_ARCH__) && __CUDA_ARCH__ >= 300
 template<> struct is_arithmetic<half2> { enum { value = true }; };
--- a/unsupported/Eigen/CXX11/src/Tensor/TensorEvalTo.h
+++ b/unsupported/Eigen/CXX11/src/Tensor/TensorEvalTo.h
@ -38,7 +38,9 @@ struct traits<TensorEvalToOp<XprType, MakePointer_> >
  };
  template <class T>
  struct MakePointer {
-    typedef typename MakePointer_<T>::Type Type;
+    // Intermediate typedef to workaround MSVC issue.
    typedef MakePointer_<T> MakePointerT;
    typedef typename MakePointerT::Type Type;
  };
 };
--- a/unsupported/Eigen/CXX11/src/Tensor/TensorForcedEval.h
+++ b/unsupported/Eigen/CXX11/src/Tensor/TensorForcedEval.h
@ -42,9 +42,10 @@ struct traits<TensorForcedEvalOp<XprType, MakePointer_> >
  enum {
    Flags = 0
  };
-  template <class T>
+  template <class T> struct MakePointer {
-  struct MakePointer {
+    // Intermediate typedef to workaround MSVC issue.
-    typedef typename MakePointer_<T>::Type Type;
+    typedef MakePointer_<T> MakePointerT;
    typedef typename MakePointerT::Type Type;
  };
 };
--- a/unsupported/Eigen/CXX11/src/Tensor/TensorTraits.h
+++ b/unsupported/Eigen/CXX11/src/Tensor/TensorTraits.h
@ -142,16 +142,16 @@ struct eval<const TensorFixedSize<Scalar_, Dimensions, Options, IndexType_>, Eig
  typedef const TensorFixedSize<Scalar_, Dimensions, Options, IndexType_>& type;
 };
-template<typename PlainObjectType, int Options>
+template<typename PlainObjectType, int Options, template <class> class MakePointer>
-struct eval<TensorMap<PlainObjectType, Options>, Eigen::Dense>
+struct eval<TensorMap<PlainObjectType, Options, MakePointer>, Eigen::Dense>
 {
-  typedef const TensorMap<PlainObjectType, Options>& type;
+  typedef const TensorMap<PlainObjectType, Options, MakePointer>& type;
 };
-template<typename PlainObjectType, int Options>
+template<typename PlainObjectType, int Options, template <class> class MakePointer>
-struct eval<const TensorMap<PlainObjectType, Options>, Eigen::Dense>
+struct eval<const TensorMap<PlainObjectType, Options, MakePointer>, Eigen::Dense>
 {
-  typedef const TensorMap<PlainObjectType, Options>& type;
+  typedef const TensorMap<PlainObjectType, Options, MakePointer>& type;
 };
 template<typename PlainObjectType>
@ -197,16 +197,16 @@ struct nested<const TensorFixedSize<Scalar_, Dimensions, Options, IndexType_> >
 };
-template <typename PlainObjectType, int Options>
+template <typename PlainObjectType, int Options, template <class> class MakePointer>
-struct nested<TensorMap<PlainObjectType, Options> >
+struct nested<TensorMap<PlainObjectType, Options, MakePointer> >
 {
-  typedef const TensorMap<PlainObjectType, Options>& type;
+  typedef const TensorMap<PlainObjectType, Options, MakePointer>& type;
 };
-template <typename PlainObjectType, int Options>
+template <typename PlainObjectType, int Options, template <class> class MakePointer>
-struct nested<const TensorMap<PlainObjectType, Options> >
+struct nested<const TensorMap<PlainObjectType, Options, MakePointer> >
 {
-  typedef const TensorMap<PlainObjectType, Options>& type;
+  typedef const TensorMap<PlainObjectType, Options, MakePointer>& type;
 };
 template <typename PlainObjectType>
--- a/unsupported/test/cxx11_tensor_contract_cuda.cu
+++ b/unsupported/test/cxx11_tensor_contract_cuda.cu
@ -69,7 +69,7 @@ void test_cuda_contraction(int m_size, int k_size, int n_size)
  t_result = t_left.contract(t_right, dims);
  cudaMemcpy(t_result_gpu.data(), d_t_result, t_result_bytes, cudaMemcpyDeviceToHost);
-  for (size_t i = 0; i < t_result.size(); i++) {
+  for (DenseIndex i = 0; i < t_result.size(); i++) {
    if (fabs(t_result(i) - t_result_gpu(i)) < 1e-4f) {
      continue;
    }
--- a/unsupported/test/cxx11_tensor_cuda.cu
+++ b/unsupported/test/cxx11_tensor_cuda.cu
@ -303,8 +303,8 @@ void test_cuda_contraction()
  cudaMemcpy(t_result.data(), d_t_result, t_result_bytes, cudaMemcpyDeviceToHost);
-  for (size_t i = 0; i < t_result.dimensions().TotalSize(); i++) {
+  for (DenseIndex i = 0; i < t_result.size(); i++) {
-    if (fabs(t_result.data()[i] - m_result.data()[i]) >= 1e-4) {
+    if (fabs(t_result.data()[i] - m_result.data()[i]) >= 1e-4f) {
      std::cout << "mismatch detected at index " << i << ": " << t_result.data()[i] << " vs " <<  m_result.data()[i] << std::endl;
      assert(false);
    }
--- a/unsupported/test/cxx11_tensor_image_patch.cpp
+++ b/unsupported/test/cxx11_tensor_image_patch.cpp
@ -13,7 +13,7 @@
 using Eigen::Tensor;
-static void test_simple_patch()
+void test_simple_patch()
 {
  Tensor<float, 4> tensor(2,3,5,7);
  tensor.setRandom();
@ -180,7 +180,7 @@ static void test_simple_patch()
 }
 // Verifies VALID padding (no padding) with incrementing values.
-static void test_patch_padding_valid()
+void test_patch_padding_valid()
 {
  int input_depth = 3;
  int input_rows = 3;
@ -256,7 +256,7 @@ static void test_patch_padding_valid()
 }
 // Verifies VALID padding (no padding) with the same value.
-static void test_patch_padding_valid_same_value()
+void test_patch_padding_valid_same_value()
 {
  int input_depth = 1;
  int input_rows = 5;
@ -329,7 +329,7 @@ static void test_patch_padding_valid_same_value()
 }
 // Verifies SAME padding.
-static void test_patch_padding_same()
+void test_patch_padding_same()
 {
  int input_depth = 3;
  int input_rows = 4;
@ -405,7 +405,7 @@ static void test_patch_padding_same()
  }
 }
-static void test_patch_no_extra_dim()
+void test_patch_no_extra_dim()
 {
  Tensor<float, 3> tensor(2,3,5);
  tensor.setRandom();
@ -553,7 +553,7 @@ static void test_patch_no_extra_dim()
  }
 }
-static void test_imagenet_patches()
+void test_imagenet_patches()
 {
  // Test the code on typical configurations used by the 'imagenet' benchmarks at
  // https://github.com/soumith/convnet-benchmarks
@ -748,10 +748,10 @@ static void test_imagenet_patches()
 void test_cxx11_tensor_image_patch()
 {
-  CALL_SUBTEST(test_simple_patch());
+  CALL_SUBTEST_1(test_simple_patch());
-  CALL_SUBTEST(test_patch_no_extra_dim());
+  CALL_SUBTEST_2(test_patch_no_extra_dim());
-  CALL_SUBTEST(test_patch_padding_valid());
+  CALL_SUBTEST_3(test_patch_padding_valid());
-  CALL_SUBTEST(test_patch_padding_valid_same_value());
+  CALL_SUBTEST_4(test_patch_padding_valid_same_value());
-  CALL_SUBTEST(test_patch_padding_same());
+  CALL_SUBTEST_5(test_patch_padding_same());
-  CALL_SUBTEST(test_imagenet_patches());
+  CALL_SUBTEST_6(test_imagenet_patches());
 }
--- a/unsupported/test/cxx11_tensor_scan_cuda.cu
+++ b/unsupported/test/cxx11_tensor_scan_cuda.cu
@ -55,7 +55,7 @@ void test_cuda_cumsum(int m_size, int k_size, int n_size)
  t_result = t_input.cumsum(1);
  cudaMemcpy(t_result_gpu.data(), d_t_result, t_result_bytes, cudaMemcpyDeviceToHost);
-  for (size_t i = 0; i < t_result.size(); i++) {
+  for (DenseIndex i = 0; i < t_result.size(); i++) {
    if (fabs(t_result(i) - t_result_gpu(i)) < 1e-4f) {
      continue;
    }