mirror of
https://gitlab.com/libeigen/eigen.git
synced 2025-06-04 18:54:00 +08:00
Replace usage of CudaStreamDevice with GpuStreamDevice in the GPU tensor benchmarks
This commit is contained in:
parent
8c43bf2b5b
commit
07e4604b19
@ -10,7 +10,7 @@
|
||||
#define BM_FuncGPU(FUNC) \
|
||||
static void BM_##FUNC(int iters, int N) { \
|
||||
StopBenchmarkTiming(); \
|
||||
Eigen::CudaStreamDevice stream; \
|
||||
Eigen::GpuStreamDevice stream; \
|
||||
Eigen::GpuDevice device(&stream); \
|
||||
BenchmarkSuite<Eigen::GpuDevice, Eigen::half> suite(device, N); \
|
||||
cudaDeviceSynchronize(); \
|
||||
@ -40,7 +40,7 @@ BM_FuncGPU(fullReduction);
|
||||
#define BM_FuncWithInputDimsGPU(FUNC, D1, D2, D3) \
|
||||
static void BM_##FUNC##_##D1##x##D2##x##D3(int iters, int N) { \
|
||||
StopBenchmarkTiming(); \
|
||||
Eigen::CudaStreamDevice stream; \
|
||||
Eigen::GpuStreamDevice stream; \
|
||||
Eigen::GpuDevice device(&stream); \
|
||||
BenchmarkSuite<Eigen::GpuDevice, Eigen::half> suite(device, D1, D2, D3); \
|
||||
cudaDeviceSynchronize(); \
|
||||
@ -59,7 +59,7 @@ BM_FuncWithInputDimsGPU(contraction, N, N, 64);
|
||||
#define BM_FuncWithKernelDimsGPU(FUNC, DIM1, DIM2) \
|
||||
static void BM_##FUNC##_##DIM1##x##DIM2(int iters, int N) { \
|
||||
StopBenchmarkTiming(); \
|
||||
Eigen::CudaStreamDevice stream; \
|
||||
Eigen::GpuStreamDevice stream; \
|
||||
Eigen::GpuDevice device(&stream); \
|
||||
BenchmarkSuite<Eigen::GpuDevice, Eigen::half> suite(device, N); \
|
||||
cudaDeviceSynchronize(); \
|
||||
|
@ -10,7 +10,7 @@
|
||||
#define BM_FuncGPU(FUNC) \
|
||||
static void BM_##FUNC(int iters, int N) { \
|
||||
StopBenchmarkTiming(); \
|
||||
Eigen::CudaStreamDevice stream; \
|
||||
Eigen::GpuStreamDevice stream; \
|
||||
Eigen::GpuDevice device(&stream); \
|
||||
BenchmarkSuite<Eigen::GpuDevice, float> suite(device, N); \
|
||||
cudaDeviceSynchronize(); \
|
||||
@ -40,7 +40,7 @@ BM_FuncGPU(fullReduction);
|
||||
#define BM_FuncWithInputDimsGPU(FUNC, D1, D2, D3) \
|
||||
static void BM_##FUNC##_##D1##x##D2##x##D3(int iters, int N) { \
|
||||
StopBenchmarkTiming(); \
|
||||
Eigen::CudaStreamDevice stream; \
|
||||
Eigen::GpuStreamDevice stream; \
|
||||
Eigen::GpuDevice device(&stream); \
|
||||
BenchmarkSuite<Eigen::GpuDevice, float> suite(device, D1, D2, D3); \
|
||||
cudaDeviceSynchronize(); \
|
||||
@ -59,7 +59,7 @@ BM_FuncWithInputDimsGPU(contraction, N, N, 64);
|
||||
#define BM_FuncWithKernelDimsGPU(FUNC, DIM1, DIM2) \
|
||||
static void BM_##FUNC##_##DIM1##x##DIM2(int iters, int N) { \
|
||||
StopBenchmarkTiming(); \
|
||||
Eigen::CudaStreamDevice stream; \
|
||||
Eigen::GpuStreamDevice stream; \
|
||||
Eigen::GpuDevice device(&stream); \
|
||||
BenchmarkSuite<Eigen::GpuDevice, float> suite(device, N); \
|
||||
cudaDeviceSynchronize(); \
|
||||
|
Loading…
x
Reference in New Issue
Block a user