Replace usage of CudaStreamDevice with GpuStreamDevice in the GPU tensor benchmarks
This commit is contained in:
		
							parent
							
								
									8c43bf2b5b
								
							
						
					
					
						commit
						07e4604b19
					
				| @ -10,7 +10,7 @@ | ||||
| #define BM_FuncGPU(FUNC)                                                       \ | ||||
|   static void BM_##FUNC(int iters, int N) {                                    \ | ||||
|     StopBenchmarkTiming();                                                     \ | ||||
| -    Eigen::CudaStreamDevice stream;                                            \ | ||||
| +    Eigen::GpuStreamDevice stream;                                             \ | ||||
|     Eigen::GpuDevice device(&stream);                                          \ | ||||
|     BenchmarkSuite<Eigen::GpuDevice, Eigen::half> suite(device, N);            \ | ||||
|     cudaDeviceSynchronize();                                                   \ | ||||
| @ -40,7 +40,7 @@ BM_FuncGPU(fullReduction); | ||||
| #define BM_FuncWithInputDimsGPU(FUNC, D1, D2, D3)                              \ | ||||
|   static void BM_##FUNC##_##D1##x##D2##x##D3(int iters, int N) {               \ | ||||
|     StopBenchmarkTiming();                                                     \ | ||||
| -    Eigen::CudaStreamDevice stream;                                            \ | ||||
| +    Eigen::GpuStreamDevice stream;                                             \ | ||||
|     Eigen::GpuDevice device(&stream);                                          \ | ||||
|     BenchmarkSuite<Eigen::GpuDevice, Eigen::half> suite(device, D1, D2, D3);   \ | ||||
|     cudaDeviceSynchronize();                                                   \ | ||||
| @ -59,7 +59,7 @@ BM_FuncWithInputDimsGPU(contraction, N, N, 64); | ||||
| #define BM_FuncWithKernelDimsGPU(FUNC, DIM1, DIM2)                             \ | ||||
|   static void BM_##FUNC##_##DIM1##x##DIM2(int iters, int N) {                  \ | ||||
|     StopBenchmarkTiming();                                                     \ | ||||
| -    Eigen::CudaStreamDevice stream;                                            \ | ||||
| +    Eigen::GpuStreamDevice stream;                                             \ | ||||
|     Eigen::GpuDevice device(&stream);                                          \ | ||||
|     BenchmarkSuite<Eigen::GpuDevice, Eigen::half> suite(device, N);            \ | ||||
|     cudaDeviceSynchronize();                                                   \ | ||||
|  | ||||
| @ -10,7 +10,7 @@ | ||||
| #define BM_FuncGPU(FUNC)                                                       \ | ||||
|   static void BM_##FUNC(int iters, int N) {                                    \ | ||||
|     StopBenchmarkTiming();                                                     \ | ||||
| -    Eigen::CudaStreamDevice stream;                                            \ | ||||
| +    Eigen::GpuStreamDevice stream;                                             \ | ||||
|     Eigen::GpuDevice device(&stream);                                          \ | ||||
|     BenchmarkSuite<Eigen::GpuDevice, float> suite(device, N);                  \ | ||||
|     cudaDeviceSynchronize();                                                   \ | ||||
| @ -40,7 +40,7 @@ BM_FuncGPU(fullReduction); | ||||
| #define BM_FuncWithInputDimsGPU(FUNC, D1, D2, D3)                              \ | ||||
|   static void BM_##FUNC##_##D1##x##D2##x##D3(int iters, int N) {               \ | ||||
|     StopBenchmarkTiming();                                                     \ | ||||
| -    Eigen::CudaStreamDevice stream;                                            \ | ||||
| +    Eigen::GpuStreamDevice stream;                                             \ | ||||
|     Eigen::GpuDevice device(&stream);                                          \ | ||||
|     BenchmarkSuite<Eigen::GpuDevice, float> suite(device, D1, D2, D3);         \ | ||||
|     cudaDeviceSynchronize();                                                   \ | ||||
| @ -59,7 +59,7 @@ BM_FuncWithInputDimsGPU(contraction, N, N, 64); | ||||
| #define BM_FuncWithKernelDimsGPU(FUNC, DIM1, DIM2)                             \ | ||||
|   static void BM_##FUNC##_##DIM1##x##DIM2(int iters, int N) {                  \ | ||||
|     StopBenchmarkTiming();                                                     \ | ||||
| -    Eigen::CudaStreamDevice stream;                                            \ | ||||
| +    Eigen::GpuStreamDevice stream;                                             \ | ||||
|     Eigen::GpuDevice device(&stream);                                          \ | ||||
|     BenchmarkSuite<Eigen::GpuDevice, float> suite(device, N);                  \ | ||||
|     cudaDeviceSynchronize();                                                   \ | ||||
|  | ||||
		Loading…
	
		Reference in New Issue
	
	Block a user
	 Alejandro Acosta
						Alejandro Acosta