1
1
#include " module_base/blas_connector.h"
2
2
#include " module_base/constants.h"
3
+ #include " module_base/module_device/memory_op.h"
3
4
#include " module_hsolver/kernels/math_kernel_op.h"
4
5
#include " module_psi/kernels/memory_op.h"
5
6
@@ -37,7 +38,7 @@ class PerfModuleHsolverMathKernel : public benchmark::Fixture {
37
38
public:
38
39
39
40
// DEVICE SYMBOL
40
- const psi ::DEVICE_CPU* cpu_ctx = {};
41
+ const base_device ::DEVICE_CPU* cpu_ctx = {};
41
42
42
43
int dim_vector = 1 ;
43
44
@@ -53,24 +54,24 @@ class PerfModuleHsolverMathKernel : public benchmark::Fixture {
53
54
std::complex<double > zconstant_a = {1.0 ,1.0 };
54
55
55
56
#if __CUDA || __UT_USE_CUDA || __ROCM || __UT_USE_ROCM
56
- const psi ::DEVICE_GPU * gpu_ctx = {};
57
+ const base_device ::DEVICE_GPU * gpu_ctx = {};
57
58
58
59
// from CPU to GPU
59
60
using synchronize_memory_op
60
- = psi ::memory::synchronize_memory_op<std::complex<double >, psi ::DEVICE_GPU, psi ::DEVICE_CPU>;
61
+ = base_device ::memory::synchronize_memory_op<std::complex<double >, base_device ::DEVICE_GPU, base_device ::DEVICE_CPU>;
61
62
62
63
// from GPU to CPU
63
64
using synchronize_memory_op_gpu
64
- = psi ::memory::synchronize_memory_op<std::complex<double >, psi ::DEVICE_CPU, psi ::DEVICE_GPU>;
65
+ = base_device ::memory::synchronize_memory_op<std::complex<double >, base_device ::DEVICE_CPU, base_device ::DEVICE_GPU>;
65
66
66
- using resize_memory_op = psi ::memory::resize_memory_op<std::complex<double >, psi ::DEVICE_GPU>;
67
- using delete_memory_op = psi ::memory::delete_memory_op<std::complex<double >, psi ::DEVICE_GPU>;
68
- using resize_memory_op_double = psi ::memory::resize_memory_op<double , psi ::DEVICE_GPU>;
69
- using delete_memory_op_double = psi ::memory::delete_memory_op<double , psi ::DEVICE_GPU>;
70
- using synchronize_memory_op_double = psi ::memory::synchronize_memory_op<double , psi ::DEVICE_GPU, psi ::DEVICE_CPU>;
67
+ using resize_memory_op = base_device ::memory::resize_memory_op<std::complex<double >, base_device ::DEVICE_GPU>;
68
+ using delete_memory_op = base_device ::memory::delete_memory_op<std::complex<double >, base_device ::DEVICE_GPU>;
69
+ using resize_memory_op_double = base_device ::memory::resize_memory_op<double , base_device ::DEVICE_GPU>;
70
+ using delete_memory_op_double = base_device ::memory::delete_memory_op<double , base_device ::DEVICE_GPU>;
71
+ using synchronize_memory_op_double = base_device ::memory::synchronize_memory_op<double , base_device ::DEVICE_GPU, base_device ::DEVICE_CPU>;
71
72
72
- using set_memory_op = psi ::memory::set_memory_op<std::complex<double >, psi ::DEVICE_GPU>;
73
- using set_memory_op_double = psi ::memory::set_memory_op<double , psi ::DEVICE_GPU>;
73
+ using set_memory_op = base_device ::memory::set_memory_op<std::complex<double >, base_device ::DEVICE_GPU>;
74
+ using set_memory_op_double = base_device ::memory::set_memory_op<double , base_device ::DEVICE_GPU>;
74
75
75
76
std::complex<double >* test_zvector_a_gpu = nullptr ;
76
77
std::complex<double >* test_zvector_b_gpu = nullptr ;
@@ -132,29 +133,29 @@ class PerfModuleHsolverMathKernel : public benchmark::Fixture {
132
133
133
134
// Ops to be benchmarked
134
135
// CPU operator
135
- using zdot_real_cpu_op = hsolver::dot_real_op<std::complex<double >, psi ::DEVICE_CPU>;
136
+ using zdot_real_cpu_op = hsolver::dot_real_op<std::complex<double >, base_device ::DEVICE_CPU>;
136
137
137
- using vector_div_constant_op_cpu = hsolver::vector_div_constant_op<std::complex<double >, psi ::DEVICE_CPU>;
138
- using vector_mul_vector_op_cpu = hsolver::vector_mul_vector_op<std::complex<double >, psi ::DEVICE_CPU>;
139
- using vector_div_vector_op_cpu = hsolver::vector_div_vector_op<std::complex<double >, psi ::DEVICE_CPU>;
138
+ using vector_div_constant_op_cpu = hsolver::vector_div_constant_op<std::complex<double >, base_device ::DEVICE_CPU>;
139
+ using vector_mul_vector_op_cpu = hsolver::vector_mul_vector_op<std::complex<double >, base_device ::DEVICE_CPU>;
140
+ using vector_div_vector_op_cpu = hsolver::vector_div_vector_op<std::complex<double >, base_device ::DEVICE_CPU>;
140
141
using constantvector_addORsub_constantVector_op_cpu
141
- = hsolver::constantvector_addORsub_constantVector_op<std::complex<double >, psi ::DEVICE_CPU>;
142
- using axpy_op_cpu = hsolver::axpy_op<std::complex<double >, psi ::DEVICE_CPU>;
143
- using scal_op_cpu = hsolver::scal_op<double , psi ::DEVICE_CPU>;
144
- using gemv_op_cpu = hsolver::gemv_op<std::complex<double >, psi ::DEVICE_CPU>;
142
+ = hsolver::constantvector_addORsub_constantVector_op<std::complex<double >, base_device ::DEVICE_CPU>;
143
+ using axpy_op_cpu = hsolver::axpy_op<std::complex<double >, base_device ::DEVICE_CPU>;
144
+ using scal_op_cpu = hsolver::scal_op<double , base_device ::DEVICE_CPU>;
145
+ using gemv_op_cpu = hsolver::gemv_op<std::complex<double >, base_device ::DEVICE_CPU>;
145
146
146
147
#if __CUDA || __UT_USE_CUDA || __ROCM || __UT_USE_ROCM
147
148
148
149
// GPU operator
149
- using zdot_real_gpu_op = hsolver::dot_real_op<std::complex<double >, psi ::DEVICE_GPU>;
150
+ using zdot_real_gpu_op = hsolver::dot_real_op<std::complex<double >, base_device ::DEVICE_GPU>;
150
151
151
- using vector_div_constant_op_gpu = hsolver::vector_div_constant_op<std::complex<double >, psi ::DEVICE_GPU>;
152
- using vector_mul_vector_op_gpu = hsolver::vector_mul_vector_op<std::complex<double >, psi ::DEVICE_GPU>;
153
- using vector_div_vector_op_gpu = hsolver::vector_div_vector_op<std::complex<double >, psi ::DEVICE_GPU>;
152
+ using vector_div_constant_op_gpu = hsolver::vector_div_constant_op<std::complex<double >, base_device ::DEVICE_GPU>;
153
+ using vector_mul_vector_op_gpu = hsolver::vector_mul_vector_op<std::complex<double >, base_device ::DEVICE_GPU>;
154
+ using vector_div_vector_op_gpu = hsolver::vector_div_vector_op<std::complex<double >, base_device ::DEVICE_GPU>;
154
155
using constantvector_addORsub_constantVector_op_gpu
155
- = hsolver::constantvector_addORsub_constantVector_op<std::complex<double >, psi ::DEVICE_GPU>;
156
- using axpy_op_gpu = hsolver::axpy_op<std::complex<double >, psi ::DEVICE_GPU>;
157
- using scal_op_gpu = hsolver::scal_op<double , psi ::DEVICE_GPU>;
156
+ = hsolver::constantvector_addORsub_constantVector_op<std::complex<double >, base_device ::DEVICE_GPU>;
157
+ using axpy_op_gpu = hsolver::axpy_op<std::complex<double >, base_device ::DEVICE_GPU>;
158
+ using scal_op_gpu = hsolver::scal_op<double , base_device ::DEVICE_GPU>;
158
159
159
160
#endif // __CUDA || __UT_USE_CUDA || __ROCM || __UT_USE_ROCM
160
161
};
0 commit comments