Remove the device-context (ctx) parameter from dot_real_op

Critsium-xy · Critsium-xy · commit 937eb35fe1b2 · 2025-02-11T15:55:34.000+08:00
diff --git a/source/module_base/kernels/cuda/math_kernel_op.cu b/source/module_base/kernels/cuda/math_kernel_op.cu
@@ -451,8 +451,7 @@ void calc_grad_with_block_op<T, base_device::DEVICE_GPU>::operator()(const Real*
 }
 
 template <>
-double dot_real_op<double, base_device::DEVICE_GPU>::operator()(const base_device::DEVICE_GPU* d,
-                                                                const int& dim,
+double dot_real_op<double, base_device::DEVICE_GPU>::operator()(const int& dim,
                                                                 const double* psi_L,
                                                                 const double* psi_R,
                                                                 const bool reduce)
@@ -488,17 +487,15 @@ inline FPTYPE dot_complex_wrapper(const base_device::DEVICE_GPU* d,
 }
 
 template <>
-float dot_real_op<std::complex<float>, base_device::DEVICE_GPU>::operator()(const base_device::DEVICE_GPU* d,
-                                                                            const int& dim,
+float dot_real_op<std::complex<float>, base_device::DEVICE_GPU>::operator()(const int& dim,
                                                                             const std::complex<float>* psi_L,
                                                                             const std::complex<float>* psi_R,
                                                                             const bool reduce)
 {
     return dot_complex_wrapper(d, dim, psi_L, psi_R, reduce);
 }
 template <>
-double dot_real_op<std::complex<double>, base_device::DEVICE_GPU>::operator()(const base_device::DEVICE_GPU* d,
-                                                                              const int& dim,
+double dot_real_op<std::complex<double>, base_device::DEVICE_GPU>::operator()(const int& dim,
                                                                               const std::complex<double>* psi_L,
                                                                               const std::complex<double>* psi_R,
                                                                               const bool reduce)
diff --git a/source/module_base/kernels/math_kernel_op.cpp b/source/module_base/kernels/math_kernel_op.cpp
@@ -110,8 +110,7 @@ struct calc_grad_with_block_op<T, base_device::DEVICE_CPU>
 template <typename FPTYPE>
 struct dot_real_op<FPTYPE, base_device::DEVICE_CPU>
 {
-    FPTYPE operator()(const base_device::DEVICE_CPU* d,
-                      const int& dim,
+    FPTYPE operator()(const int& dim,
                       const FPTYPE* psi_L,
                       const FPTYPE* psi_R,
                       const bool reduce)
@@ -129,8 +128,7 @@ struct dot_real_op<FPTYPE, base_device::DEVICE_CPU>
 template <typename FPTYPE>
 struct dot_real_op<std::complex<FPTYPE>, base_device::DEVICE_CPU>
 {
-    FPTYPE operator()(const base_device::DEVICE_CPU* d,
-                      const int& dim,
+    FPTYPE operator()(const int& dim,
                       const std::complex<FPTYPE>* psi_L,
                       const std::complex<FPTYPE>* psi_R,
                       const bool reduce)
diff --git a/source/module_base/kernels/math_kernel_op.h b/source/module_base/kernels/math_kernel_op.h
@@ -98,7 +98,7 @@ template <typename T, typename Device> struct dot_real_op {
   ///
   /// \return
   /// FPTYPE : dot product result
-  Real operator()(const Device *d, const int &dim, const T *psi_L,
+  Real operator()(const int &dim, const T *psi_L,
                   const T *psi_R, const bool reduce = true);
 };
 
@@ -347,7 +347,7 @@ struct calc_grad_with_block_op<T, base_device::DEVICE_GPU> {
 // Partially specialize functor for base_device::GpuDevice.
 template <typename T> struct dot_real_op<T, base_device::DEVICE_GPU> {
   using Real = typename GetTypeReal<T>::type;
-  Real operator()(const base_device::DEVICE_GPU *d, const int &dim,
+  Real operator()(const int &dim,
                   const T *psi_L, const T *psi_R, const bool reduce = true);
 };
 
diff --git a/source/module_base/kernels/rocm/math_kernel_op.hip.cu b/source/module_base/kernels/rocm/math_kernel_op.hip.cu
@@ -374,8 +374,7 @@ void calc_grad_with_block_op<T, base_device::DEVICE_GPU>::operator()(const Real*
 }
 
 template <>
-double dot_real_op<double, base_device::DEVICE_GPU>::operator()(const base_device::DEVICE_GPU* d,
-                                                                const int& dim,
+double dot_real_op<double, base_device::DEVICE_GPU>::operator()(const int& dim,
                                                                 const double* psi_L,
                                                                 const double* psi_R,
                                                                 const bool reduce)
@@ -411,17 +410,15 @@ inline FPTYPE dot_complex_wrapper(const base_device::DEVICE_GPU* d,
     return result;
 }
 template <>
-float dot_real_op<std::complex<float>, base_device::DEVICE_GPU>::operator()(const base_device::DEVICE_GPU* d,
-                                                                            const int& dim,
+float dot_real_op<std::complex<float>, base_device::DEVICE_GPU>::operator()(const int& dim,
                                                                             const std::complex<float>* psi_L,
                                                                             const std::complex<float>* psi_R,
                                                                             const bool reduce)
 {
     return dot_complex_wrapper(d, dim, psi_L, psi_R, reduce);
 }
 template <>
-double dot_real_op<std::complex<double>, base_device::DEVICE_GPU>::operator()(const base_device::DEVICE_GPU* d,
-                                                                              const int& dim,
+double dot_real_op<std::complex<double>, base_device::DEVICE_GPU>::operator()(const int& dim,
                                                                               const std::complex<double>* psi_L,
                                                                               const std::complex<double>* psi_R,
                                                                               const bool reduce)
diff --git a/source/module_base/kernels/test/math_kernel_test.cpp b/source/module_base/kernels/test/math_kernel_test.cpp
@@ -257,7 +257,7 @@ class TestModuleHsolverMathKernel : public ::testing::Test
 // base_device::AbacusDevice_t device = base_device::CpuDevice, const bool reduce = true);
 TEST_F(TestModuleHsolverMathKernel, zdot_real_op_cpu)
 {
-    double result = zdot_real_cpu_op()(cpu_ctx, dim, psi_L.data(), psi_R.data(), false);
+    double result = zdot_real_cpu_op()(dim, psi_L.data(), psi_R.data(), false);
     EXPECT_LT(fabs(result - expected_result), 1e-12);
 }
 
@@ -376,7 +376,7 @@ TEST_F(TestModuleHsolverMathKernel, zdot_real_op_gpu)
     synchronize_memory_op()(psi_L_dev, psi_L.data(), psi_L.size());
     synchronize_memory_op()(psi_R_dev, psi_R.data(), psi_R.size());
     ModuleBase::createGpuBlasHandle();
-    double result = zdot_real_gpu_op()(gpu_ctx, dim, psi_L_dev, psi_R_dev, false);
+    double result = zdot_real_gpu_op()(dim, psi_L_dev, psi_R_dev, false);
     ModuleBase::destoryBLAShandle();
     EXPECT_LT(fabs(result - expected_result), 1e-12);
     delete_memory_op()(psi_L_dev);
diff --git a/source/module_hsolver/diago_cg.cpp b/source/module_hsolver/diago_cg.cpp
@@ -127,7 +127,7 @@ void DiagoCG<T, Device>::diag_mock(const ct::Tensor& prec_in,
         this->spsi_func_(phi_m, sphi); // sphi = S|psi(m)>
         this->hpsi_func_(phi_m, hphi); // hphi = H|psi(m)>
 
-        eigen_pack[m] = dot_real_op()(ctx_, this->n_basis_, phi_m.data<T>(), hphi.data<T>());
+        eigen_pack[m] = dot_real_op()(this->n_basis_, phi_m.data<T>(), hphi.data<T>());
 
         int iter = 0;
         Real gg_last = 0.0;
@@ -231,9 +231,9 @@ void DiagoCG<T, Device>::calc_grad(const ct::Tensor& prec,
 
     // Update lambda !
     // (4) <psi|SPH|psi >
-    const Real eh = ModuleBase::dot_real_op<T, Device>()(ctx_, this->n_basis_, sphi.data<T>(), grad.data<T>());
+    const Real eh = ModuleBase::dot_real_op<T, Device>()(this->n_basis_, sphi.data<T>(), grad.data<T>());
     // (5) <psi|SPS|psi >
-    const Real es = ModuleBase::dot_real_op<T, Device>()(ctx_, this->n_basis_, sphi.data<T>(), pphi.data<T>());
+    const Real es = ModuleBase::dot_real_op<T, Device>()(this->n_basis_, sphi.data<T>(), pphi.data<T>());
     const Real lambda = eh / es;
 
     // Update g!
@@ -328,7 +328,7 @@ void DiagoCG<T, Device>::calc_gamma_cg(const int& iter,
         // gg_inter = <g|g0>
         // Attention : the 'g' in g0 is getted last time
         gg_inter
-            = ModuleBase::dot_real_op<T, Device>()(ctx_, this->n_basis_, grad.data<T>(), g0.data<T>()); // b means before
+            = ModuleBase::dot_real_op<T, Device>()(this->n_basis_, grad.data<T>(), g0.data<T>()); // b means before
     }
 
     // (2) Update for g0!
@@ -346,7 +346,7 @@ void DiagoCG<T, Device>::calc_gamma_cg(const int& iter,
 
     // (3) Update gg_now!
     // gg_now = < g|P|scg > = < g|g0 >
-    const Real gg_now = ModuleBase::dot_real_op<T, Device>()(ctx_, this->n_basis_, grad.data<T>(), g0.data<T>());
+    const Real gg_now = ModuleBase::dot_real_op<T, Device>()(this->n_basis_, grad.data<T>(), g0.data<T>());
 
     if (iter == 0)
     {
@@ -404,15 +404,15 @@ bool DiagoCG<T, Device>::update_psi(const ct::Tensor& pphi,
                                     ct::Tensor& sphi,
                                     ct::Tensor& hphi)
 {
-    cg_norm = sqrt(ModuleBase::dot_real_op<T, Device>()(ctx_, this->n_basis_, cg.data<T>(), scg.data<T>()));
+    cg_norm = sqrt(ModuleBase::dot_real_op<T, Device>()(this->n_basis_, cg.data<T>(), scg.data<T>()));
 
     if (cg_norm < 1.0e-10)
         return true;
 
     const Real a0
-        = ModuleBase::dot_real_op<T, Device>()(ctx_, this->n_basis_, phi_m.data<T>(), pphi.data<T>()) * 2.0 / cg_norm;
+        = ModuleBase::dot_real_op<T, Device>()(this->n_basis_, phi_m.data<T>(), pphi.data<T>()) * 2.0 / cg_norm;
     const Real b0
-        = ModuleBase::dot_real_op<T, Device>()(ctx_, this->n_basis_, cg.data<T>(), pphi.data<T>()) / (cg_norm * cg_norm);
+        = ModuleBase::dot_real_op<T, Device>()(this->n_basis_, cg.data<T>(), pphi.data<T>()) / (cg_norm * cg_norm);
 
     const Real e0 = eigen;
     theta = atan(a0 / (e0 - b0)) / 2.0;
@@ -538,7 +538,7 @@ void DiagoCG<T, Device>::schmit_orth(const int& m, const ct::Tensor& psi, const
     }*/
     //>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
     auto psi_norm = ct::extract<Real>(lagrange_so[m])
-                    - dot_real_op()(ctx_, m, lagrange_so.data<T>(), lagrange_so.data<T>(), false);
+                    - dot_real_op()(m, lagrange_so.data<T>(), lagrange_so.data<T>(), false);
 
     if (psi_norm <= 0.0)
     {
diff --git a/source/module_hsolver/diago_dav_subspace.cpp b/source/module_hsolver/diago_dav_subspace.cpp
@@ -375,8 +375,7 @@ void Diago_DavSubspace<T, Device>::cal_grad(const HPsiFunc& hpsi_func,
     std::vector<Real> psi_norm(notconv, 0.0);
     for (size_t i = 0; i < notconv; i++)
     {
-        psi_norm[i] = ModuleBase::dot_real_op<T, Device>()(this->ctx,
-                                                           this->dim,
+        psi_norm[i] = ModuleBase::dot_real_op<T, Device>()(this->dim,
                                                            psi_iter + (nbase + i) * this->dim,
                                                            psi_iter + (nbase + i) * this->dim,
                                                            true);
diff --git a/source/module_hsolver/diago_david.cpp b/source/module_hsolver/diago_david.cpp
@@ -953,7 +953,7 @@ void DiagoDavid<T, Device>::SchmidtOrth(const int& dim,
                                      1);
 
     // psi_norm = psi_norm - lagrange_m · lagrange_m
-    psi_norm -= ModuleBase::dot_real_op<T, Device>()(this->ctx, m, lagrange_m, lagrange_m, false);
+    psi_norm -= ModuleBase::dot_real_op<T, Device>()(m, lagrange_m, lagrange_m, false);
 
     // for (int j = 0; j < m; j++)
     // {
diff --git a/source/module_hsolver/kernels/test/perf_math_kernel.cpp b/source/module_hsolver/kernels/test/perf_math_kernel.cpp
@@ -162,7 +162,7 @@ class PerfModuleHsolverMathKernel : public benchmark::Fixture {
 
 BENCHMARK_DEFINE_F(PerfModuleHsolverMathKernel, BM_zdot_real_cpu_op)(benchmark::State& state) {
     for (auto _ : state) {
-        double result = zdot_real_cpu_op()(cpu_ctx, dim_vector, test_zvector_a, test_zvector_b, false);
+        double result = zdot_real_cpu_op()(dim_vector, test_zvector_a, test_zvector_b, false);
     }
 }
 
@@ -232,7 +232,7 @@ BENCHMARK_DEFINE_F(PerfModuleHsolverMathKernel, BM_zdot_real_gpu_op)(benchmark::
 
 BENCHMARK_DEFINE_F(PerfModuleHsolverMathKernel, BM_zdot_real_gpu_op)(benchmark::State& state) {
     for (auto _ : state) {
-        double result = zdot_real_gpu_op()(gpu_ctx, dim_vector, test_zvector_a_gpu, test_zvector_b_gpu, false);
+        double result = zdot_real_gpu_op()(dim_vector, test_zvector_a_gpu, test_zvector_b_gpu, false);
     }
 }
 

Original file line number	Diff line number	Diff line change
`@@ -162,7 +162,7 @@ class PerfModuleHsolverMathKernel : public benchmark::Fixture {`
`162`	`162`
`163`	`163`	`BENCHMARK_DEFINE_F(PerfModuleHsolverMathKernel, BM_zdot_real_cpu_op)(benchmark::State& state) {`
`164`	`164`	`for (auto _ : state) {`
`165`		`- double result = zdot_real_cpu_op()(cpu_ctx, dim_vector, test_zvector_a, test_zvector_b, false);`
	`165`	`+ double result = zdot_real_cpu_op()(dim_vector, test_zvector_a, test_zvector_b, false);`
`166`	`166`	`}`
`167`	`167`	`}`
`168`	`168`
`@@ -232,7 +232,7 @@ BENCHMARK_DEFINE_F(PerfModuleHsolverMathKernel, BM_zdot_real_gpu_op)(benchmark::`
`232`	`232`
`233`	`233`	`BENCHMARK_DEFINE_F(PerfModuleHsolverMathKernel, BM_zdot_real_gpu_op)(benchmark::State& state) {`
`234`	`234`	`for (auto _ : state) {`
`235`		`- double result = zdot_real_gpu_op()(gpu_ctx, dim_vector, test_zvector_a_gpu, test_zvector_b_gpu, false);`
	`235`	`+ double result = zdot_real_gpu_op()(dim_vector, test_zvector_a_gpu, test_zvector_b_gpu, false);`
`236`	`236`	`}`
`237`	`237`	`}`
`238`	`238`