deepmodeling
diff --git a/source/module_esolver/esolver_ks_lcao_tddft.cpp b/source/module_esolver/esolver_ks_lcao_tddft.cpp
Lines changed: 2 additions & 0 deletions
diff --git a/source/module_esolver/esolver_ks_lcao_tddft.h b/source/module_esolver/esolver_ks_lcao_tddft.h
Lines changed: 0 additions & 1 deletion
diff --git a/source/module_hamilt_lcao/module_tddft/band_energy.cpp b/source/module_hamilt_lcao/module_tddft/band_energy.cpp
Lines changed: 25 additions & 20 deletions
diff --git a/source/module_hamilt_lcao/module_tddft/band_energy.h b/source/module_hamilt_lcao/module_tddft/band_energy.h
Lines changed: 6 additions & 3 deletions
diff --git a/source/module_hamilt_lcao/module_tddft/evolve_elec.cpp b/source/module_hamilt_lcao/module_tddft/evolve_elec.cpp
Lines changed: 4 additions & 0 deletions
diff --git a/source/module_hamilt_lcao/module_tddft/evolve_elec.h b/source/module_hamilt_lcao/module_tddft/evolve_elec.h
Lines changed: 3 additions & 2 deletions
@@ -106,6 +106,7 @@ void ESolver_KS_LCAO_TDDFT<Device>::hamilt2density_single(UnitCell& ucell,
                                                          this->Hk_laststep,
                                                          this->Sk_laststep,
                                                          this->pelec->ekb,
+                                                         GlobalV::ofs_running,
                                                          td_htype,
                                                          PARAM.inp.propagator,
                                                          use_tensor,
@@ -127,6 +128,7 @@ void ESolver_KS_LCAO_TDDFT<Device>::hamilt2density_single(UnitCell& ucell,
                                                      this->Hk_laststep,
                                                      this->Sk_laststep,
                                                      this->pelec->ekb,
+                                                     GlobalV::ofs_running,
                                                      td_htype,
                                                      PARAM.inp.propagator,
                                                      use_tensor,
 
@@ -45,7 +45,6 @@ void gatherMatrix(const int myid, const int root_proc, const hamilt::MatrixBlock
     // Call the Cpxgemr2d function in ScaLAPACK to collect the matrix data
     Cpxgemr2d(nrows, ncols, mat_l.p, 1, 1, const_cast<int*>(desca), mat_g.p.get(), 1, 1, mat_g.desc.get(), ctxt);
 }
-
 //------------------------ MPI gathering and distributing functions ------------------------//
 
 template <typename Device = base_device::DEVICE_CPU>
 
@@ -25,7 +25,8 @@ void compute_ekb(const Parallel_Orbitals* pv,
                  const int nlocal,
                  const std::complex<double>* Htmp,
                  const std::complex<double>* psi_k,
-                 double* ekb)
+                 double* ekb,
+                 std::ofstream& ofs_running)
 {
 
     std::complex<double>* tmp1 = new std::complex<double>[pv->nloc_wfc];
@@ -76,10 +77,10 @@ void compute_ekb(const Parallel_Orbitals* pv,
 
     if (PARAM.inp.td_print_eij > 0.0)
     {
-        GlobalV::ofs_running
+        ofs_running
             << "------------------------------------------------------------------------------------------------"
             << std::endl;
-        GlobalV::ofs_running << " Eij:" << std::endl;
+        ofs_running << " Eij:" << std::endl;
         for (int i = 0; i < pv->nrow_bands; i++)
         {
             for (int j = 0; j < pv->ncol_bands; j++)
@@ -98,12 +99,12 @@ void compute_ekb(const Parallel_Orbitals* pv,
                 }
                 if (aa > 0.0 || bb > 0.0)
                 {
-                    GlobalV::ofs_running << i << " " << j << " " << aa << "+" << bb << "i " << std::endl;
+                    ofs_running << i << " " << j << " " << aa << "+" << bb << "i " << std::endl;
                 }
             }
         }
-        GlobalV::ofs_running << std::endl;
-        GlobalV::ofs_running
+        ofs_running << std::endl;
+        ofs_running
             << "------------------------------------------------------------------------------------------------"
             << std::endl;
     }
@@ -156,7 +157,8 @@ void compute_ekb_tensor(const Parallel_Orbitals* pv,
                         const int nlocal,
                         const ct::Tensor& Htmp,
                         const ct::Tensor& psi_k,
-                        ct::Tensor& ekb)
+                        ct::Tensor& ekb,
+                        std::ofstream& ofs_running)
 {
     // Create Tensor objects for temporary data
     ct::Tensor tmp1(ct::DataType::DT_COMPLEX_DOUBLE, ct::DeviceType::CpuDevice, ct::TensorShape({pv->nloc_wfc}));
@@ -209,10 +211,10 @@ void compute_ekb_tensor(const Parallel_Orbitals* pv,
 
     if (PARAM.inp.td_print_eij >= 0.0)
     {
-        GlobalV::ofs_running
+        ofs_running
             << "------------------------------------------------------------------------------------------------"
             << std::endl;
-        GlobalV::ofs_running << " Eij:" << std::endl;
+        ofs_running << " Eij:" << std::endl;
         for (int i = 0; i < pv->nrow_bands; i++)
         {
             for (int j = 0; j < pv->ncol_bands; j++)
@@ -231,12 +233,12 @@ void compute_ekb_tensor(const Parallel_Orbitals* pv,
                 }
                 if (aa > 0.0 || bb > 0.0)
                 {
-                    GlobalV::ofs_running << i << " " << j << " " << aa << "+" << bb << "i " << std::endl;
+                    ofs_running << i << " " << j << " " << aa << "+" << bb << "i " << std::endl;
                 }
             }
         }
-        GlobalV::ofs_running << std::endl;
-        GlobalV::ofs_running
+        ofs_running << std::endl;
+        ofs_running
             << "------------------------------------------------------------------------------------------------"
             << std::endl;
     }
@@ -290,7 +292,8 @@ void compute_ekb_tensor_lapack(const Parallel_Orbitals* pv,
                                const int nlocal,
                                const ct::Tensor& Htmp,
                                const ct::Tensor& psi_k,
-                               ct::Tensor& ekb)
+                               ct::Tensor& ekb,
+                               std::ofstream& ofs_running)
 {
     // ct_device_type = ct::DeviceType::CpuDevice or ct::DeviceType::GpuDevice
     ct::DeviceType ct_device_type = ct::DeviceTypeToEnum<Device>::value;
@@ -346,10 +349,10 @@ void compute_ekb_tensor_lapack(const Parallel_Orbitals* pv,
     {
         ct::Tensor Eij_cpu = Eij.to_device<ct::DEVICE_CPU>();
 
-        GlobalV::ofs_running
+        ofs_running
             << "------------------------------------------------------------------------------------------------"
             << std::endl;
-        GlobalV::ofs_running << " Eij:" << std::endl;
+        ofs_running << " Eij:" << std::endl;
         for (int i = 0; i < nband; i++)
         {
             for (int j = 0; j < nband; j++)
@@ -368,12 +371,12 @@ void compute_ekb_tensor_lapack(const Parallel_Orbitals* pv,
                 }
                 if (aa > 0.0 || bb > 0.0)
                 {
-                    GlobalV::ofs_running << i << " " << j << " " << aa << "+" << bb << "i " << std::endl;
+                    ofs_running << i << " " << j << " " << aa << "+" << bb << "i " << std::endl;
                 }
             }
         }
-        GlobalV::ofs_running << std::endl;
-        GlobalV::ofs_running
+        ofs_running << std::endl;
+        ofs_running
             << "------------------------------------------------------------------------------------------------"
             << std::endl;
     }
@@ -406,15 +409,17 @@ template void compute_ekb_tensor_lapack<base_device::DEVICE_CPU>(const Parallel_
                                                                  const int nlocal,
                                                                  const ct::Tensor& Htmp,
                                                                  const ct::Tensor& psi_k,
-                                                                 ct::Tensor& ekb);
+                                                                 ct::Tensor& ekb,
+                                                                 std::ofstream& ofs_running);
 
 #if ((defined __CUDA) /* || (defined __ROCM) */)
 template void compute_ekb_tensor_lapack<base_device::DEVICE_GPU>(const Parallel_Orbitals* pv,
                                                                  const int nband,
                                                                  const int nlocal,
                                                                  const ct::Tensor& Htmp,
                                                                  const ct::Tensor& psi_k,
-                                                                 ct::Tensor& ekb);
+                                                                 ct::Tensor& ekb,
+                                                                 std::ofstream& ofs_running);
 #endif // __CUDA
 #endif // __MPI
 
 
@@ -29,22 +29,25 @@ void compute_ekb(const Parallel_Orbitals* pv,
                  const int nlocal,
                  const std::complex<double>* Htmp,
                  const std::complex<double>* psi_k,
-                 double* ekb);
+                 double* ekb,
+                 std::ofstream& ofs_running);
 
 void compute_ekb_tensor(const Parallel_Orbitals* pv,
                         const int nband,
                         const int nlocal,
                         const ct::Tensor& Htmp,
                         const ct::Tensor& psi_k,
-                        ct::Tensor& ekb);
+                        ct::Tensor& ekb,
+                        std::ofstream& ofs_running);
 
 template <typename Device>
 void compute_ekb_tensor_lapack(const Parallel_Orbitals* pv,
                                const int nband,
                                const int nlocal,
                                const ct::Tensor& Htmp,
                                const ct::Tensor& psi_k,
-                               ct::Tensor& ekb);
+                               ct::Tensor& ekb,
+                               std::ofstream& ofs_running);
 #endif // __MPI
 } // namespace module_tddft
 #endif
@@ -31,6 +31,7 @@ void Evolve_elec<Device>::solve_psi(const int& istep,
                                     std::complex<double>** Hk_laststep,
                                     std::complex<double>** Sk_laststep,
                                     ModuleBase::matrix& ekb,
+                                    std::ofstream& ofs_running,
                                     const int htype,
                                     const int propagator,
                                     const bool use_tensor,
@@ -62,6 +63,7 @@ void Evolve_elec<Device>::solve_psi(const int& istep,
                        &(ekb(ik, 0)),
                        htype,
                        propagator,
+                       ofs_running,
                        print_matrix);
         }
         else if (htype == 1)
@@ -79,6 +81,7 @@ void Evolve_elec<Device>::solve_psi(const int& istep,
                            &(ekb(ik, 0)),
                            htype,
                            propagator,
+                           ofs_running,
                            print_matrix);
                 // std::cout << "Print ekb: " << std::endl;
                 // ekb.print(std::cout);
@@ -161,6 +164,7 @@ void Evolve_elec<Device>::solve_psi(const int& istep,
                                           ekb_tensor,
                                           htype,
                                           propagator,
+                                          ofs_running,
                                           print_matrix,
                                           use_lapack);
 
 
@@ -92,6 +92,7 @@ inline void print_tensor_data<std::complex<double>>(const ct::Tensor& tensor, co
 namespace module_tddft
 {
 #ifdef __MPI
+//------------------------ MPI gathering and distributing functions ------------------------//
 template <typename T>
 void gatherPsi(const int myid,
                const int root_proc,
@@ -133,13 +134,12 @@ void distributePsi(const Parallel_Orbitals& para_orb, T* psi_l, const ModuleESol
     // Call the Cpxgemr2d function in ScaLAPACK to distribute the matrix data
     Cpxgemr2d(nrows, ncols, psi_g.p.get(), 1, 1, psi_g.desc.get(), psi_l, 1, 1, const_cast<int*>(desc_psi), ctxt);
 }
+//------------------------ MPI gathering and distributing functions ------------------------//
 #endif // __MPI
 
 template <typename Device = base_device::DEVICE_CPU>
 class Evolve_elec
 {
-
-    friend class ELEC_scf;
     friend class ModuleESolver::ESolver_KS_LCAO<std::complex<double>, double>;
 
     // Template parameter is needed for the friend class declaration
@@ -161,6 +161,7 @@ class Evolve_elec
                           std::complex<double>** Hk_laststep,
                           std::complex<double>** Sk_laststep,
                           ModuleBase::matrix& ekb,
+                          std::ofstream& ofs_running,
                           const int htype,
                           const int propagator,
                           const bool use_tensor,
Original file line number	Diff line number	Diff line change
`@@ -45,7 +45,6 @@ void gatherMatrix(const int myid, const int root_proc, const hamilt::MatrixBlock`
`45`	`45`	`// Call the Cpxgemr2d function in ScaLAPACK to collect the matrix data`
`46`	`46`	`Cpxgemr2d(nrows, ncols, mat_l.p, 1, 1, const_cast<int*>(desca), mat_g.p.get(), 1, 1, mat_g.desc.get(), ctxt);`
`47`	`47`	`}`
`48`		`-`
`49`	`48`	`//------------------------ MPI gathering and distributing functions ------------------------//`
`50`	`49`
`51`	`50`	`template <typename Device = base_device::DEVICE_CPU>`
Original file line number	Diff line number	Diff line change
`@@ -25,7 +25,8 @@ void compute_ekb(const Parallel_Orbitals* pv,`
`25`	`25`	`const int nlocal,`
`26`	`26`	`const std::complex<double>* Htmp,`
`27`	`27`	`const std::complex<double>* psi_k,`
`28`		`- double* ekb)`
	`28`	`+ double* ekb,`
	`29`	`+ std::ofstream& ofs_running)`
`29`	`30`	`{`
`30`	`31`
`31`	`32`	`std::complex<double>* tmp1 = new std::complex<double>[pv->nloc_wfc];`
`@@ -76,10 +77,10 @@ void compute_ekb(const Parallel_Orbitals* pv,`
`76`	`77`
`77`	`78`	`if (PARAM.inp.td_print_eij > 0.0)`
`78`	`79`	`{`
`79`		`- GlobalV::ofs_running`
	`80`	`+ ofs_running`
`80`	`81`	`<< "------------------------------------------------------------------------------------------------"`
`81`	`82`	`<< std::endl;`
`82`		`- GlobalV::ofs_running << " Eij:" << std::endl;`
	`83`	`+ ofs_running << " Eij:" << std::endl;`
`83`	`84`	`for (int i = 0; i < pv->nrow_bands; i++)`
`84`	`85`	`{`
`85`	`86`	`for (int j = 0; j < pv->ncol_bands; j++)`
`@@ -98,12 +99,12 @@ void compute_ekb(const Parallel_Orbitals* pv,`
`98`	`99`	`}`
`99`	`100`	`if (aa > 0.0 || bb > 0.0)`
`100`	`101`	`{`
`101`		`- GlobalV::ofs_running << i << " " << j << " " << aa << "+" << bb << "i " << std::endl;`
	`102`	`+ ofs_running << i << " " << j << " " << aa << "+" << bb << "i " << std::endl;`
`102`	`103`	`}`
`103`	`104`	`}`
`104`	`105`	`}`
`105`		`- GlobalV::ofs_running << std::endl;`
`106`		`- GlobalV::ofs_running`
	`106`	`+ ofs_running << std::endl;`
	`107`	`+ ofs_running`
`107`	`108`	`<< "------------------------------------------------------------------------------------------------"`
`108`	`109`	`<< std::endl;`
`109`	`110`	`}`
`@@ -156,7 +157,8 @@ void compute_ekb_tensor(const Parallel_Orbitals* pv,`
`156`	`157`	`const int nlocal,`
`157`	`158`	`const ct::Tensor& Htmp,`
`158`	`159`	`const ct::Tensor& psi_k,`
`159`		`- ct::Tensor& ekb)`
	`160`	`+ ct::Tensor& ekb,`
	`161`	`+ std::ofstream& ofs_running)`
`160`	`162`	`{`
`161`	`163`	`// Create Tensor objects for temporary data`
`162`	`164`	`ct::Tensor tmp1(ct::DataType::DT_COMPLEX_DOUBLE, ct::DeviceType::CpuDevice, ct::TensorShape({pv->nloc_wfc}));`
`@@ -209,10 +211,10 @@ void compute_ekb_tensor(const Parallel_Orbitals* pv,`
`209`	`211`
`210`	`212`	`if (PARAM.inp.td_print_eij >= 0.0)`
`211`	`213`	`{`
`212`		`- GlobalV::ofs_running`
	`214`	`+ ofs_running`
`213`	`215`	`<< "------------------------------------------------------------------------------------------------"`
`214`	`216`	`<< std::endl;`
`215`		`- GlobalV::ofs_running << " Eij:" << std::endl;`
	`217`	`+ ofs_running << " Eij:" << std::endl;`
`216`	`218`	`for (int i = 0; i < pv->nrow_bands; i++)`
`217`	`219`	`{`
`218`	`220`	`for (int j = 0; j < pv->ncol_bands; j++)`
`@@ -231,12 +233,12 @@ void compute_ekb_tensor(const Parallel_Orbitals* pv,`
`231`	`233`	`}`
`232`	`234`	`if (aa > 0.0 || bb > 0.0)`
`233`	`235`	`{`
`234`		`- GlobalV::ofs_running << i << " " << j << " " << aa << "+" << bb << "i " << std::endl;`
	`236`	`+ ofs_running << i << " " << j << " " << aa << "+" << bb << "i " << std::endl;`
`235`	`237`	`}`
`236`	`238`	`}`
`237`	`239`	`}`
`238`		`- GlobalV::ofs_running << std::endl;`
`239`		`- GlobalV::ofs_running`
	`240`	`+ ofs_running << std::endl;`
	`241`	`+ ofs_running`
`240`	`242`	`<< "------------------------------------------------------------------------------------------------"`
`241`	`243`	`<< std::endl;`
`242`	`244`	`}`
`@@ -290,7 +292,8 @@ void compute_ekb_tensor_lapack(const Parallel_Orbitals* pv,`
`290`	`292`	`const int nlocal,`
`291`	`293`	`const ct::Tensor& Htmp,`
`292`	`294`	`const ct::Tensor& psi_k,`
`293`		`- ct::Tensor& ekb)`
	`295`	`+ ct::Tensor& ekb,`
	`296`	`+ std::ofstream& ofs_running)`
`294`	`297`	`{`
`295`	`298`	`// ct_device_type = ct::DeviceType::CpuDevice or ct::DeviceType::GpuDevice`
`296`	`299`	`ct::DeviceType ct_device_type = ct::DeviceTypeToEnum<Device>::value;`
`@@ -346,10 +349,10 @@ void compute_ekb_tensor_lapack(const Parallel_Orbitals* pv,`
`346`	`349`	`{`
`347`	`350`	`ct::Tensor Eij_cpu = Eij.to_device<ct::DEVICE_CPU>();`
`348`	`351`
`349`		`- GlobalV::ofs_running`
	`352`	`+ ofs_running`
`350`	`353`	`<< "------------------------------------------------------------------------------------------------"`
`351`	`354`	`<< std::endl;`
`352`		`- GlobalV::ofs_running << " Eij:" << std::endl;`
	`355`	`+ ofs_running << " Eij:" << std::endl;`
`353`	`356`	`for (int i = 0; i < nband; i++)`
`354`	`357`	`{`
`355`	`358`	`for (int j = 0; j < nband; j++)`
`@@ -368,12 +371,12 @@ void compute_ekb_tensor_lapack(const Parallel_Orbitals* pv,`
`368`	`371`	`}`
`369`	`372`	`if (aa > 0.0 || bb > 0.0)`
`370`	`373`	`{`
`371`		`- GlobalV::ofs_running << i << " " << j << " " << aa << "+" << bb << "i " << std::endl;`
	`374`	`+ ofs_running << i << " " << j << " " << aa << "+" << bb << "i " << std::endl;`
`372`	`375`	`}`
`373`	`376`	`}`
`374`	`377`	`}`
`375`		`- GlobalV::ofs_running << std::endl;`
`376`		`- GlobalV::ofs_running`
	`378`	`+ ofs_running << std::endl;`
	`379`	`+ ofs_running`
`377`	`380`	`<< "------------------------------------------------------------------------------------------------"`
`378`	`381`	`<< std::endl;`
`379`	`382`	`}`
`@@ -406,15 +409,17 @@ template void compute_ekb_tensor_lapack<base_device::DEVICE_CPU>(const Parallel_`
`406`	`409`	`const int nlocal,`
`407`	`410`	`const ct::Tensor& Htmp,`
`408`	`411`	`const ct::Tensor& psi_k,`
`409`		`- ct::Tensor& ekb);`
	`412`	`+ ct::Tensor& ekb,`
	`413`	`+ std::ofstream& ofs_running);`
`410`	`414`
`411`	`415`	`#if ((defined __CUDA) /* || (defined __ROCM) */)`
`412`	`416`	`template void compute_ekb_tensor_lapack<base_device::DEVICE_GPU>(const Parallel_Orbitals* pv,`
`413`	`417`	`const int nband,`
`414`	`418`	`const int nlocal,`
`415`	`419`	`const ct::Tensor& Htmp,`
`416`	`420`	`const ct::Tensor& psi_k,`
`417`		`- ct::Tensor& ekb);`
	`421`	`+ ct::Tensor& ekb,`
	`422`	`+ std::ofstream& ofs_running);`
`418`	`423`	`#endif // __CUDA`
`419`	`424`	`#endif // __MPI`
`420`	`425`