deepmodeling
diff --git a/‎docs/advanced/input_files/input-main.md‎
Lines changed: 15 additions & 3 deletions b/‎docs/advanced/input_files/input-main.md‎
Lines changed: 15 additions & 3 deletions
diff --git a/‎source/module_base/blas_connector.cpp‎
Lines changed: 264 additions & 44 deletions b/‎source/module_base/blas_connector.cpp‎
Lines changed: 264 additions & 44 deletions
diff --git a/‎source/module_base/blas_connector.h‎
Lines changed: 44 additions & 5 deletions b/‎source/module_base/blas_connector.h‎
Lines changed: 44 additions & 5 deletions
diff --git a/‎source/module_esolver/esolver_ks_lcao.cpp‎
Lines changed: 5 additions & 5 deletions b/‎source/module_esolver/esolver_ks_lcao.cpp‎
Lines changed: 5 additions & 5 deletions
diff --git a/‎source/module_esolver/esolver_ks_pw.cpp‎
Lines changed: 4 additions & 5 deletions b/‎source/module_esolver/esolver_ks_pw.cpp‎
Lines changed: 4 additions & 5 deletions
diff --git a/‎source/module_esolver/lcao_before_scf.cpp‎
Lines changed: 5 additions & 0 deletions b/‎source/module_esolver/lcao_before_scf.cpp‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎source/module_hamilt_lcao/hamilt_lcaodft/operator_lcao/td_ekinetic_lcao.cpp‎
Lines changed: 2 additions & 2 deletions b/‎source/module_hamilt_lcao/hamilt_lcaodft/operator_lcao/td_ekinetic_lcao.cpp‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎source/module_hamilt_lcao/module_gint/temp_gint/gint_atom.cpp‎
Lines changed: 1 addition & 0 deletions b/‎source/module_hamilt_lcao/module_gint/temp_gint/gint_atom.cpp‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎source/module_hamilt_lcao/module_gint/temp_gint/gint_common.cpp‎
Lines changed: 25 additions & 12 deletions b/‎source/module_hamilt_lcao/module_gint/temp_gint/gint_common.cpp‎
Lines changed: 25 additions & 12 deletions
diff --git a/‎source/module_hamilt_lcao/module_gint/temp_gint/gint_common.h‎
Lines changed: 3 additions & 2 deletions b/‎source/module_hamilt_lcao/module_gint/temp_gint/gint_common.h‎
Lines changed: 3 additions & 2 deletions
@@ -177,6 +177,7 @@
     - [dos\_emax\_ev](#dos_emax_ev)
     - [dos\_nche](#dos_nche)
     - [stm\_bias](#stm_bias)
+    - [ldos\_line](#ldos_line)
   - [NAOs](#naos)
     - [bessel\_nao\_ecut](#bessel_nao_ecut)
     - [bessel\_nao\_tolerence](#bessel_nao_tolerence)
@@ -1705,9 +1706,13 @@ These variables are used to control the output of properties.
 
 ### out_ldos
 
-- **Type**: Boolean
-- **Description**: Whether to output the local density of states for given bias in cube file format, which is controlled by [stm_bias](#stm_bias). 
-- **Default**: False
+- **Type**: Integer
+- **Description**: Whether to output the local density of states (LDOS). Optionally, the output precision can be set by a second parameter; its default is 3.
+  - 0: no output
+  - 1: output the partial charge density for given bias (controlled by [stm_bias](#stm_bias)) in cube file format, which can be used to plot scanning tunneling spectroscopy to mimic STM images using the Python script [plot.py](../../../tools/stm/plot.py).
+  - 2: output LDOS along a line in real space (controlled by [ldos_line](#ldos_line)). Parameters used to control DOS output are also valid for LDOS.
+  - 3: output both LDOS modes above.
+- **Default**: 0
 
 ### out_band
 
@@ -1986,6 +1991,13 @@ These variables are used to control the calculation of DOS. [Detailed introducti
 - **Default**: 1.0
 - **Unit**: V
 
+### ldos_line
+
+- **Type**: Real*6 Integer(optional)
+- **Description**: Specify a path in three-dimensional space along which LDOS is displayed in the form of a two-dimensional color chart, see details in [out_ldos](#out_ldos). The first three parameters are the direct coordinates of the start point, the next three parameters are the direct coordinates of the end point, and the final one is the number of points along the path, whose default is 100.
+- **Default**: 0.0 0.0 0.0 0.0 0.0 1.0 100
+
+
 [back to top](#full-list-of-input-keywords)
 
 ## NAOs
 
@@ -65,7 +65,7 @@ extern "C"
 	void cgemv_(const char *trans, const int *m, const int *n, const std::complex<float> *alpha,
 			const std::complex<float> *a, const int *lda, const std::complex<float> *x, const int *incx,
 			const std::complex<float> *beta, std::complex<float> *y, const int *incy);
-		
+
 	void zgemv_(const char *trans, const int *m, const int *n, const std::complex<double> *alpha,
 			const std::complex<double> *a, const int *lda, const std::complex<double> *x, const int *incx,
 			const std::complex<double> *beta, std::complex<double> *y, const int *incy);
@@ -180,11 +180,36 @@ class BlasConnector
 	// Peize Lin add 2017-10-27
 	// d=x*y
 	static
-	float dot( const int n, const float *X, const int incX, const float *Y, const int incY, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
+	float dot( const int n, const float*const X, const int incX, const float*const Y, const int incY, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
+
+	static
+	double dot( const int n, const double*const X, const int incX, const double*const Y, const int incY, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
+
+	// d=x*y
+	static
+	float dotu( const int n, const float*const X, const int incX, const float*const Y, const int incY, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
+
+	static
+	double dotu( const int n, const double*const X, const int incX, const double*const Y, const int incY, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
+
+	static
+	std::complex<float> dotu( const int n, const std::complex<float>*const X, const int incX, const std::complex<float>*const Y, const int incY, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
+
+	static
+	std::complex<double> dotu( const int n, const std::complex<double>*const X, const int incX, const std::complex<double>*const Y, const int incY, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
+
+	// d=x.conj()*y
+	static
+	float dotc( const int n, const float*const X, const int incX, const float*const Y, const int incY, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
+
+	static
+	double dotc( const int n, const double*const X, const int incX, const double*const Y, const int incY, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
 
 	static
-	double dot( const int n, const double *X, const int incX, const double *Y, const int incY, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
+	std::complex<float> dotc( const int n, const std::complex<float>*const X, const int incX, const std::complex<float>*const Y, const int incY, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
 
+	static
+	std::complex<double> dotc( const int n, const std::complex<double>*const X, const int incX, const std::complex<double>*const Y, const int incY, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
 
 	// Peize Lin add 2017-10-27, fix bug trans 2019-01-17
 	// C = a * A.? * B.? + b * C
@@ -231,6 +256,9 @@ class BlasConnector
 		const std::complex<double> alpha, const std::complex<double> *a, const int lda, const std::complex<double> *b, const int ldb,
 		const std::complex<double> beta, std::complex<double> *c, const int ldc, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
 
+	// side=='L': C = a * A * B + b * C.
+	// side=='R': C = a * B * A + b * C.
+	// 		A == A^T
 	// Because you cannot pack symm or hemm into a row-major kernel by exchanging parameters, so only col-major functions are provided.
 	static
 	void symm_cm(const char side, const char uplo, const int m, const int n,
@@ -252,6 +280,19 @@ class BlasConnector
 		const std::complex<double> alpha, const std::complex<double> *a, const int lda, const std::complex<double> *b, const int ldb,
 		const std::complex<double> beta, std::complex<double> *c, const int ldc, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
 
+	// side=='L': C = a * A * B + b * C.
+	// side=='R': C = a * B * A + b * C.
+	// 		A == A^H
+	static
+	void hemm_cm(const char side, const char uplo, const int m, const int n,
+		const float alpha, const float *a, const int lda, const float *b, const int ldb,
+		const float beta, float *c, const int ldc, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
+
+	static
+	void hemm_cm(const char side, const char uplo, const int m, const int n,
+		const double alpha, const double *a, const int lda, const double *b, const int ldb,
+		const double beta, double *c, const int ldc, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
+
 	static
     void hemm_cm(char side, char uplo, int m, int n,
             std::complex<float> alpha, std::complex<float> *a, int lda, std::complex<float> *b, int ldb,
@@ -263,7 +304,6 @@ class BlasConnector
 		std::complex<double> beta, std::complex<double> *c, int ldc, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
 
 	// y = A*x + beta*y
-
 	static
 	void gemv(const char trans, const int m, const int n,
         const float alpha, const float* A, const int lda, const float* X, const int incx,
@@ -283,7 +323,6 @@ class BlasConnector
     void gemv(const char trans, const int m, const int n,
               const std::complex<double> alpha, const std::complex<double> *A, const int lda, const std::complex<double> *X, const int incx,
               const std::complex<double> beta, std::complex<double> *Y, const int incy, base_device::AbacusDevice_t device_type = base_device::AbacusDevice_t::CpuDevice);
- 
 
 	// Peize Lin add 2018-06-12
 	// out = ||x||_2
 
@@ -690,11 +690,11 @@ void ESolver_KS_LCAO<TK, TR>::iter_init(UnitCell& ucell, const int istep, const
     {
         this->p_hamilt->refresh();
     }
-    if (iter == 1 && istep == 0)
-    {
-        // initialize DMR
-        this->ld.init_DMR(ucell, orb_, this->pv, this->gd);
-    }
+    // if (iter == 1 && istep == 0)
+    // {
+    //     // initialize DMR
+    //     this->ld.init_DMR(ucell, orb_, this->pv, this->gd);
+    // }
 #endif
 
     if (PARAM.inp.vl_in_h)
 
@@ -947,11 +947,10 @@ void ESolver_KS_PW<T, Device>::after_all_runners(UnitCell& ucell)
     //----------------------------------------------------------
     if (PARAM.inp.out_ldos[0])
     {
-        ModuleIO::Cal_ldos<std::complex<double>>::cal_ldos_pw(
-            reinterpret_cast<elecstate::ElecStatePW<std::complex<double>>*>(this->pelec),
-            this->psi[0],
-            this->Pgrid,
-            ucell);
+        ModuleIO::cal_ldos_pw(reinterpret_cast<elecstate::ElecStatePW<std::complex<double>>*>(this->pelec),
+                              this->psi[0],
+                              this->Pgrid,
+                              ucell);
     }
 
     //----------------------------------------------------------
 
@@ -243,6 +243,11 @@ void ESolver_KS_LCAO<TK, TR>::before_scf(UnitCell& ucell, const int istep)
         ->get_DM()
         ->init_DMR(*(dynamic_cast<hamilt::HamiltLCAO<TK, TR>*>(this->p_hamilt)->getHR()));
 
+#ifdef __DEEPKS
+    // initialize DMR of DeePKS
+    this->ld.init_DMR(ucell, orb_, this->pv, this->gd);
+#endif
+
     // 15) two cases are considered:
     // 1. DMK in DensityMatrix is not empty (istep > 0), then DMR is initialized by DMK
     // 2. DMK in DensityMatrix is empty (istep == 0), then DMR is initialized by zeros
 
@@ -244,8 +244,8 @@ void TDEkinetic<OperatorLCAO<TK, TR>>::init_td()
 
     // mohan update 2025-04-20
     ModuleBase::GlobalFunc::OUT(GlobalV::ofs_running, "Cartesian vector potential Ax(t)", cart_At[0]);
-    ModuleBase::GlobalFunc::OUT(GlobalV::ofs_running, "Cartesian vector potential Ax(t)", cart_At[1]);
-    ModuleBase::GlobalFunc::OUT(GlobalV::ofs_running, "Cartesian vector potential Ax(t)", cart_At[2]);
+    ModuleBase::GlobalFunc::OUT(GlobalV::ofs_running, "Cartesian vector potential Ay(t)", cart_At[1]);
+    ModuleBase::GlobalFunc::OUT(GlobalV::ofs_running, "Cartesian vector potential Az(t)", cart_At[2]);
 }
 
 template <typename TK, typename TR>
 
@@ -203,5 +203,6 @@ void GintAtom::set_phi_dphi(
 
 // explicit instantiation
 template void GintAtom::set_phi(const std::vector<Vec3d>& coords, const int stride, double* phi) const;
+template void GintAtom::set_phi(const std::vector<Vec3d>& coords, const int stride, std::complex<double>* phi) const;
 template void GintAtom::set_phi_dphi(const std::vector<Vec3d>& coords, const int stride, double* phi, double* dphi_x, double* dphi_y, double* dphi_z) const;
 }
@@ -23,7 +23,7 @@ void compose_hr_gint(std::shared_ptr<HContainer<double>> hr_gint)
             assert(upper_ap != nullptr);
 #endif
             for (int ir = 0; ir < ap.get_R_size(); ir++)
-            {   
+            {
                 auto R_index = ap.get_R_index(ir);
                 auto upper_mat = upper_ap->find_matrix(-R_index);
                 auto lower_mat = lower_ap->find_matrix(R_index);
@@ -36,7 +36,7 @@ void compose_hr_gint(std::shared_ptr<HContainer<double>> hr_gint)
                 }
             }
         }
-    } 
+    }
 }
 
 void compose_hr_gint(std::vector<std::shared_ptr<HContainer<double>>> hr_gint_part,
@@ -54,7 +54,7 @@ void compose_hr_gint(std::vector<std::shared_ptr<HContainer<double>>> hr_gint_pa
             const hamilt::AtomPair<double>* ap_nspin_0 = hr_gint_part[0]->find_pair(iat1, iat2);
             const hamilt::AtomPair<double>* ap_nspin_3 = hr_gint_part[3]->find_pair(iat1, iat2);
             for (int ir = 0; ir < upper_ap->get_R_size(); ir++)
-            {   
+            {
                 const auto R_index = upper_ap->get_R_index(ir);
                 auto upper_mat = upper_ap->find_matrix(R_index);
                 auto mat_nspin_0 = ap_nspin_0->find_matrix(R_index);
@@ -124,10 +124,11 @@ void transfer_hr_gint_to_hR(std::shared_ptr<const HContainer<T>> hr_gint, HConta
 
 // gint_info should not have been a parameter, but it was added to initialize dm_gint_full
 // In the future, we might try to remove the gint_info parameter
+template<typename T>
 void transfer_dm_2d_to_gint(
     std::shared_ptr<const GintInfo> gint_info,
-    std::vector<HContainer<double>*> dm,
-    std::vector<std::shared_ptr<HContainer<double>>> dm_gint)
+    std::vector<HContainer<T>*> dm,
+    std::vector<std::shared_ptr<HContainer<T>>> dm_gint)
 {
     // To check whether input parameter dm_2d has been initialized
 #ifdef __DEBUG
@@ -150,12 +151,12 @@ void transfer_dm_2d_to_gint(
     {
 #ifdef __MPI
         const int npol = 2;
-        std::shared_ptr<HContainer<double>> dm_full = gint_info->get_hr<double>(npol);
+        std::shared_ptr<HContainer<T>> dm_full = gint_info->get_hr<T>(npol);
         hamilt::transferParallels2Serials(*dm[0], dm_full.get());
 #else
-        HContainer<double>* dm_full = dm[0];
+        HContainer<T>* dm_full = dm[0];
 #endif
-        std::vector<double*> tmp_pointer(4, nullptr);
+        std::vector<T*> tmp_pointer(4, nullptr);
         for (int iap = 0; iap < dm_full->size_atom_pairs(); iap++)
         {
             auto& ap = dm_full->get_atom_pair(iap);
@@ -166,10 +167,10 @@ void transfer_dm_2d_to_gint(
                 const ModuleBase::Vector3<int> r_index = ap.get_R_index(ir);
                 for (int is = 0; is < 4; is++)
                 {
-                    tmp_pointer[is] = 
+                    tmp_pointer[is] =
                         dm_gint[is]->find_matrix(iat1, iat2, r_index)->get_pointer();
                 }
-                double* data_full = ap.get_pointer(ir);
+                T* data_full = ap.get_pointer(ir);
                 for (int irow = 0; irow < ap.get_row_size(); irow += 2)
                 {
                     for (int icol = 0; icol < ap.get_col_size(); icol += 2)
@@ -191,6 +192,18 @@ void transfer_dm_2d_to_gint(
 }
 
 
-template void transfer_hr_gint_to_hR(std::shared_ptr<const HContainer<double>> hr_gint, HContainer<double>* hR);
-template void transfer_hr_gint_to_hR(std::shared_ptr<const HContainer<std::complex<double>>> hr_gint, HContainer<std::complex<double>>* hR);
+template void transfer_hr_gint_to_hR(
+    std::shared_ptr<const HContainer<double>> hr_gint,
+    HContainer<double>* hR);
+template void transfer_hr_gint_to_hR(
+    std::shared_ptr<const HContainer<std::complex<double>>> hr_gint,
+    HContainer<std::complex<double>>* hR);
+template void transfer_dm_2d_to_gint(
+    std::shared_ptr<const GintInfo> gint_info,
+    std::vector<HContainer<double>*> dm,
+    std::vector<std::shared_ptr<HContainer<double>>> dm_gint);
+template void transfer_dm_2d_to_gint(
+    std::shared_ptr<const GintInfo> gint_info,
+    std::vector<HContainer<std::complex<double>>*> dm,
+    std::vector<std::shared_ptr<HContainer<std::complex<double>>>> dm_gint);
 }
@@ -13,9 +13,10 @@ namespace ModuleGint
     template <typename T>
     void transfer_hr_gint_to_hR(std::shared_ptr<const HContainer<T>> hr_gint, HContainer<T>* hR);
 
+    template<typename T>
     void transfer_dm_2d_to_gint(
         std::shared_ptr<const GintInfo> gint_info,
-        std::vector<HContainer<double>*> dm,
-        std::vector<std::shared_ptr<HContainer<double>>> dm_gint);
+        std::vector<HContainer<T>*> dm,
+        std::vector<std::shared_ptr<HContainer<T>>> dm_gint);
 
 }
Original file line number	Diff line number	Diff line change
`@@ -244,8 +244,8 @@ void TDEkinetic<OperatorLCAO<TK, TR>>::init_td()`
`244`	`244`
`245`	`245`	`// mohan update 2025-04-20`
`246`	`246`	`ModuleBase::GlobalFunc::OUT(GlobalV::ofs_running, "Cartesian vector potential Ax(t)", cart_At[0]);`
`247`		`- ModuleBase::GlobalFunc::OUT(GlobalV::ofs_running, "Cartesian vector potential Ax(t)", cart_At[1]);`
`248`		`- ModuleBase::GlobalFunc::OUT(GlobalV::ofs_running, "Cartesian vector potential Ax(t)", cart_At[2]);`
	`247`	`+ ModuleBase::GlobalFunc::OUT(GlobalV::ofs_running, "Cartesian vector potential Ay(t)", cart_At[1]);`
	`248`	`+ ModuleBase::GlobalFunc::OUT(GlobalV::ofs_running, "Cartesian vector potential Az(t)", cart_At[2]);`
`249`	`249`	`}`
`250`	`250`
`251`	`251`	`template <typename TK, typename TR>`
Original file line number	Diff line number	Diff line change
`@@ -203,5 +203,6 @@ void GintAtom::set_phi_dphi(`
`203`	`203`
`204`	`204`	`// explicit instantiation`
`205`	`205`	`template void GintAtom::set_phi(const std::vector<Vec3d>& coords, const int stride, double* phi) const;`
	`206`	`+template void GintAtom::set_phi(const std::vector<Vec3d>& coords, const int stride, std::complex<double>* phi) const;`
`206`	`207`	`template void GintAtom::set_phi_dphi(const std::vector<Vec3d>& coords, const int stride, double* phi, double* dphi_x, double* dphi_y, double* dphi_z) const;`
`207`	`208`	`}`