deepmodeling
diff --git a/docs/advanced/input_files/input-main.md
Lines changed: 7 additions & 0 deletions b/docs/advanced/input_files/input-main.md
Lines changed: 7 additions & 0 deletions
diff --git a/source/Makefile.Objects
Lines changed: 0 additions & 1 deletion b/source/Makefile.Objects
Lines changed: 0 additions & 1 deletion
diff --git a/source/module_basis/module_ao/parallel_2d.h
Lines changed: 1 addition & 0 deletions b/source/module_basis/module_ao/parallel_2d.h
Lines changed: 1 addition & 0 deletions
diff --git a/source/module_esolver/esolver.cpp
Lines changed: 2 additions & 7 deletions b/source/module_esolver/esolver.cpp
Lines changed: 2 additions & 7 deletions
diff --git a/source/module_io/read_input_item_tddft.cpp
Lines changed: 6 additions & 4 deletions b/source/module_io/read_input_item_tddft.cpp
Lines changed: 6 additions & 4 deletions
diff --git a/source/module_io/test/read_input_ptest.cpp
Lines changed: 1 addition & 0 deletions b/source/module_io/test/read_input_ptest.cpp
Lines changed: 1 addition & 0 deletions
diff --git a/source/module_lr/AX/AX.h
Lines changed: 14 additions & 14 deletions b/source/module_lr/AX/AX.h
Lines changed: 14 additions & 14 deletions
diff --git a/source/module_lr/AX/AX_parallel.cpp
Lines changed: 20 additions & 26 deletions b/source/module_lr/AX/AX_parallel.cpp
Lines changed: 20 additions & 26 deletions
diff --git a/source/module_lr/AX/AX_serial.cpp
Lines changed: 14 additions & 16 deletions b/source/module_lr/AX/AX_serial.cpp
Lines changed: 14 additions & 16 deletions
@@ -3957,6 +3957,13 @@ Currently supported: `RPA`, `LDA`, `PBE`, `HSE`, `HF`.
 - **Description**:  The number of 2-particle states to be solved
 - **Default**: 0
 
+### lr_unrestricted
+- **Type**: Boolean
+- **Description**: Whether to use the unrestricted construction for LR-TDDFT. The unrestricted construction doubles the matrix size.
+  - True: Always use unrestricted LR-TDDFT.
+  - False: Use unrestricted LR-TDDFT only when the system is open-shell.
+- **Default**: False
+
 ### abs_wavelen_range
 
 - **Type**: Real Real
 
@@ -728,7 +728,6 @@ OBJS_TENSOR=tensor.o\
     operator_lr_exx.o\
     kernel_xc.o\
     pot_hxc_lrtd.o\
-    hsolver_lrtd.o\
     lr_spectrum.o\
     hamilt_casida.o\
     esolver_lrtd_lcao.o\
@@ -15,6 +15,7 @@ class Parallel_2D
     ~Parallel_2D() = default;
 
     Parallel_2D& operator=(Parallel_2D&& rhs) = default;
+    Parallel_2D(Parallel_2D&& rhs) = default;
 
     /// number of local rows
     int get_row_size() const
 
@@ -187,13 +187,8 @@ ESolver* init_esolver(const Input_para& inp, UnitCell& ucell)
     else if (esolver_type == "lr_lcao")
     {
         // use constructor rather than Init function to initialize reference (instead of pointers) to ucell
-        if (PARAM.globalv.gamma_only_local){
-            return new LR::ESolver_LR<double, double>(inp, ucell);
-        } else if (PARAM.inp.nspin < 2) {
-            return new LR::ESolver_LR<std::complex<double>, double>(inp, ucell);
-        } else {
-            throw std::runtime_error("LR-TDDFT is not implemented for spin polarized case");
-}
+        if (PARAM.globalv.gamma_only_local) { return new LR::ESolver_LR<double, double>(inp, ucell); }
+        else { return new LR::ESolver_LR<std::complex<double>, double>(inp, ucell); }
     }
     else if (esolver_type == "ksdft_lr_lcao")
     {
 
@@ -327,6 +327,12 @@ void ReadInput::item_lr_tddft()
         read_sync_bool(input.out_wfc_lr);
         this->add_item(item);
     }
+    {
+        Input_Item item("lr_unrestricted");
+        item.annotation = "Whether to use unrestricted construction for LR-TDDFT";
+        read_sync_bool(input.lr_unrestricted);
+        this->add_item(item);
+    }
     {
         Input_Item item("abs_wavelen_range");
         item.annotation = "the range of wavelength(nm) to output the absorption spectrum ";
@@ -337,10 +343,6 @@ void ReadInput::item_lr_tddft()
                 para.input.abs_wavelen_range.push_back(std::stod(item.str_values[i]));
             }
             };
-        item.check_value = [](const Input_Item& item, const Parameter& para) {
-            auto& awr = para.input.abs_wavelen_range;
-            if (awr.size() < 2) { ModuleBase::WARNING_QUIT("ReadInput", "abs_wavelen_range must have two values"); }
-            };
         sync_doublevec(input.abs_wavelen_range, 2, 0.0);
         this->add_item(item);
     }
 
@@ -419,6 +419,7 @@ TEST_F(InputParaTest, ParaRead)
     EXPECT_EQ(param.inp.xc_kernel, "LDA");
     EXPECT_EQ(param.inp.lr_solver, "dav");
     EXPECT_DOUBLE_EQ(param.inp.lr_thr, 1e-2);
+    EXPECT_FALSE(param.inp.lr_unrestricted);
     EXPECT_FALSE(param.inp.out_wfc_lr);
     EXPECT_EQ(param.inp.abs_wavelen_range.size(), 2);
     EXPECT_DOUBLE_EQ(param.inp.abs_wavelen_range[0], 0.0);
 
@@ -13,25 +13,25 @@ namespace LR
         const psi::Psi<double>& c,
         const int& nocc,
         const int& nvirt,
-        psi::Psi<double>& AX_istate);
+        double* AX_istate);
     void cal_AX_blas(
         const std::vector<container::Tensor>& V_istate,
         const psi::Psi<double>& c,
         const int& nocc,
         const int& nvirt,
-        psi::Psi<double>& AX_istate,
+        double* AX_istate,
         const bool add_on = true);
 #ifdef __MPI
     void cal_AX_pblas(
         const std::vector<container::Tensor>& V_istate,
         const Parallel_2D& pmat,
         const psi::Psi<double>& c,
         const Parallel_2D& pc,
-        int naos,
-        int nocc,
-        int nvirt,
-        Parallel_2D& pX,
-        psi::Psi<double>& AX_istate,
+        const int& naos,
+        const int& nocc,
+        const int& nvirt,
+        const Parallel_2D& pX,
+        double* AX_istate,
         const bool add_on=true);
 #endif
     // complex
@@ -40,13 +40,13 @@ namespace LR
         const psi::Psi<std::complex<double>>& c,
         const int& nocc,
         const int& nvirt,
-        psi::Psi<std::complex<double>>& AX_istate);
+        std::complex<double>* AX_istate);
     void cal_AX_blas(
         const std::vector<container::Tensor>& V_istate,
         const psi::Psi<std::complex<double>>& c,
         const int& nocc,
         const int& nvirt,
-        psi::Psi<std::complex<double>>& AX_istate,
+        std::complex<double>* AX_istate,
         const bool add_on = true);
 
 #ifdef __MPI
@@ -55,11 +55,11 @@ namespace LR
         const Parallel_2D& pmat,
         const psi::Psi<std::complex<double>>& c,
         const Parallel_2D& pc,
-        int naos,
-        int nocc,
-        int nvirt,
-        Parallel_2D& pX,
-        psi::Psi<std::complex<double>>& AX_istate,
+        const int& naos,
+        const int& nocc,
+        const int& nvirt,
+        const Parallel_2D& pX,
+        std::complex<double>* AX_istate,
         const bool add_on = true);
 #endif
 }
@@ -14,28 +14,25 @@ namespace LR
         const Parallel_2D& pmat,
         const psi::Psi<double>& c,
         const Parallel_2D& pc,
-        int naos,
-        int nocc,
-        int nvirt,
-        Parallel_2D& pX,
-        psi::Psi<double>& AX_istate,
+        const int& naos,
+        const int& nocc,
+        const int& nvirt,
+        const Parallel_2D& pX,
+        double* AX_istate,
         const bool add_on)
     {
         ModuleBase::TITLE("hamilt_lrtd", "cal_AX_pblas");
-        assert(pmat.comm() == pc.comm());
-        assert(pmat.blacs_ctxt == pc.blacs_ctxt);
-
-        if (pX.comm() != pmat.comm() || pX.blacs_ctxt != pmat.blacs_ctxt)
-            LR_Util::setup_2d_division(pX, pmat.get_block_size(), nvirt, nocc, pmat.blacs_ctxt);
-        else assert(pX.get_local_size() > 0 && AX_istate.get_nbasis() == pX.get_local_size());
+        assert(pmat.comm() == pc.comm() && pmat.comm() == pX.comm());
+        assert(pmat.blacs_ctxt == pc.blacs_ctxt && pmat.blacs_ctxt == pX.blacs_ctxt);
+        assert(pX.get_local_size() > 0);
 
         const int nks = V_istate.size();
 
         Parallel_2D pVc;        // for intermediate Vc
         LR_Util::setup_2d_division(pVc, pmat.get_block_size(), naos, nocc, pmat.blacs_ctxt);
         for (int isk = 0;isk < nks;++isk)
         {
-            AX_istate.fix_k(isk);
+            const int ax_start = isk * pX.get_local_size();
             c.fix_k(isk);
 
             //Vc
@@ -60,7 +57,7 @@ namespace LR
             pdgemm_(&transa, &transb, &nvirt, &nocc, &naos,
                 &alpha, c.get_pointer(), &i1, &ivirt, pc.desc,
                 Vc.data<double>(), &i1, &i1, pVc.desc,
-                &beta, AX_istate.get_pointer(), &i1, &i1, pX.desc);
+                &beta, AX_istate + ax_start, &i1, &i1, pX.desc);
 
         }
     }
@@ -70,28 +67,25 @@ namespace LR
         const Parallel_2D& pmat,
         const psi::Psi<std::complex<double>>& c,
         const Parallel_2D& pc,
-        int naos,
-        int nocc,
-        int nvirt,
-        Parallel_2D& pX,
-        psi::Psi<std::complex<double>>& AX_istate,
+        const int& naos,
+        const int& nocc,
+        const int& nvirt,
+        const Parallel_2D& pX,
+        std::complex<double>* AX_istate,
         const bool add_on)
     {
         ModuleBase::TITLE("hamilt_lrtd", "cal_AX_plas");
-        assert(pmat.comm() == pc.comm());
-        assert(pmat.blacs_ctxt == pc.blacs_ctxt);
-
-        if (pX.comm() != pmat.comm() || pX.blacs_ctxt != pmat.blacs_ctxt)
-            LR_Util::setup_2d_division(pX, pmat.get_block_size(), nvirt, nocc, pmat.blacs_ctxt);
-        else assert(pX.get_local_size() > 0 && AX_istate.get_nbasis() == pX.get_local_size());
+        assert(pmat.comm() == pc.comm() && pmat.comm() == pX.comm());
+        assert(pmat.blacs_ctxt == pc.blacs_ctxt && pmat.blacs_ctxt == pX.blacs_ctxt);
+        assert(pX.get_local_size() > 0);
 
         const int nks = V_istate.size();
 
         Parallel_2D pVc;        // for intermediate Vc
         LR_Util::setup_2d_division(pVc, pmat.get_block_size(), naos, nocc, pmat.blacs_ctxt);
         for (int isk = 0;isk < nks;++isk)
         {
-            AX_istate.fix_k(isk);
+            const int ax_start = isk * pX.get_local_size();
             c.fix_k(isk);
 
             //Vc
@@ -116,7 +110,7 @@ namespace LR
             pzgemm_(&transa, &transb, &nvirt, &nocc, &naos,
                 &alpha, c.get_pointer(), &i1, &ivirt, pc.desc,
                 Vc.data<std::complex<double>>(), &i1, &i1, pVc.desc,
-                &beta, AX_istate.get_pointer(), &i1, &i1, pX.desc);
+                &beta, AX_istate + ax_start, &i1, &i1, pX.desc);
         }
     }
 }
 
@@ -9,18 +9,17 @@ namespace LR
         const psi::Psi<double>& c,
         const int& nocc,
         const int& nvirt,
-        psi::Psi<double>& AX_istate)
+        double* AX_istate)
     {
         ModuleBase::TITLE("hamilt_lrtd", "cal_AX_forloop");
         const int nks = V_istate.size();
         int naos = c.get_nbasis();
-        AX_istate.fix_k(0);
-        ModuleBase::GlobalFunc::ZEROS(AX_istate.get_pointer(), nks * nocc * nvirt);
+        ModuleBase::GlobalFunc::ZEROS(AX_istate, nks * nocc * nvirt);
 
         for (int isk = 0;isk < nks;++isk)
         {
             c.fix_k(isk);
-            AX_istate.fix_k(isk);
+            const int ax_start = isk * nocc * nvirt;
             for (int i = 0;i < nocc;++i)
             {
                 for (int a = 0;a < nvirt;++a)
@@ -29,7 +28,7 @@ namespace LR
                     {
                         for (int mu = 0;mu < naos;++mu)
                         {
-                            AX_istate(i * nvirt + a) += c(nocc + a, mu) * V_istate[isk].data<double>()[nu * naos + mu] * c(i, nu);
+                            AX_istate[ax_start + i * nvirt + a] += c(nocc + a, mu) * V_istate[isk].data<double>()[nu * naos + mu] * c(i, nu);
                         }
                     }
                 }
@@ -41,18 +40,17 @@ namespace LR
         const psi::Psi<std::complex<double>>& c,
         const int& nocc,
         const int& nvirt,
-        psi::Psi<std::complex<double>>& AX_istate)
+        std::complex<double>* AX_istate)
     {
         ModuleBase::TITLE("hamilt_lrtd", "cal_AX_forloop");
         const int nks = V_istate.size();
         int naos = c.get_nbasis();
-        AX_istate.fix_k(0);
-        ModuleBase::GlobalFunc::ZEROS(AX_istate.get_pointer(), nks * nocc * nvirt);
+        ModuleBase::GlobalFunc::ZEROS(AX_istate, nks * nocc * nvirt);
 
         for (int isk = 0;isk < nks;++isk)
         {
             c.fix_k(isk);
-            AX_istate.fix_k(isk);
+            const int ax_start = isk * nocc * nvirt;
             for (int i = 0;i < nocc;++i)
             {
                 for (int a = 0;a < nvirt;++a)
@@ -61,7 +59,7 @@ namespace LR
                     {
                         for (int mu = 0;mu < naos;++mu)
                         {
-                            AX_istate(i * nvirt + a) += std::conj(c(nocc + a, mu)) * V_istate[isk].data<std::complex<double>>()[nu * naos + mu] * c(i, nu);
+                            AX_istate[ax_start + i * nvirt + a] += std::conj(c(nocc + a, mu)) * V_istate[isk].data<std::complex<double>>()[nu * naos + mu] * c(i, nu);
                         }
                     }
                 }
@@ -74,7 +72,7 @@ namespace LR
         const psi::Psi<double>& c,
         const int& nocc,
         const int& nvirt,
-        psi::Psi<double>& AX_istate,
+        double* AX_istate,
         const bool add_on)
     {
         ModuleBase::TITLE("hamilt_lrtd", "cal_AX_blas");
@@ -84,7 +82,7 @@ namespace LR
         for (int isk = 0;isk < nks;++isk)
         {
             c.fix_k(isk);
-            AX_istate.fix_k(isk);
+            const int ax_start = isk * nocc * nvirt;
 
             // Vc[naos*nocc]
             container::Tensor Vc(DAT::DT_DOUBLE, DEV::CpuDevice, { nocc, naos });// (Vc)^T
@@ -101,15 +99,15 @@ namespace LR
             //AX_istate=c^TVc (nvirt major)
             dgemm_(&transa, &transb, &nvirt, &nocc, &naos, &alpha,
                 c.get_pointer(nocc), &naos, Vc.data<double>(), &naos, &beta,
-                AX_istate.get_pointer(), &nvirt);
+                AX_istate + ax_start, &nvirt);
         }
     }
     void cal_AX_blas(
         const std::vector<container::Tensor>& V_istate,
         const psi::Psi<std::complex<double>>& c,
         const int& nocc,
         const int& nvirt,
-        psi::Psi<std::complex<double>>& AX_istate,
+        std::complex<double>* AX_istate,
         const bool add_on)
     {
         ModuleBase::TITLE("hamilt_lrtd", "cal_AX_blas");
@@ -119,7 +117,7 @@ namespace LR
         for (int isk = 0;isk < nks;++isk)
         {
             c.fix_k(isk);
-            AX_istate.fix_k(isk);
+            const int ax_start = isk * nocc * nvirt;
 
             // Vc[naos*nocc] (V is hermitian)
             container::Tensor Vc(DAT::DT_COMPLEX_DOUBLE, DEV::CpuDevice, { nocc, naos });// (Vc)^T
@@ -136,7 +134,7 @@ namespace LR
             //AX_istate=c^\dagger Vc (nvirt major)
             zgemm_(&transa, &transb, &nvirt, &nocc, &naos, &alpha,
                 c.get_pointer(nocc), &naos, Vc.data<std::complex<double>>(), &naos, &beta,
-                AX_istate.get_pointer(), &nvirt);
+                AX_istate + ax_start, &nvirt);
         }
     }
 }
Original file line number	Diff line number	Diff line change
`@@ -187,13 +187,8 @@ ESolver* init_esolver(const Input_para& inp, UnitCell& ucell)`
`187`	`187`	`else if (esolver_type == "lr_lcao")`
`188`	`188`	`{`
`189`	`189`	`// use constructor rather than Init function to initialize reference (instead of pointers) to ucell`
`190`		`- if (PARAM.globalv.gamma_only_local){`
`191`		`- return new LR::ESolver_LR<double, double>(inp, ucell);`
`192`		`- } else if (PARAM.inp.nspin < 2) {`
`193`		`- return new LR::ESolver_LR<std::complex<double>, double>(inp, ucell);`
`194`		`- } else {`
`195`		`- throw std::runtime_error("LR-TDDFT is not implemented for spin polarized case");`
`196`		`-}`
	`190`	`+ if (PARAM.globalv.gamma_only_local) { return new LR::ESolver_LR<double, double>(inp, ucell); }`
	`191`	`+ else { return new LR::ESolver_LR<std::complex<double>, double>(inp, ucell); }`
`197`	`192`	`}`
`198`	`193`	`else if (esolver_type == "ksdft_lr_lcao")`
`199`	`194`	`{`
Original file line number	Diff line number	Diff line change
`@@ -327,6 +327,12 @@ void ReadInput::item_lr_tddft()`
`327`	`327`	`read_sync_bool(input.out_wfc_lr);`
`328`	`328`	`this->add_item(item);`
`329`	`329`	`}`
	`330`	`+ {`
	`331`	`+ Input_Item item("lr_unrestricted");`
	`332`	`+ item.annotation = "Whether to use unrestricted construction for LR-TDDFT";`
	`333`	`+ read_sync_bool(input.lr_unrestricted);`
	`334`	`+ this->add_item(item);`
	`335`	`+ }`
`330`	`336`	`{`
`331`	`337`	`Input_Item item("abs_wavelen_range");`
`332`	`338`	`item.annotation = "the range of wavelength(nm) to output the absorption spectrum ";`
`@@ -337,10 +343,6 @@ void ReadInput::item_lr_tddft()`
`337`	`343`	`para.input.abs_wavelen_range.push_back(std::stod(item.str_values[i]));`
`338`	`344`	`}`
`339`	`345`	`};`
`340`		`- item.check_value = [](const Input_Item& item, const Parameter& para) {`
`341`		`- auto& awr = para.input.abs_wavelen_range;`
`342`		`- if (awr.size() < 2) { ModuleBase::WARNING_QUIT("ReadInput", "abs_wavelen_range must have two values"); }`
`343`		`- };`
`344`	`346`	`sync_doublevec(input.abs_wavelen_range, 2, 0.0);`
`345`	`347`	`this->add_item(item);`
`346`	`348`	`}`
Original file line number	Diff line number	Diff line change
`@@ -9,18 +9,17 @@ namespace LR`
`9`	`9`	`const psi::Psi<double>& c,`
`10`	`10`	`const int& nocc,`
`11`	`11`	`const int& nvirt,`
`12`		`- psi::Psi<double>& AX_istate)`
	`12`	`+ double* AX_istate)`
`13`	`13`	`{`
`14`	`14`	`ModuleBase::TITLE("hamilt_lrtd", "cal_AX_forloop");`
`15`	`15`	`const int nks = V_istate.size();`
`16`	`16`	`int naos = c.get_nbasis();`
`17`		`- AX_istate.fix_k(0);`
`18`		`- ModuleBase::GlobalFunc::ZEROS(AX_istate.get_pointer(), nks * nocc * nvirt);`
	`17`	`+ ModuleBase::GlobalFunc::ZEROS(AX_istate, nks * nocc * nvirt);`
`19`	`18`
`20`	`19`	`for (int isk = 0;isk < nks;++isk)`
`21`	`20`	`{`
`22`	`21`	`c.fix_k(isk);`
`23`		`- AX_istate.fix_k(isk);`
	`22`	`+ const int ax_start = isk * nocc * nvirt;`
`24`	`23`	`for (int i = 0;i < nocc;++i)`
`25`	`24`	`{`
`26`	`25`	`for (int a = 0;a < nvirt;++a)`
`@@ -29,7 +28,7 @@ namespace LR`
`29`	`28`	`{`
`30`	`29`	`for (int mu = 0;mu < naos;++mu)`
`31`	`30`	`{`
`32`		`- AX_istate(i * nvirt + a) += c(nocc + a, mu) * V_istate[isk].data<double>()[nu * naos + mu] * c(i, nu);`
	`31`	`+ AX_istate[ax_start + i * nvirt + a] += c(nocc + a, mu) * V_istate[isk].data<double>()[nu * naos + mu] * c(i, nu);`
`33`	`32`	`}`
`34`	`33`	`}`
`35`	`34`	`}`
`@@ -41,18 +40,17 @@ namespace LR`
`41`	`40`	`const psi::Psi<std::complex<double>>& c,`
`42`	`41`	`const int& nocc,`
`43`	`42`	`const int& nvirt,`
`44`		`- psi::Psi<std::complex<double>>& AX_istate)`
	`43`	`+ std::complex<double>* AX_istate)`
`45`	`44`	`{`
`46`	`45`	`ModuleBase::TITLE("hamilt_lrtd", "cal_AX_forloop");`
`47`	`46`	`const int nks = V_istate.size();`
`48`	`47`	`int naos = c.get_nbasis();`
`49`		`- AX_istate.fix_k(0);`
`50`		`- ModuleBase::GlobalFunc::ZEROS(AX_istate.get_pointer(), nks * nocc * nvirt);`
	`48`	`+ ModuleBase::GlobalFunc::ZEROS(AX_istate, nks * nocc * nvirt);`
`51`	`49`
`52`	`50`	`for (int isk = 0;isk < nks;++isk)`
`53`	`51`	`{`
`54`	`52`	`c.fix_k(isk);`
`55`		`- AX_istate.fix_k(isk);`
	`53`	`+ const int ax_start = isk * nocc * nvirt;`
`56`	`54`	`for (int i = 0;i < nocc;++i)`
`57`	`55`	`{`
`58`	`56`	`for (int a = 0;a < nvirt;++a)`
`@@ -61,7 +59,7 @@ namespace LR`
`61`	`59`	`{`
`62`	`60`	`for (int mu = 0;mu < naos;++mu)`
`63`	`61`	`{`
`64`		`- AX_istate(i * nvirt + a) += std::conj(c(nocc + a, mu)) * V_istate[isk].data<std::complex<double>>()[nu * naos + mu] * c(i, nu);`
	`62`	`+ AX_istate[ax_start + i * nvirt + a] += std::conj(c(nocc + a, mu)) * V_istate[isk].data<std::complex<double>>()[nu * naos + mu] * c(i, nu);`
`65`	`63`	`}`
`66`	`64`	`}`
`67`	`65`	`}`
`@@ -74,7 +72,7 @@ namespace LR`
`74`	`72`	`const psi::Psi<double>& c,`
`75`	`73`	`const int& nocc,`
`76`	`74`	`const int& nvirt,`
`77`		`- psi::Psi<double>& AX_istate,`
	`75`	`+ double* AX_istate,`
`78`	`76`	`const bool add_on)`
`79`	`77`	`{`
`80`	`78`	`ModuleBase::TITLE("hamilt_lrtd", "cal_AX_blas");`
`@@ -84,7 +82,7 @@ namespace LR`
`84`	`82`	`for (int isk = 0;isk < nks;++isk)`
`85`	`83`	`{`
`86`	`84`	`c.fix_k(isk);`
`87`		`- AX_istate.fix_k(isk);`
	`85`	`+ const int ax_start = isk * nocc * nvirt;`
`88`	`86`
`89`	`87`	`// Vc[naos*nocc]`
`90`	`88`	`container::Tensor Vc(DAT::DT_DOUBLE, DEV::CpuDevice, { nocc, naos });// (Vc)^T`
`@@ -101,15 +99,15 @@ namespace LR`
`101`	`99`	`//AX_istate=c^TVc (nvirt major)`
`102`	`100`	`dgemm_(&transa, &transb, &nvirt, &nocc, &naos, &alpha,`
`103`	`101`	`c.get_pointer(nocc), &naos, Vc.data<double>(), &naos, &beta,`
`104`		`- AX_istate.get_pointer(), &nvirt);`
	`102`	`+ AX_istate + ax_start, &nvirt);`
`105`	`103`	`}`
`106`	`104`	`}`
`107`	`105`	`void cal_AX_blas(`
`108`	`106`	`const std::vector<container::Tensor>& V_istate,`
`109`	`107`	`const psi::Psi<std::complex<double>>& c,`
`110`	`108`	`const int& nocc,`
`111`	`109`	`const int& nvirt,`
`112`		`- psi::Psi<std::complex<double>>& AX_istate,`
	`110`	`+ std::complex<double>* AX_istate,`
`113`	`111`	`const bool add_on)`
`114`	`112`	`{`
`115`	`113`	`ModuleBase::TITLE("hamilt_lrtd", "cal_AX_blas");`
`@@ -119,7 +117,7 @@ namespace LR`
`119`	`117`	`for (int isk = 0;isk < nks;++isk)`
`120`	`118`	`{`
`121`	`119`	`c.fix_k(isk);`
`122`		`- AX_istate.fix_k(isk);`
	`120`	`+ const int ax_start = isk * nocc * nvirt;`
`123`	`121`
`124`	`122`	`// Vc[naos*nocc] (V is hermitian)`
`125`	`123`	`container::Tensor Vc(DAT::DT_COMPLEX_DOUBLE, DEV::CpuDevice, { nocc, naos });// (Vc)^T`
`@@ -136,7 +134,7 @@ namespace LR`
`136`	`134`	`//AX_istate=c^\dagger Vc (nvirt major)`
`137`	`135`	`zgemm_(&transa, &transb, &nvirt, &nocc, &naos, &alpha,`
`138`	`136`	`c.get_pointer(nocc), &naos, Vc.data<std::complex<double>>(), &naos, &beta,`
`139`		`- AX_istate.get_pointer(), &nvirt);`
	`137`	`+ AX_istate + ax_start, &nvirt);`
`140`	`138`	`}`
`141`	`139`	`}`
`142`	`140`	`}`