1. update LRI::cal_loop3()

PeizeLin · PeizeLin · commit 2097fa6de425 · 2023-08-22T15:50:11.000+08:00
diff --git a/include/RI/physics/RPA.hpp b/include/RI/physics/RPA.hpp
@@ -64,7 +64,7 @@ void RPA<TA,Tcell,Ndim,Tdata>::cal_chi0s(
 
 	set_Gs_a1(Gs_tau_positive);
 	set_Gs_a2(Gs_tau_negative);
-	this->lri.cal({
+	this->lri.cal_loop3({
 		Label::ab_ab::a1b1_a2b2,
 		Label::ab_ab::a1b2_a2b1},
 		chi0s_vec);
@@ -73,7 +73,7 @@ void RPA<TA,Tcell,Ndim,Tdata>::cal_chi0s(
 	set_Gs_a2(Gs_tau_positive);			// tmp
 	//set_Gs_a1(conj(Gs_tau_negative));
 	//set_Gs_a2(conj(Gs_tau_positive));
-	this->lri.cal({
+	this->lri.cal_loop3({
 		Label::ab_ab::a1b1_a2b2,
 		Label::ab_ab::a1b2_a2b1},
 		chi0s_vec);
diff --git a/include/RI/ri/LRI-cal_loop3.hpp b/include/RI/ri/LRI-cal_loop3.hpp
@@ -29,22 +29,22 @@ void LRI<TA,Tcell,Ndim,Tdata>::cal_loop3(
 	if(Ds_result.empty())
 		Ds_result.resize(1);
 
-	const bool flag_D_b_transpose = [&labels]() -> bool
+	const bool flag_D_a_transpose = [&labels]() -> bool
 	{
 		for(const Label::ab_ab &label : labels)
 			switch(label)
 			{
-				case Label::ab_ab::a0b0_a2b1:	case Label::ab_ab::a0b0_a2b2:
+				case Label::ab_ab::a0b0_a1b2:	case Label::ab_ab::a0b0_a2b2:	case Label::ab_ab::a1b2_a2b1:
 					return true;
 			}
 		return false;
 	}();
-	const bool flag_D_a_transpose = [&labels]() -> bool
+	const bool flag_D_b_transpose = [&labels]() -> bool
 	{
 		for(const Label::ab_ab &label : labels)
 			switch(label)
 			{
-				case Label::ab_ab::a0b0_a1b2:	case Label::ab_ab::a0b0_a2b2:
+				case Label::ab_ab::a0b0_a2b1:	case Label::ab_ab::a0b0_a2b2:
 					return true;
 			}
 		return false;
@@ -326,6 +326,128 @@ void LRI<TA,Tcell,Ndim,Tdata>::cal_loop3(
 					break;
 				} // end case a0b0_a2b2
 
+				case Label::ab_ab::a1b1_a2b2:
+				{
+					const std::vector<TA >  list_Aa01 = LRI_Cal_Aux::filter_list_map(
+						list_Aa01_Da,
+						this->Ds_ab[Label::ab::a0b0] );
+					const std::vector<TAC>  list_Aa2 = LRI_Cal_Aux::filter_list_map( 
+						list_Aa2_Da,
+						this->Ds_ab[Label::ab::a2b2] );
+					const std::vector<TAC>  list_Ab01 = LRI_Cal_Aux::filter_list_set( 
+						list_Ab01_Db,
+						this->index_Ds_ab[Label::ab::a0b0][0]);
+					const std::vector<TAC>  list_Ab2 = LRI_Cal_Aux::filter_list_set( 
+						list_Ab2_Db,
+						this->index_Ds_ab[Label::ab::a2b2][0]);
+
+					for(const TA &Aa01 : list_Aa01)
+					{
+						std::map<TAC,Tensor<Tdata>> Ds_result_fixed;
+
+						#pragma omp for schedule(dynamic) nowait
+						for(std::size_t ib2=0; ib2<list_Ab2.size(); ++ib2)
+						{
+							const TAC &Ab2 = list_Ab2[ib2];
+							// D_mul = D_a * D_a2b2
+							Tensor<Tdata> D_mul;
+							for(const TAC &Aa2 : list_Aa2)
+							{
+								const Tensor<Tdata> &D_a = tools.get_Ds_ab(Label::ab::a, Aa01, Aa2);
+								if(D_a.empty())	continue;
+								const Tensor<Tdata> D_a2b2 = tools.get_Ds_ab(Label::ab::a2b2, Aa2, Ab2);
+								if(D_a2b2.empty())	continue;
+
+								// b2a0a1 = a2b2 * a0a1a2
+								Tensor<Tdata> D_tmp1 = Tensor_Multiply::x1y0y1_ax1_y0y1a(D_a2b2, D_a);
+								LRI_Cal_Aux::add_Ds(std::move(D_tmp1), D_mul);
+							}
+							if(D_mul.empty())	continue;
+
+							// D_result = D_mul * D_a1b1 * D_b
+							for(const TAC &Ab01 : list_Ab01)
+							{
+								const Tensor<Tdata> &D_b = tools.get_Ds_ab(Label::ab::b, Ab01, Ab2);
+								if(D_b.empty())	continue;
+								const Tensor<Tdata> D_a1b1 = tools.get_Ds_ab(Label::ab::a1b1, Aa01, Ab01);
+								if(D_a1b1.empty())	continue;
+
+								// b1b2a0 = a1b1 * b2a0a1
+								const Tensor<Tdata> D_tmp2 = Tensor_Multiply::x1y0y1_ax1_y0y1a(D_a1b1, D_mul);
+								// a0b0 = b1b2a0 * b0b1b2
+								Tensor<Tdata> D_tmp3 = Tensor_Multiply::x2y0_abx2_y0ab(D_tmp2, D_b);
+								LRI_Cal_Aux::add_Ds(std::move(D_tmp3), Ds_result_fixed[Ab01]);
+							}
+						} // end for Ab2
+
+						if(!Ds_result_fixed.empty())
+							LRI_Cal_Aux::add_Ds( std::move(Ds_result_fixed),
+							                     Ds_result_thread[0][Aa01]);
+						LRI_Cal_Aux::add_Ds_omp_try(std::move(Ds_result_thread), Ds_result, lock_Ds_result_add, fac_add_Ds);
+					} // end for Aa01
+					break;
+				} // end case a1b1_a2b2
+
+				case Label::ab_ab::a1b2_a2b1:
+				{
+					const std::vector<TA >  list_Aa01 = LRI_Cal_Aux::filter_list_map( 
+						list_Aa01_Da,
+						this->Ds_ab[Label::ab::a1b2] );
+					const std::vector<TAC> &list_Aa2 = LRI_Cal_Aux::filter_list_map(
+						list_Aa2_Da,
+						this->Ds_ab[Label::ab::a2b1] );
+					const std::vector<TAC>  list_Ab01 = LRI_Cal_Aux::filter_list_set( 
+						list_Ab01_Db,
+						this->index_Ds_ab[Label::ab::a2b1][0]);
+					const std::vector<TAC>  list_Ab2 = LRI_Cal_Aux::filter_list_set( 
+						list_Ab2_Db,
+						this->index_Ds_ab[Label::ab::a1b2][0]);
+
+					for(const TA &Aa01 : list_Aa01)
+					{
+						#pragma omp for schedule(dynamic) nowait
+						for(std::size_t ib01=0; ib01<list_Ab01.size(); ++ib01)
+						{
+							const TAC &Ab01 = list_Ab01[ib01];
+							// D_mul1 = D_b * D_a1b2
+							Tensor<Tdata> D_mul1;
+							for(const TAC &Ab2 : list_Ab2)
+							{
+								const Tensor<Tdata> D_b = tools.get_Ds_ab(Label::ab::b, Ab01, Ab2);
+								if(D_b.empty())	continue;
+								const Tensor<Tdata> D_a1b2 = tools.get_Ds_ab(Label::ab::a1b2, Aa01, Ab2);
+								if(D_a1b2.empty())	continue;
+
+								// b0b1a1 = b0b1b2 * a1b2
+								Tensor<Tdata> D_tmp1 = Tensor_Multiply::x0x1y0_x0x1a_y0a(D_b, D_a1b2);
+								LRI_Cal_Aux::add_Ds(std::move(D_tmp1), D_mul1);
+							}
+							if(D_mul1.empty())	continue;
+
+							// D_mul2 = D_a2b1 * D_a
+							Tensor<Tdata> D_mul2;
+							for(const TAC &Aa2 : list_Aa2)
+							{
+								const Tensor<Tdata> &D_a_transpose = Global_Func::find(Ds_a_transpose, Aa01, Aa2);
+								if(D_a_transpose.empty())	continue;
+								const Tensor<Tdata> D_a2b1 = tools.get_Ds_ab(Label::ab::a2b1, Aa2, Ab01);
+								if(D_a2b1.empty())	continue;
+								// b1a1a0 = a2b1 * a1a0a2
+								Tensor<Tdata> D_tmp2 = Tensor_Multiply::x1y0y1_ax1_y0y1a(D_a2b1, D_a_transpose);
+								LRI_Cal_Aux::add_Ds(std::move(D_tmp2), D_mul2);
+							}
+							if(D_mul2.empty())	continue;
+
+							// D_result = D_mul2 * D_mul1
+							// a0b0 = b1a1a0 * b0b1a1
+							Ds_result_thread[0][Aa01][Ab01] = Tensor_Multiply::x2y0_abx2_y0ab(D_mul2, D_mul1);
+						} // end for Ab01
+
+						LRI_Cal_Aux::add_Ds_omp_try(std::move(Ds_result_thread), Ds_result, lock_Ds_result_add, fac_add_Ds);
+					} // end for Aa01
+					break;
+				} // end case a1b2_a2b1						
+
 				default:
 					throw std::invalid_argument(std::string(__FILE__)+std::to_string(__LINE__));
 			} // end switch(label)
diff --git a/unittests/Test_All.hpp b/unittests/Test_All.hpp
@@ -20,6 +20,7 @@
 #include "unittests/ri/Cell_Nearest-test.hpp"
 #include "unittests/physics/Exx-test.hpp"
 #include "unittests/physics/RPA-test.hpp"
+#include "unittests/physics/GW-test.hpp"
 
 namespace Test_All
 {
@@ -84,5 +85,10 @@ namespace Test_All
 		RPA_Test::main<double>(argc, argv);
 		RPA_Test::main<std::complex<float>>(argc, argv);
 		RPA_Test::main<std::complex<double>>(argc, argv);
+
+		GW_Test::main<float>(argc, argv);
+		GW_Test::main<double>(argc, argv);
+		GW_Test::main<std::complex<float>>(argc, argv);
+		GW_Test::main<std::complex<double>>(argc, argv);
 	}
 }
diff --git a/unittests/ri/LRI_Loop3-test.hpp b/unittests/ri/LRI_Loop3-test.hpp
@@ -289,7 +289,7 @@ namespace LRI_Loop3_Test
 					* Ds_ab[RI::Label::ab::b][Ab01][{Ab2,{0}}](ib0,ib1,ib2);
 			std::cout<<"a1b0_a2b2\t"<<(Ds_result[0][Aa01][{Ab01,{0}}] - D_test).norm(2)<<std::endl;
 		}
-
+*/
 		{
 			std::vector<T_Ds> Ds_result;
 			lri.cal_loop3({RI::Label::ab_ab::a1b1_a2b2}, Ds_result);
@@ -302,7 +302,7 @@ namespace LRI_Loop3_Test
 					* Ds_ab[RI::Label::ab::b][Ab01][{Ab2,{0}}](ib0,ib1,ib2);
 			std::cout<<"a1b1_a2b2\t"<<(Ds_result[0][Aa01][{Ab01,{0}}] - D_test).norm(2)<<std::endl;
 		}
-
+/*
 		{
 			std::vector<T_Ds> Ds_result;
 			lri.cal_loop3({RI::Label::ab_ab::a1b2_a2b0}, Ds_result);
@@ -315,7 +315,7 @@ namespace LRI_Loop3_Test
 					* Ds_ab[RI::Label::ab::b][Ab01][{Ab2,{0}}](ib0,ib1,ib2);
 			std::cout<<"a1b2_a2b0\t"<<(Ds_result[0][Aa01][{Ab01,{0}}] - D_test).norm(2)<<std::endl;
 		}
-
+*/
 		{
 			std::vector<T_Ds> Ds_result;
 			lri.cal_loop3({RI::Label::ab_ab::a1b2_a2b1}, Ds_result);
@@ -328,7 +328,6 @@ namespace LRI_Loop3_Test
 					* Ds_ab[RI::Label::ab::b][Ab01][{Ab2,{0}}](ib0,ib1,ib2);
 			std::cout<<"a1b2_a2b1\t"<<(Ds_result[0][Aa01][{Ab01,{0}}] - D_test).norm(2)<<std::endl;
 		}
-*/
 
 		MPI_Finalize();
 	}

Original file line number	Diff line number	Diff line change
`@@ -20,6 +20,7 @@`
`20`	`20`	`#include "unittests/ri/Cell_Nearest-test.hpp"`
`21`	`21`	`#include "unittests/physics/Exx-test.hpp"`
`22`	`22`	`#include "unittests/physics/RPA-test.hpp"`
	`23`	`+#include "unittests/physics/GW-test.hpp"`
`23`	`24`
`24`	`25`	`namespace Test_All`
`25`	`26`	`{`
`@@ -84,5 +85,10 @@ namespace Test_All`
`84`	`85`	`RPA_Test::main<double>(argc, argv);`
`85`	`86`	`RPA_Test::main<std::complex<float>>(argc, argv);`
`86`	`87`	`RPA_Test::main<std::complex<double>>(argc, argv);`
	`88`	`+`
	`89`	`+ GW_Test::main<float>(argc, argv);`
	`90`	`+ GW_Test::main<double>(argc, argv);`
	`91`	`+ GW_Test::main<std::complex<float>>(argc, argv);`
	`92`	`+ GW_Test::main<std::complex<double>>(argc, argv);`
`87`	`93`	`}`
`88`	`94`	`}`
Original file line number	Diff line number	Diff line change
`@@ -289,7 +289,7 @@ namespace LRI_Loop3_Test`
`289`	`289`	`* Ds_ab[RI::Label::ab::b][Ab01][{Ab2,{0}}](ib0,ib1,ib2);`
`290`	`290`	`std::cout<<"a1b0_a2b2\t"<<(Ds_result[0][Aa01][{Ab01,{0}}] - D_test).norm(2)<<std::endl;`
`291`	`291`	`}`
`292`		`-`
	`292`	`+*/`
`293`	`293`	`{`
`294`	`294`	`std::vector<T_Ds> Ds_result;`
`295`	`295`	`lri.cal_loop3({RI::Label::ab_ab::a1b1_a2b2}, Ds_result);`
`@@ -302,7 +302,7 @@ namespace LRI_Loop3_Test`
`302`	`302`	`* Ds_ab[RI::Label::ab::b][Ab01][{Ab2,{0}}](ib0,ib1,ib2);`
`303`	`303`	`std::cout<<"a1b1_a2b2\t"<<(Ds_result[0][Aa01][{Ab01,{0}}] - D_test).norm(2)<<std::endl;`
`304`	`304`	`}`
`305`		`-`
	`305`	`+/*`
`306`	`306`	`{`
`307`	`307`	`std::vector<T_Ds> Ds_result;`
`308`	`308`	`lri.cal_loop3({RI::Label::ab_ab::a1b2_a2b0}, Ds_result);`
`@@ -315,7 +315,7 @@ namespace LRI_Loop3_Test`
`315`	`315`	`* Ds_ab[RI::Label::ab::b][Ab01][{Ab2,{0}}](ib0,ib1,ib2);`
`316`	`316`	`std::cout<<"a1b2_a2b0\t"<<(Ds_result[0][Aa01][{Ab01,{0}}] - D_test).norm(2)<<std::endl;`
`317`	`317`	`}`
`318`		`-`
	`318`	`+*/`
`319`	`319`	`{`
`320`	`320`	`std::vector<T_Ds> Ds_result;`
`321`	`321`	`lri.cal_loop3({RI::Label::ab_ab::a1b2_a2b1}, Ds_result);`
`@@ -328,7 +328,6 @@ namespace LRI_Loop3_Test`
`328`	`328`	`* Ds_ab[RI::Label::ab::b][Ab01][{Ab2,{0}}](ib0,ib1,ib2);`
`329`	`329`	`std::cout<<"a1b2_a2b1\t"<<(Ds_result[0][Aa01][{Ab01,{0}}] - D_test).norm(2)<<std::endl;`
`330`	`330`	`}`
`331`		`-*/`
`332`	`331`
`333`	`332`	`MPI_Finalize();`
`334`	`333`	`}`