Merge pull request #1183 from dyzheng/develop

dyzheng · web-flow · commit 754a300e6334 · 2022-08-23T15:52:08.000+08:00
Fix: Veff error when MPI_threads larger than nz
diff --git a/source/input.cpp b/source/input.cpp
@@ -408,6 +408,7 @@ void Input::Default(void)
     // test only
     //==========================================================
     test_just_neighbor = false;
+    test_skip_ewald = false;
 
     //==========================================================
     //    DFT+U     Xin Qu added on 2020-10-29
@@ -1510,6 +1511,10 @@ bool Input::Read(const std::string &fn)
         {
             read_value(ifs, test_just_neighbor);
         }
+        else if (strcmp("test_skip_ewald", word) == 0)
+        {
+            read_value(ifs, test_skip_ewald);
+        }
         //--------------
         //----------------------------------------------------------------------------------
         //         Xin Qu added on 2020-10-29 for DFT+U
@@ -2213,6 +2218,7 @@ void Input::Bcast()
     Parallel_Common::bcast_int(td_vextout);
     Parallel_Common::bcast_int(td_dipoleout);
     Parallel_Common::bcast_bool(test_just_neighbor);
+    Parallel_Common::bcast_bool(test_skip_ewald);
     Parallel_Common::bcast_int(GlobalV::ocp);
     Parallel_Common::bcast_string(GlobalV::ocp_set);
     Parallel_Common::bcast_int(out_mul); // qifeng add 2019/9/10
diff --git a/source/input.h b/source/input.h
@@ -422,7 +422,8 @@ class Input
     //==========================================================
     // variables for test only
     //==========================================================
-    bool test_just_neighbor;
+    bool test_just_neighbor = false;
+    bool test_skip_ewald = false;
 
   private:
     //==========================================================
diff --git a/source/input_conv.cpp b/source/input_conv.cpp
@@ -135,6 +135,7 @@ void Input_Conv::Convert(void)
     GlobalV::VION_IN_H = INPUT.vion_in_h;
     GlobalV::TEST_FORCE = INPUT.test_force;
     GlobalV::TEST_STRESS = INPUT.test_stress;
+    GlobalV::test_skip_ewald = INPUT.test_skip_ewald;
 
     //----------------------------------------------------------
     // iteration (1/3)
diff --git a/source/module_base/global_variable.cpp b/source/module_base/global_variable.cpp
@@ -157,6 +157,8 @@ int test_wf = 0;
 int test_charge = 0;
 int test_potential = 0;
 int test_energy = 0;
+// for testing purposes only: skip the Ewald calculation
+bool test_skip_ewald = false;
 //----------------------------------------------------------
 // src_lcao
 //----------------------------------------------------------
diff --git a/source/module_base/global_variable.h b/source/module_base/global_variable.h
@@ -180,6 +180,7 @@ extern int test_wf;
 extern int test_charge;
 extern int test_potential;
 extern int test_energy;
+extern bool test_skip_ewald;
 //==========================================================
 // src_onscaling
 //==========================================================
diff --git a/source/module_base/tool_quit.cpp b/source/module_base/tool_quit.cpp
@@ -128,4 +128,25 @@ void WARNING_QUIT(const std::string &file,const std::string &description)
     QUIT();
 }
 
+
+// Collective check: combine error_in over all MPI processes; if it is true on any of them, every process calls WARNING_QUIT
+void CHECK_WARNING_QUIT(bool error_in, const std::string &file,const std::string &description)
+{
+	int error = (int)error_in; // stored as int so it can be reduced with MPI_INT below
+#ifdef __NORMAL
+// __NORMAL is defined (only for UT): no communication, only the local flag is checked
+#else
+#ifdef __MPI
+	int error_max = error;
+	MPI_Reduce(&error, &error_max, 1, MPI_INT, MPI_MAX, 0, MPI_COMM_WORLD); // rank 0 gets the maximum flag over all ranks
+	MPI_Bcast(&error_max, 1, MPI_INT, 0, MPI_COMM_WORLD); // rank 0 sends that maximum back to every rank
+	error = error_max; // non-zero now means at least one rank reported an error
+#endif
+#endif
+	if(error)
+	{
+		WARNING_QUIT(file, description); // file and description are forwarded unchanged
+	}
+}
+
 }
diff --git a/source/module_base/tool_quit.h b/source/module_base/tool_quit.h
@@ -43,6 +43,14 @@ void QUIT(void);
  */
 void WARNING_QUIT(const std::string &file, const std::string &description);
 
+/**
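+ * @brief Check an error flag; with MPI, if it is true on any process, all processes call WARNING_QUIT
+ * @param error The local error flag of the calling process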
+ * @param file The file where warning happens
+ * @param description The warning information
+ */
+void CHECK_WARNING_QUIT(bool error, const std::string &file,const std::string &description);
+
 } // namespace ModuleBase
 
 #endif
diff --git a/source/module_esolver/esolver_ks_lcao_elec.cpp b/source/module_esolver/esolver_ks_lcao_elec.cpp
@@ -256,7 +256,10 @@ namespace ModuleESolver
 #endif
         // 1. calculate ewald energy.
         // mohan update 2021-02-25
-        H_Ewald_pw::compute_ewald(GlobalC::ucell, GlobalC::rhopw);
+        if(!GlobalV::test_skip_ewald)
+        {
+            H_Ewald_pw::compute_ewald(GlobalC::ucell, GlobalC::rhopw);
+        }
 
         //2. the electron charge density should be symmetrized,
         // here is the initialization
diff --git a/source/module_esolver/esolver_ks_pw.cpp b/source/module_esolver/esolver_ks_pw.cpp
@@ -180,7 +180,10 @@ namespace ModuleESolver
         }
 
         //calculate ewald energy
-        H_Ewald_pw::compute_ewald(GlobalC::ucell, GlobalC::rhopw);
+        if(!GlobalV::test_skip_ewald)
+        {
+            H_Ewald_pw::compute_ewald(GlobalC::ucell, GlobalC::rhopw);
+        }
         //Symmetry_rho should be moved to Init()
         Symmetry_rho srho;
         for (int is = 0; is < GlobalV::NSPIN; is++)
diff --git a/source/module_hamilt/ks_pw/veff_pw.cpp b/source/module_hamilt/ks_pw/veff_pw.cpp
@@ -46,38 +46,47 @@ void Veff<OperatorPW>::act
     {
         if (this->npol == 1)
         {
-            const double* current_veff = &(this->veff[0](current_spin, 0));
             wfcpw->recip2real(tmpsi_in, porter, ik);
-            for (int ir = 0; ir < this->veff->nc; ++ir)
+            // NOTICE: when there are more MPI threads than Z grids,
+            // veff contains nothing here, so nothing should be done in real space;
+            // but the 3D FFT cannot be skipped, otherwise the calculation will hang
+            if(this->veff->nc != 0)
             {
-                porter[ir] *= current_veff[ir];
+                const double* current_veff = &(this->veff[0](current_spin, 0));
+                for (int ir = 0; ir < this->veff->nc; ++ir)
+                {
+                    porter[ir] *= current_veff[ir];
+                }
             }
             wfcpw->real2recip(porter, tmhpsi, ik, true);
         }
         else
         {
-            const double* current_veff[4];
-            for(int is=0;is<4;is++)
-            {
-                current_veff[is] = &(this->veff[0](is, 0));
-            }
             std::complex<double> *porter1 = new std::complex<double>[wfcpw->nmaxgr];
             // fft to real space and doing things.
             wfcpw->recip2real(tmpsi_in, porter, ik);
             wfcpw->recip2real(tmpsi_in + this->max_npw, porter1, ik);
             std::complex<double> sup, sdown;
-            for (int ir = 0; ir < this->veff->nc; ir++)
+            if(this->veff->nc != 0)
             {
-                sup = porter[ir] * (current_veff[0][ir] + current_veff[3][ir])
-                      + porter1[ir]
-                            * (current_veff[1][ir]
-                               - std::complex<double>(0.0, 1.0) * current_veff[2][ir]);
-                sdown = porter1[ir] * (current_veff[0][ir] - current_veff[3][ir])
-                        + porter[ir]
-                              * (current_veff[1][ir]
-                                 + std::complex<double>(0.0, 1.0) * current_veff[2][ir]);
-                porter[ir] = sup;
-                porter1[ir] = sdown;
+                const double* current_veff[4];
+                for(int is=0;is<4;is++)
+                {
+                    current_veff[is] = &(this->veff[0](is, 0));
+                }
+                for (int ir = 0; ir < this->veff->nc; ir++)
+                {
+                    sup = porter[ir] * (current_veff[0][ir] + current_veff[3][ir])
+                        + porter1[ir]
+                                * (current_veff[1][ir]
+                                - std::complex<double>(0.0, 1.0) * current_veff[2][ir]);
+                    sdown = porter1[ir] * (current_veff[0][ir] - current_veff[3][ir])
+                            + porter[ir]
+                                * (current_veff[1][ir]
+                                    + std::complex<double>(0.0, 1.0) * current_veff[2][ir]);
+                    porter[ir] = sup;
+                    porter1[ir] = sdown;
+                }
             }
             // (3) fft back to G space.
             wfcpw->real2recip(porter, tmhpsi, this->ik, true);
diff --git a/source/module_pw/pw_basis_k.cpp b/source/module_pw/pw_basis_k.cpp
@@ -69,6 +69,8 @@ void PW_Basis_K::setupIndGk()
     //count npwk
     this->npwk_max = 0;
     delete[] this->npwk; this->npwk = new int [this->nks];
+    // minimum npw over all k-points, only used for the check below
+    int npwk_min = this->npw;
     for (int ik = 0; ik < this->nks; ik++)
     {
         int ng = 0;
@@ -89,7 +91,12 @@ void PW_Basis_K::setupIndGk()
         {
             this->npwk_max = ng;
         }
+        if ( npwk_min > ng)
+        {
+            npwk_min = ng;
+        }
     }
+    ModuleBase::CHECK_WARNING_QUIT((npwk_min==0), "PW_Basis_K::setupIndGk", "some cores have no plane waves!");
 
     //get igl2isz_k and igl2ig_k
     delete[] igl2isz_k; this->igl2isz_k = new int [this->nks * this->npwk_max];
diff --git a/tests/integrate/101_PW_15_lowz/INPUT b/tests/integrate/101_PW_15_lowz/INPUT
@@ -0,0 +1,33 @@
+INPUT_PARAMETERS
+#Parameters (1.General)
+suffix			autotest
+calculation     scf
+ntype			1
+nbands			6
+symmetry		1
+pseudo_dir      ../tools/PP_ORB/
+pseudo_type     upf201
+
+#Parameters (2.Iteration)
+ecutwfc			20
+scf_thr				1e-9
+scf_nmax			1
+
+
+#Parameters (3.Basis)
+basis_type		pw
+
+#Parameters (4.Smearing)
+smearing_method		gauss
+smearing_sigma			0.002
+
+#Parameters (5.Mixing)
+mixing_type		pulay
+mixing_beta		0.7
+
+nx                      24
+ny                      24
+nz                      3
+pw_seed                 1
+
+test_skip_ewald         1
diff --git a/tests/integrate/101_PW_15_lowz/KPT b/tests/integrate/101_PW_15_lowz/KPT
@@ -0,0 +1,4 @@
+K_POINTS
+0
+Gamma
+1 1 1 0 0 0
diff --git a/tests/integrate/101_PW_15_lowz/STRU b/tests/integrate/101_PW_15_lowz/STRU
@@ -0,0 +1,19 @@
+ATOMIC_SPECIES
+Si 14 Si_ONCV_PBE-1.0.upf
+
+LATTICE_CONSTANT
+10.2  // add lattice constant
+
+LATTICE_VECTORS
+0.5 0.5 0.0
+0.5 0.0 0.5
+0.0 0.5 0.5
+
+ATOMIC_POSITIONS
+Direct 
+
+Si	// Element type	
+0.0	// magnetism
+2	
+0.00 0.00 0.00 1 1 1
+0.25 0.25 0.25 1 1 1
diff --git a/tests/integrate/101_PW_15_lowz/jd b/tests/integrate/101_PW_15_lowz/jd
@@ -0,0 +1 @@
+test SG15 pseudopotential, symmetry=on, nz is 3 which is less than the default MPI_threads 4, ewald calculation is skipped in this case
diff --git a/tests/integrate/101_PW_15_lowz/result.ref b/tests/integrate/101_PW_15_lowz/result.ref
@@ -0,0 +1,3 @@
+etotref -1.407077993281502
+etotperatomref -0.7035389966
+totaltimeref 0.15155
diff --git a/tests/integrate/CASES b/tests/integrate/CASES
@@ -6,6 +6,7 @@
 101_PW_upf201_Al_pseudopots
 101_PW_upf201_pseudopots
 101_PW_VW_pseudopots
+101_PW_15_lowz
 102_PW_DA_davidson
 103_PW_15_CS_CF
 103_PW_15_CS_CF_bspline