Fix bugs; support CPU-only builds (without USE_CUDA_TOOLKIT)

Lu · Lu · commit 58ab3f6579f8 · 2019-11-11T19:42:27.000+08:00
diff --git a/source/lib/include/NNPInter.h b/source/lib/include/NNPInter.h
@@ -127,6 +127,7 @@ class NNPInter
   bool init_nbor;
   std::vector<int> sec_a;
   compute_t *array_double;
+  InternalNeighborList nlist;
   NNPAtomMap<VALUETYPE> nnpmap;
   unsigned long long *array_longlong;
   int *ilist, *jrange, *jlist, *array_int;
@@ -135,7 +136,9 @@ class NNPInter
 
   // function used for neighbor list copy
   vector<int> get_sel_a() const;
+#ifdef USE_CUDA_TOOLKIT
   void update_nbor(const InternalNeighborList & nlist, const int nloc);
+#endif
 };
 
 class NNPInterModelDevi
@@ -217,8 +220,9 @@ class NNPInterModelDevi
 
   // copy neighbor list info from host
   bool init_nbor;
-  vector<vector<int> > sec;
   compute_t *array_double;
+  vector<vector<int> > sec;
+  InternalNeighborList nlist;
   NNPAtomMap<VALUETYPE> nnpmap;
   unsigned long long *array_longlong;
   int max_sec_size = 0, max_sec_back = 0;
@@ -229,7 +233,9 @@ class NNPInterModelDevi
   void get_max_sec();
   vector<vector<int> > get_sel() const;
   void cum_sum(const std::vector<std::vector<int32> > n_sel);
+#ifdef USE_CUDA_TOOLKIT
   void update_nbor(const InternalNeighborList & nlist, const int nloc);
+#endif
 };
 
 
diff --git a/source/lib/src/NNPInter.cc b/source/lib/src/NNPInter.cc
@@ -683,6 +683,7 @@ NNPInter::~NNPInter() {
     #endif
 }
 
+#ifdef USE_CUDA_TOOLKIT
 void NNPInter::update_nbor(const InternalNeighborList & nlist, const int nloc) {
     if (!init_nbor) {
         sec_a = cum_sum(get_sel_a());
@@ -742,6 +743,7 @@ void NNPInter::update_nbor(const InternalNeighborList & nlist, const int nloc) {
     cudaErrcheck(cudaMemcpy(jrange, &nlist.jrange[0], sizeof(int) * nlist.jrange.size(), cudaMemcpyHostToDevice));
     cudaErrcheck(cudaMemcpy(jlist, &nlist.jlist[0], sizeof(int) * nlist.jlist.size(), cudaMemcpyHostToDevice));
 }
+#endif // USE_CUDA_TOOLKIT
 
 #ifdef USE_CUDA_TOOLKIT
 void
@@ -912,7 +914,7 @@ compute (ENERGYTYPE &			dener,
 {
   int nall = dcoord_.size() / 3;
   int nloc = nall - nghost;
-  NNPAtomMap<VALUETYPE> nnpmap (datype_.begin(), datype_.begin() + nloc);
+  nnpmap = NNPAtomMap<VALUETYPE> (datype_.begin(), datype_.begin() + nloc);
   assert (nloc == nnpmap.get_type().size());
   validate_fparam_aparam(nloc, fparam, aparam);
 
@@ -946,7 +948,7 @@ compute (ENERGYTYPE &			dener,
         nnpmap = NNPAtomMap<VALUETYPE> (datype_.begin(), datype_.begin() + nloc);
         assert (nloc == nnpmap.get_type().size());
 
-        InternalNeighborList nlist;
+        // InternalNeighborList nlist;
         convert_nlist_lmp_internal (nlist, lmp_list);
         shuffle_nlist (nlist, nnpmap);
         std::vector<std::pair<string, Tensor>> input_tensors;
@@ -987,7 +989,7 @@ compute (ENERGYTYPE &			dener,
 	 const vector<VALUETYPE> &	fparam,
 	 const vector<VALUETYPE> &	aparam)
 {
-  NNPAtomMap<VALUETYPE> nnpmap (datype_.begin(), datype_.end());
+  nnpmap = NNPAtomMap<VALUETYPE> (datype_.begin(), datype_.end());
   validate_fparam_aparam(nnpmap.get_type().size(), fparam, aparam);
 
   std::vector<std::pair<string, Tensor>> input_tensors;
@@ -1019,10 +1021,10 @@ compute (ENERGYTYPE &			dener,
     validate_fparam_aparam(nloc, fparam, aparam);
 
     if (ago == 0) {
-        NNPAtomMap<VALUETYPE> nnpmap (datype_.begin(), datype_.begin() + nloc);
+        nnpmap = NNPAtomMap<VALUETYPE> (datype_.begin(), datype_.begin() + nloc);
         assert (nloc == nnpmap.get_type().size());
 
-        InternalNeighborList nlist;
+        // InternalNeighborList nlist;
         convert_nlist_lmp_internal (nlist, lmp_list);
         shuffle_nlist (nlist, nnpmap);
         std::vector<std::pair<string, Tensor>> input_tensors;
@@ -1240,7 +1242,8 @@ get_max_sec()
     }
 }
 
-void 
+#ifdef USE_CUDA_TOOLKIT
+void
 NNPInterModelDevi::
 update_nbor(const InternalNeighborList & nlist, const int nloc) 
 {
@@ -1303,6 +1306,7 @@ update_nbor(const InternalNeighborList & nlist, const int nloc)
     cudaErrcheck(cudaMemcpy(jrange, &nlist.jrange[0], sizeof(int) * nlist.jrange.size(), cudaMemcpyHostToDevice));
     cudaErrcheck(cudaMemcpy(jlist, &nlist.jlist[0], sizeof(int) * nlist.jlist.size(), cudaMemcpyHostToDevice));
 }
+#endif //USE_CUDA_TOOLKIT
 
 void
 NNPInterModelDevi::
@@ -1332,7 +1336,7 @@ compute (ENERGYTYPE &			dener,
 {
   if (numb_models == 0) return;
 
-  NNPAtomMap<VALUETYPE> nnpmap (datype_.begin(), datype_.end());
+  nnpmap = NNPAtomMap<VALUETYPE> (datype_.begin(), datype_.end());
   validate_fparam_aparam(nnpmap.get_type().size(), fparam, aparam);
 
   std::vector<std::pair<string, Tensor>> input_tensors;
@@ -1389,7 +1393,7 @@ compute (vector<ENERGYTYPE> &		all_energy,
         nnpmap = NNPAtomMap<VALUETYPE> (datype_.begin(), datype_.begin() + nloc);
         assert (nloc == nnpmap.get_type().size());
 
-        InternalNeighborList nlist;
+        // InternalNeighborList nlist;
         convert_nlist_lmp_internal (nlist, lmp_list);
         shuffle_nlist (nlist, nnpmap);
         std::vector<std::pair<string, Tensor>> input_tensors;
@@ -1453,7 +1457,7 @@ compute (vector<ENERGYTYPE> &			all_energy,
         nnpmap = NNPAtomMap<VALUETYPE> (datype_.begin(), datype_.begin() + nloc);
         assert (nloc == nnpmap.get_type().size());
 
-        InternalNeighborList nlist;
+        // InternalNeighborList nlist;
         convert_nlist_lmp_internal (nlist, lmp_list);
         shuffle_nlist (nlist, nnpmap);
         std::vector<std::pair<string, Tensor>> input_tensors;
diff --git a/source/lmp/pair_nnp.cpp b/source/lmp/pair_nnp.cpp
@@ -288,12 +288,20 @@ void PairNNP::compute(int eflag, int vflag)
 #endif
   }
 
-  int ago = numb_models > 1 ? 0 : neighbor->ago;
-
+  // int ago = numb_models > 1 ? 0 : neighbor->ago;
+  int ago = neighbor->ago;
+  if (numb_models > 1) {
+      if (multi_models_no_mod_devi && (out_freq > 0 && update->ntimestep % out_freq == 0)) {
+          ago = 0;
+      }
+      else if (multi_models_mod_devi && (out_freq == 0 || update->ntimestep % out_freq != 0)) {
+        ago = 0;
+      }
+  }
   // compute
-  bool single_model = (numb_models == 1);
-  bool multi_models_no_mod_devi = (numb_models > 1 && (out_freq == 0 || update->ntimestep % out_freq != 0));
-  bool multi_models_mod_devi = (numb_models > 1 && (out_freq > 0 && update->ntimestep % out_freq == 0));
+  single_model = (numb_models == 1);
+  multi_models_no_mod_devi = (numb_models > 1 && (out_freq == 0 || update->ntimestep % out_freq != 0));
+  multi_models_mod_devi = (numb_models > 1 && (out_freq > 0 && update->ntimestep % out_freq == 0));
   if (do_ghost) {
     LammpsNeighborList lmp_list (list->inum, list->ilist, list->numneigh, list->firstneigh);
     if (single_model || multi_models_no_mod_devi) {
diff --git a/source/lmp/pair_nnp.h.in b/source/lmp/pair_nnp.h.in
@@ -82,6 +82,9 @@ private:
   int dim_aparam;
   int out_each;
   int out_rel;
+  bool single_model;
+  bool multi_models_mod_devi;
+  bool multi_models_no_mod_devi;
 #ifdef HIGH_PREC
   vector<double > fparam;
   vector<double > aparam;
diff --git a/source/op/CMakeLists.txt b/source/op/CMakeLists.txt
@@ -11,16 +11,15 @@ file(GLOB OP_PY *.py)
 if (BUILD_CPP_IF) 
     if (USE_CUDA_TOOLKIT)
         add_library(${LIB_DEEPMD_OP} SHARED ${OP_CUDA_SRC})
+        add_subdirectory(cuda)
+        find_package(CUDA REQUIRED)
+        include_directories(${CUDA_INCLUDE_DIRS})
+        set (EXTRA_LIBS ${EXTRA_LIBS} deepmd_op_cuda)
+        target_link_libraries (${LIB_DEEPMD_OP} ${EXTRA_LIBS})
+        target_link_libraries (${LIB_DEEPMD_OP} ${CUDA_LIBRARIES})
     else (USE_CUDA_TOOLKIT)
         add_library(${LIB_DEEPMD_OP} SHARED ${OP_SRC})
     endif (USE_CUDA_TOOLKIT)
-
-    add_subdirectory(cuda)
-    find_package(CUDA REQUIRED)
-    include_directories(${CUDA_INCLUDE_DIRS})
-    set (EXTRA_LIBS ${EXTRA_LIBS} deepmd_op_cuda)
-    target_link_libraries (${LIB_DEEPMD_OP} ${EXTRA_LIBS})
-    target_link_libraries (${LIB_DEEPMD_OP} ${CUDA_LIBRARIES})
 endif (BUILD_CPP_IF)
 
 if (BUILD_PY_IF)