Normalize the descriptor per atom type and add energy bias for multicomponent systems; add a type fitting net for the smooth version; continue with a warning (instead of exiting) when the neighbor list length is not enough

Han Wang · Han Wang · commit 7312f58ff445 · 2018-07-24T13:24:17.000+08:00
diff --git a/examples/train/water.json b/examples/train/water.json
@@ -11,7 +11,7 @@
     "_comment":	"                    if type < 0, exclude type -(type+1)",
     "_comment": "                    for water (O:0, H:1) it can be",
     "_comment": "                    [0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0]",
-    "n_neuron":		[240, 120, 60, 30, 10],
+    "fitting_neuron":	[240, 120, 60, 30, 10],
 
     "_comment": " traing controls",
     "systems":		["../data/water/"],
diff --git a/examples/train/water_smth.json b/examples/train/water_smth.json
@@ -6,9 +6,11 @@
     "rcut":		6.00,
     "filter_neuron":	[25, 50, 100],
     "filter_resnet_dt":	false,
-    "n_axis_neuron":	16,
-    "n_neuron":		[240, 240, 240],
-    "resnet_dt":	true,
+    "axis_neuron":	16,
+    "fitting_neuron":	[240, 240, 240],
+    "fitting_resnet_dt":true,
+    "coord_norm":	true,
+    "type_fitting_net":	false,
 
     "_comment": " traing controls",
     "systems":		["../data/water/"],
diff --git a/source/lib/include/ComputeDescriptor.h b/source/lib/include/ComputeDescriptor.h
@@ -335,21 +335,25 @@ int format_nlist_fill_a (vector<int > &				fmt_nei_idx_a,
   sort (sel_nei.begin(), sel_nei.end());  
   
   vector<int > nei_iter = sec_a;
+  int overflowed = -1;
   for (unsigned kk = 0; kk < sel_nei.size(); ++kk){
     const int & nei_type = sel_nei[kk].type;
     if (nei_iter[nei_type] >= sec_a[nei_type+1]) {
       int r_idx_iter = (nei_iter[nei_type] ++) - sec_a[nei_type+1] + sec_r[nei_type];
       if (r_idx_iter >= sec_r[nei_type+1]) {
-	return nei_type;
+	// return nei_type;
+	overflowed = nei_type;
+      }
+      else {
+	fmt_nei_idx_r[r_idx_iter] = sel_nei[kk].index;
       }
-      fmt_nei_idx_r[r_idx_iter] = sel_nei[kk].index;
     }
     else {
       fmt_nei_idx_a[nei_iter[nei_type] ++] = sel_nei[kk].index;
     }
   }
   
-  return -1;
+  return overflowed;
 }
 
 
diff --git a/source/op/descrpt.cc b/source/op/descrpt.cc
@@ -75,6 +75,7 @@ class DescrptOp : public OpKernel {
     nnei_r = sec_r.back();
     nnei = nnei_a + nnei_r;
     fill_nei_a = (rcut_a < 0);
+    count_nei_idx_overflow = 0;
   }
 
   void Compute(OpKernelContext* context) override {
@@ -93,24 +94,27 @@ class DescrptOp : public OpKernel {
     OP_REQUIRES (context, (natoms_tensor.shape().dims() == 1),	errors::InvalidArgument ("Dim of natoms should be 1"));
     OP_REQUIRES (context, (box_tensor.shape().dims() == 2),	errors::InvalidArgument ("Dim of box should be 2"));
     OP_REQUIRES (context, (mesh_tensor.shape().dims() == 1),	errors::InvalidArgument ("Dim of mesh should be 1"));
-    OP_REQUIRES (context, (avg_tensor.shape().dims() == 1),	errors::InvalidArgument ("Dim of avg should be 1"));
-    OP_REQUIRES (context, (std_tensor.shape().dims() == 1),	errors::InvalidArgument ("Dim of std should be 1"));
+    OP_REQUIRES (context, (avg_tensor.shape().dims() == 2),	errors::InvalidArgument ("Dim of avg should be 2"));
+    OP_REQUIRES (context, (std_tensor.shape().dims() == 2),	errors::InvalidArgument ("Dim of std should be 2"));
 
     OP_REQUIRES (context, (natoms_tensor.shape().dim_size(0) >= 3),		errors::InvalidArgument ("number of atoms should be larger than (or equal to) 3"));
     auto natoms	= natoms_tensor	.flat<int>();
     int nloc = natoms(0);
     int nall = natoms(1);
+    int ntypes = natoms_tensor.shape().dim_size(0) - 2;
     int nsamples = coord_tensor.shape().dim_size(0);
 
     // check the sizes
     OP_REQUIRES (context, (nsamples == type_tensor.shape().dim_size(0)),	errors::InvalidArgument ("number of samples should match"));
     OP_REQUIRES (context, (nsamples == box_tensor.shape().dim_size(0)),		errors::InvalidArgument ("number of samples should match"));
-    OP_REQUIRES (context, (ndescrpt == avg_tensor.shape().dim_size(0)),		errors::InvalidArgument ("number of avg should be ndescrpt"));
-    OP_REQUIRES (context, (ndescrpt == std_tensor.shape().dim_size(0)),		errors::InvalidArgument ("number of std should be ndescrpt"));
+    OP_REQUIRES (context, (ntypes == avg_tensor.shape().dim_size(0)),		errors::InvalidArgument ("number of avg should be ntype"));
+    OP_REQUIRES (context, (ntypes == std_tensor.shape().dim_size(0)),		errors::InvalidArgument ("number of std should be ntype"));
 
     OP_REQUIRES (context, (nall * 3 == coord_tensor.shape().dim_size(1)),	errors::InvalidArgument ("number of atoms should match"));
     OP_REQUIRES (context, (nall == type_tensor.shape().dim_size(1)),		errors::InvalidArgument ("number of atoms should match"));
     OP_REQUIRES (context, (9 == box_tensor.shape().dim_size(1)),		errors::InvalidArgument ("number of box should be 9"));
+    OP_REQUIRES (context, (ndescrpt == avg_tensor.shape().dim_size(1)),		errors::InvalidArgument ("number of avg should be ndescrpt"));
+    OP_REQUIRES (context, (ndescrpt == std_tensor.shape().dim_size(1)),		errors::InvalidArgument ("number of std should be ndescrpt"));
 
     int nei_mode = 0;
     if (mesh_tensor.shape().dim_size(0) == 16) {
@@ -156,8 +160,8 @@ class DescrptOp : public OpKernel {
     auto type	= type_tensor	.matrix<int>();
     auto box	= box_tensor	.matrix<VALUETYPE>();
     auto mesh	= mesh_tensor	.flat<int>();
-    auto avg	= avg_tensor	.flat<VALUETYPE>();
-    auto std	= std_tensor	.flat<VALUETYPE>();
+    auto avg	= avg_tensor	.matrix<VALUETYPE>();
+    auto std	= std_tensor	.matrix<VALUETYPE>();
     auto descrpt	= descrpt_tensor	->matrix<VALUETYPE>();
     auto descrpt_deriv	= descrpt_deriv_tensor	->matrix<VALUETYPE>();
     auto rij		= rij_tensor		->matrix<VALUETYPE>();
@@ -170,7 +174,6 @@ class DescrptOp : public OpKernel {
     //   if (type(0, ii) > max_type_v) max_type_v = type(0, ii);
     // }
     // int ntypes = max_type_v + 1;
-    int ntypes = natoms_tensor.shape().dim_size(0) - 2;
     OP_REQUIRES (context, (ntypes == int(sel_a.size())),	errors::InvalidArgument ("number of types should match the length of sel array"));
     OP_REQUIRES (context, (ntypes == int(sel_r.size())),	errors::InvalidArgument ("number of types should match the length of sel array"));
 
@@ -270,8 +273,11 @@ class DescrptOp : public OpKernel {
 	int ret = -1;
 	if (fill_nei_a){
 	  if ((ret = format_nlist_fill_a (fmt_nlist_a, fmt_nlist_r, d_coord3, ntypes, d_type, region, b_pbc, ii, d_nlist_a[ii], d_nlist_r[ii], rcut_r, sec_a, sec_r)) != -1){
-	    cout << "Radial neighbor list length of type " << ret << " is not enough" << endl;
-	    exit(1);
+	    if (count_nei_idx_overflow == 0) {
+	      cout << "WARNING: Radial neighbor list length of type " << ret << " is not enough" << endl;
+	      flush(cout);
+	      count_nei_idx_overflow ++;
+	    }
 	  }
 	}
 
@@ -322,16 +328,16 @@ class DescrptOp : public OpKernel {
 	assert (int(fmt_nlist_r.size()) == nnei_r);
 	// record outputs
 	for (int jj = 0; jj < ndescrpt_a; ++jj) {
-	  descrpt(kk, ii * ndescrpt + jj) = (d_descrpt_a[jj] - avg(jj)) / std(jj);
+	  descrpt(kk, ii * ndescrpt + jj) = (d_descrpt_a[jj] - avg(d_type[ii], jj)) / std(d_type[ii], jj);
 	}
 	for (int jj = 0; jj < ndescrpt_r; ++jj) {
-	  descrpt(kk, ii * ndescrpt + ndescrpt_a + jj) = (d_descrpt_r[jj] - avg(ndescrpt_a + jj)) / std(ndescrpt_a + jj);
+	  descrpt(kk, ii * ndescrpt + ndescrpt_a + jj) = (d_descrpt_r[jj] - avg(d_type[ii], ndescrpt_a + jj)) / std(d_type[ii], ndescrpt_a + jj);
 	}
 	for (int jj = 0; jj < ndescrpt_a * 12; ++jj) {
-	  descrpt_deriv(kk, ii * ndescrpt * 12 + jj) = d_descrpt_a_deriv[jj] / std(jj/12);
+	  descrpt_deriv(kk, ii * ndescrpt * 12 + jj) = d_descrpt_a_deriv[jj] / std(d_type[ii], jj/12);
 	}
 	for (int jj = 0; jj < ndescrpt_r * 12; ++jj) {
-	  descrpt_deriv(kk, ii * ndescrpt * 12 + ndescrpt_a * 12 + jj) = d_descrpt_r_deriv[jj] / std(jj/12 + ndescrpt_a);
+	  descrpt_deriv(kk, ii * ndescrpt * 12 + ndescrpt_a * 12 + jj) = d_descrpt_r_deriv[jj] / std(d_type[ii], jj/12 + ndescrpt_a);
 	}
 	for (int jj = 0; jj < nnei_a * 3; ++jj){
 	  rij (kk, ii * nnei * 3 + jj) = d_rij_a[jj];
@@ -371,6 +377,7 @@ class DescrptOp : public OpKernel {
   int ndescrpt, ndescrpt_a, ndescrpt_r;
   int nnei, nnei_a, nnei_r;
   bool fill_nei_a;
+  int count_nei_idx_overflow;
   void 
   cum_sum (vector<int> & sec,
 	   const vector<int32> & n_sel) const {
diff --git a/source/op/descrpt_norot.cc b/source/op/descrpt_norot.cc
@@ -73,6 +73,7 @@ class DescrptNorotOp : public OpKernel {
     nnei_r = sec_r.back();
     nnei = nnei_a + nnei_r;
     fill_nei_a = (rcut_a < 0);
+    count_nei_idx_overflow = 0;
   }
 
   void Compute(OpKernelContext* context) override {
@@ -92,26 +93,29 @@ class DescrptNorotOp : public OpKernel {
     OP_REQUIRES (context, (natoms_tensor.shape().dims() == 1),	errors::InvalidArgument ("Dim of natoms should be 1"));
     OP_REQUIRES (context, (box_tensor.shape().dims() == 2),	errors::InvalidArgument ("Dim of box should be 2"));
     OP_REQUIRES (context, (mesh_tensor.shape().dims() == 1),	errors::InvalidArgument ("Dim of mesh should be 1"));
-    OP_REQUIRES (context, (avg_tensor.shape().dims() == 1),	errors::InvalidArgument ("Dim of avg should be 1"));
-    OP_REQUIRES (context, (std_tensor.shape().dims() == 1),	errors::InvalidArgument ("Dim of std should be 1"));
+    OP_REQUIRES (context, (avg_tensor.shape().dims() == 2),	errors::InvalidArgument ("Dim of avg should be 2"));
+    OP_REQUIRES (context, (std_tensor.shape().dims() == 2),	errors::InvalidArgument ("Dim of std should be 2"));
     OP_REQUIRES (context, (fill_nei_a),				errors::InvalidArgument ("Rotational free descriptor only support the case rcut_a < 0"));
     OP_REQUIRES (context, (sec_r.back() == 0),			errors::InvalidArgument ("Rotational free descriptor only support all-angular information: sel_r should be all zero."));
 
     OP_REQUIRES (context, (natoms_tensor.shape().dim_size(0) >= 3),		errors::InvalidArgument ("number of atoms should be larger than (or equal to) 3"));
     auto natoms	= natoms_tensor	.flat<int>();
     int nloc = natoms(0);
     int nall = natoms(1);
+    int ntypes = natoms_tensor.shape().dim_size(0) - 2;
     int nsamples = coord_tensor.shape().dim_size(0);
 
     // check the sizes
     OP_REQUIRES (context, (nsamples == type_tensor.shape().dim_size(0)),	errors::InvalidArgument ("number of samples should match"));
     OP_REQUIRES (context, (nsamples == box_tensor.shape().dim_size(0)),		errors::InvalidArgument ("number of samples should match"));
-    OP_REQUIRES (context, (ndescrpt == avg_tensor.shape().dim_size(0)),		errors::InvalidArgument ("number of avg should be ndescrpt"));
-    OP_REQUIRES (context, (ndescrpt == std_tensor.shape().dim_size(0)),		errors::InvalidArgument ("number of std should be ndescrpt"));
+    OP_REQUIRES (context, (ntypes == avg_tensor.shape().dim_size(0)),		errors::InvalidArgument ("number of avg should be ntype"));
+    OP_REQUIRES (context, (ntypes == std_tensor.shape().dim_size(0)),		errors::InvalidArgument ("number of std should be ntype"));
 
     OP_REQUIRES (context, (nall * 3 == coord_tensor.shape().dim_size(1)),	errors::InvalidArgument ("number of atoms should match"));
     OP_REQUIRES (context, (nall == type_tensor.shape().dim_size(1)),		errors::InvalidArgument ("number of atoms should match"));
     OP_REQUIRES (context, (9 == box_tensor.shape().dim_size(1)),		errors::InvalidArgument ("number of box should be 9"));
+    OP_REQUIRES (context, (ndescrpt == avg_tensor.shape().dim_size(1)),		errors::InvalidArgument ("number of avg should be ndescrpt"));
+    OP_REQUIRES (context, (ndescrpt == std_tensor.shape().dim_size(1)),		errors::InvalidArgument ("number of std should be ndescrpt"));
 
     int nei_mode = 0;
     if (mesh_tensor.shape().dim_size(0) == 16) {
@@ -161,8 +165,8 @@ class DescrptNorotOp : public OpKernel {
     auto type	= type_tensor	.matrix<int>();
     auto box	= box_tensor	.matrix<VALUETYPE>();
     auto mesh	= mesh_tensor	.flat<int>();
-    auto avg	= avg_tensor	.flat<VALUETYPE>();
-    auto std	= std_tensor	.flat<VALUETYPE>();
+    auto avg	= avg_tensor	.matrix<VALUETYPE>();
+    auto std	= std_tensor	.matrix<VALUETYPE>();
     auto descrpt	= descrpt_tensor	->matrix<VALUETYPE>();
     auto descrpt_deriv	= descrpt_deriv_tensor	->matrix<VALUETYPE>();
     auto rij		= rij_tensor		->matrix<VALUETYPE>();
@@ -174,7 +178,6 @@ class DescrptNorotOp : public OpKernel {
     //   if (type(0, ii) > max_type_v) max_type_v = type(0, ii);
     // }
     // int ntypes = max_type_v + 1;
-    int ntypes = natoms_tensor.shape().dim_size(0) - 2;
     OP_REQUIRES (context, (ntypes == int(sel_a.size())),	errors::InvalidArgument ("number of types should match the length of sel array"));
     OP_REQUIRES (context, (ntypes == int(sel_r.size())),	errors::InvalidArgument ("number of types should match the length of sel array"));
 
@@ -274,8 +277,11 @@ class DescrptNorotOp : public OpKernel {
 	int ret = -1;
 	if (fill_nei_a){
 	  if ((ret = format_nlist_fill_a (fmt_nlist_a, fmt_nlist_r, d_coord3, ntypes, d_type, region, b_pbc, ii, d_nlist_a[ii], d_nlist_r[ii], rcut_r, sec_a, sec_r)) != -1){
-	    cout << "Radial neighbor list length of type " << ret << " is not enough" << endl;
-	    exit(1);
+	    if (count_nei_idx_overflow == 0) {
+	      cout << "WARNING: Radial neighbor list length of type " << ret << " is not enough" << endl;
+	      flush(cout);
+	      count_nei_idx_overflow ++;
+	    }
 	  }
 	}
 
@@ -306,10 +312,10 @@ class DescrptNorotOp : public OpKernel {
 	assert (int(fmt_nlist_a.size()) == nnei_a);
 	// record outputs
 	for (int jj = 0; jj < ndescrpt_a; ++jj) {
-	  descrpt(kk, ii * ndescrpt + jj) = (d_descrpt_a[jj] - avg(jj)) / std(jj);
+	  descrpt(kk, ii * ndescrpt + jj) = (d_descrpt_a[jj] - avg(d_type[ii], jj)) / std(d_type[ii], jj);
 	}
 	for (int jj = 0; jj < ndescrpt_a * 3; ++jj) {
-	  descrpt_deriv(kk, ii * ndescrpt * 3 + jj) = d_descrpt_a_deriv[jj] / std(jj/3);
+	  descrpt_deriv(kk, ii * ndescrpt * 3 + jj) = d_descrpt_a_deriv[jj] / std(d_type[ii], jj/3);
 	}
 	for (int jj = 0; jj < nnei_a * 3; ++jj){
 	  rij (kk, ii * nnei * 3 + jj) = d_rij_a[jj];
@@ -335,6 +341,7 @@ class DescrptNorotOp : public OpKernel {
   int ndescrpt, ndescrpt_a, ndescrpt_r;
   int nnei, nnei_a, nnei_r;
   bool fill_nei_a;
+  int count_nei_idx_overflow;
   void 
   cum_sum (vector<int> & sec,
 	   const vector<int32> & n_sel) const {
diff --git a/source/train/Data.py b/source/train/Data.py
@@ -10,27 +10,20 @@ class DataSets (object):
     def __init__ (self, 
                   sys_path,
                   set_prefix,
-                  do_norm = False,
                   seed = None) :
-        self.dirs = glob.glob (sys_path + "/" + set_prefix + ".*")
+        self.dirs = glob.glob (os.path.join(sys_path, set_prefix + ".*"))
         self.dirs.sort()
-        if os.path.isfile (sys_path + "/ncopies.raw") :
-            self.ncopies = np.loadtxt (sys_path + "/ncopies.raw", dtype=np.int32)
-        else :
-            self.ncopies = [1]
-
         # load atom type
         self.atom_type, self.idx_map, self.idx3_map = self.load_type (sys_path)
-        
-        self.do_norm = do_norm
-        self.eavg = self.stats_energy()
-        # print ("avg is ",self.eavg)
-
+        # train dirs
         self.test_dir   = self.dirs[-1]
         if len(self.dirs) == 1 :
             self.train_dirs = self.dirs
         else :
             self.train_dirs = self.dirs[:-1]
+        # energy norm
+        self.eavg = self.stats_energy()
+        # load sets
         self.set_count = 0
         self.load_batch_set (self.train_dirs[self.set_count % self.get_numb_set()])
         self.load_test_set (self.test_dir)
@@ -65,11 +58,11 @@ def get_numb_set (self) :
         return len (self.train_dirs)
     
     def stats_energy (self) :
-        eners = []
-        for ii in self.dirs:
-            ei = np.load (ii + "/energy.npy")
-            eners.append (np.average(ei))
-        return np.average (eners)
+        eners = np.array([])
+        for ii in self.train_dirs:
+            ei = np.load(os.path.join(ii, "energy.npy"))
+            eners = np.append(eners, ei)
+        return np.average(eners)
     
     def cond_load_vec (self, 
                        nframes,
@@ -119,7 +112,6 @@ def load_batch_set (self,
         self.box_batch = self.box_batch[idx]
         self.type_batch = np.tile (self.atom_type, (nframe, 1))
         self.reset_iter ()
-        if self.do_norm: self.normalization (self.energy_batch)
         # sort according to type
         self.type_batch = self.type_batch[:, self.idx_map]
         self.coord_batch = self.coord_batch[:, self.idx3_map]
@@ -146,7 +138,6 @@ def load_test_set (self,
         self.coord_test = self.coord_test[idx]
         self.box_test = self.box_test[idx]
         self.type_test = np.tile (self.atom_type, (nframe, 1))
-        if self.do_norm: self.normalization (self.energy_test)
         self.type_test = self.type_test[:, self.idx_map]
         self.coord_test = self.coord_test[:, self.idx3_map]
         self.force_test = self.force_test[:, self.idx3_map]
@@ -174,12 +165,6 @@ def get_batch (self,
         self.iterator += batch_size
         return self.prop_c_batch.astype(np.float32), self.energy_batch[idx].astype(np.float64), self.force_batch[idx, :].astype(np.float64), self.virial_batch[idx, :].astype(np.float64), self.coord_batch[idx, :].astype(np.float64), self.box_batch[idx, :].astype(np.float64), self.type_batch[idx, :]
     
-    def normalization (self, 
-                       energy) :
-        if self.do_norm : 
-            for ii in range (energy.shape[0]) :
-                energy[ii] -= self.eavg
-
     def get_natoms (self) :
         sample_type = self.type_batch[0]
         natoms = len(sample_type)
@@ -199,22 +184,18 @@ def get_natoms_vec (self, ntypes) :
         tmp = np.append (tmp, natoms_vec)
         return tmp.astype(np.int32)
 
-    def get_ncopies (self) :
-        return self.ncopies
-
     def set_numb_batch (self, 
                         batch_size) :
         return self.energy_batch.shape[0] // batch_size
 
     def get_sys_numb_batch (self, batch_size) :
         return self.set_numb_batch(batch_size) * self.get_numb_set()
 
-    def get_bias_atom_e (self) :
-        natoms = self.get_natoms ()
-        return self.eavg / natoms
+    def get_ener (self) :
+        return self.eavg
 
 if __name__ == '__main__':
-    data = DataSets (".", "set", do_norm = False)
+    data = DataSets (".", "set")
     energy, force, virial, coord, box, ttype = data.get_batch(1)
     print (energy.shape)
     print (force.shape)
diff --git a/source/train/DataSystem.py b/source/train/DataSystem.py
diff --git a/source/train/Model.py b/source/train/Model.py

Original file line number	Diff line number	Diff line change
`@@ -335,21 +335,25 @@ int format_nlist_fill_a (vector<int > & fmt_nei_idx_a,`
`335`	`335`	`sort (sel_nei.begin(), sel_nei.end());`
`336`	`336`
`337`	`337`	`vector<int > nei_iter = sec_a;`
	`338`	`+ int overflowed = -1;`
`338`	`339`	`for (unsigned kk = 0; kk < sel_nei.size(); ++kk){`
`339`	`340`	`const int & nei_type = sel_nei[kk].type;`
`340`	`341`	`if (nei_iter[nei_type] >= sec_a[nei_type+1]) {`
`341`	`342`	`int r_idx_iter = (nei_iter[nei_type] ++) - sec_a[nei_type+1] + sec_r[nei_type];`
`342`	`343`	`if (r_idx_iter >= sec_r[nei_type+1]) {`
`343`		`- return nei_type;`
	`344`	`+ // return nei_type;`
	`345`	`+ overflowed = nei_type;`
	`346`	`+ }`
	`347`	`+ else {`
	`348`	`+ fmt_nei_idx_r[r_idx_iter] = sel_nei[kk].index;`
`344`	`349`	`}`
`345`		`- fmt_nei_idx_r[r_idx_iter] = sel_nei[kk].index;`
`346`	`350`	`}`
`347`	`351`	`else {`
`348`	`352`	`fmt_nei_idx_a[nei_iter[nei_type] ++] = sel_nei[kk].index;`
`349`	`353`	`}`
`350`	`354`	`}`
`351`	`355`
`352`		`- return -1;`
	`356`	`+ return overflowed;`
`353`	`357`	`}`
`354`	`358`
`355`	`359`