
Commit d4d15f7

Pre-commit prescribed fixes
1 parent 8b17fd3 commit d4d15f7

19 files changed: 1418 additions & 826 deletions

Pilot1/Attn/attn.py

Lines changed: 1 addition & 1 deletion
@@ -133,7 +133,7 @@ def load_data(params, seed):
     file_train = params["train_data"]
     cdd = os.environ["CANDLE_DATA_DIR"]
     train_file = candle.get_file(
-        file_train, url + file_train, datadir = cdd, cache_subdir="Pilot1"
+        file_train, url + file_train, datadir=cdd, cache_subdir="Pilot1"
     )
 
     df_x_train_0 = pd.read_hdf(train_file, "x_train_0").astype(np.float32)
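
For context on the hunk above: `candle.get_file` is the CANDLE benchmarks' download-and-cache helper, and the fix only normalizes keyword-argument spacing. Below is a minimal sketch of the idiom, assuming `CANDLE_DATA_DIR` is exported and that `candle.get_file` behaves like `keras.utils.get_file` (fetch once, return the cached local path); `url` and the file name here are placeholders, not values from this repo:

```python
import os

import candle  # CANDLE utility library used throughout these benchmarks

# Placeholder values for illustration; in attn.py they come from params.
url = "https://example.org/pilot1/"   # hypothetical base URL
file_train = "train_data.h5"          # hypothetical file name

# The cache root is taken from the environment, so the same code works
# anywhere CANDLE_DATA_DIR points at writable local storage.
cdd = os.environ["CANDLE_DATA_DIR"]

# Downloads url + file_train on first use, caches it under
# $CANDLE_DATA_DIR/Pilot1/, and returns the local path thereafter.
train_file = candle.get_file(
    file_train, url + file_train, datadir=cdd, cache_subdir="Pilot1"
)
print(train_file)
```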

Pilot1/ST1/README.md

Lines changed: 0 additions & 1 deletion
@@ -191,4 +191,3 @@ CHEMBL -- 1.5M training examples (shuffled and resampled so not same 1.5M as cla
 Predicting molecular Weight validation
 Is also 100K samples non-overlapping.
 Regression problem achieves R^2 about .95 after ~20 epochs.
-
Pilot1/ST1/clr_callback.py

Lines changed: 52 additions & 40 deletions
@@ -1,45 +1,46 @@
-from tensorflow.keras.callbacks import *
-from tensorflow.keras import backend as K
 import numpy as np
+from tensorflow.keras import backend as K
+from tensorflow.keras.callbacks import *
+
 
 class CyclicLR(Callback):
     """This callback implements a cyclical learning rate policy (CLR).
     The method cycles the learning rate between two boundaries with
     some constant frequency, as detailed in this paper (https://arxiv.org/abs/1506.01186).
-    The amplitude of the cycle can be scaled on a per-iteration or 
+    The amplitude of the cycle can be scaled on a per-iteration or
     per-cycle basis.
     This class has three built-in policies, as put forth in the paper.
     "triangular":
         A basic triangular cycle w/ no amplitude scaling.
     "triangular2":
         A basic triangular cycle that scales initial amplitude by half each cycle.
     "exp_range":
-        A cycle that scales initial amplitude by gamma**(cycle iterations) at each 
+        A cycle that scales initial amplitude by gamma**(cycle iterations) at each
         cycle iteration.
     For more detail, please see paper.
-    
+
     # Example
     ```python
         clr = CyclicLR(base_lr=0.001, max_lr=0.006,
                        step_size=2000., mode='triangular')
         model.fit(X_train, Y_train, callbacks=[clr])
     ```
-    
+
     Class also supports custom scaling functions:
     ```python
         clr_fn = lambda x: 0.5*(1+np.sin(x*np.pi/2.))
         clr = CyclicLR(base_lr=0.001, max_lr=0.006,
                        step_size=2000., scale_fn=clr_fn,
                        scale_mode='cycle')
         model.fit(X_train, Y_train, callbacks=[clr])
-    ``` 
+    ```
     # Arguments
         base_lr: initial learning rate which is the
             lower boundary in the cycle.
         max_lr: upper boundary in the cycle. Functionally,
             it defines the cycle amplitude (max_lr - base_lr).
             The lr at any cycle is the sum of base_lr
-            and some scaling of the amplitude; therefore 
+            and some scaling of the amplitude; therefore
             max_lr may not actually be reached depending on
             scaling function.
         step_size: number of training iterations per
@@ -52,17 +53,25 @@ class CyclicLR(Callback):
         gamma: constant in 'exp_range' scaling function:
             gamma**(cycle iterations)
         scale_fn: Custom scaling policy defined by a single
-            argument lambda function, where 
+            argument lambda function, where
            0 <= scale_fn(x) <= 1 for all x >= 0.
-            mode paramater is ignored 
+            mode paramater is ignored
         scale_mode: {'cycle', 'iterations'}.
-            Defines whether scale_fn is evaluated on 
+            Defines whether scale_fn is evaluated on
             cycle number or cycle iterations (training
             iterations since start of cycle). Default is 'cycle'.
     """
 
-    def __init__(self, base_lr=0.001, max_lr=0.006, step_size=2000., mode='triangular',
-                 gamma=1., scale_fn=None, scale_mode='cycle'):
+    def __init__(
+        self,
+        base_lr=0.001,
+        max_lr=0.006,
+        step_size=2000.0,
+        mode="triangular",
+        gamma=1.0,
+        scale_fn=None,
+        scale_mode="cycle",
+    ):
         super(CyclicLR, self).__init__()
 
         self.base_lr = base_lr
@@ -71,26 +80,25 @@ def __init__(self, base_lr=0.001, max_lr=0.006, step_size=2000., mode='triangula
         self.mode = mode
         self.gamma = gamma
         if scale_fn == None:
-            if self.mode == 'triangular':
-                self.scale_fn = lambda x: 1.
-                self.scale_mode = 'cycle'
-            elif self.mode == 'triangular2':
-                self.scale_fn = lambda x: 1/(2.**(x-1))
-                self.scale_mode = 'cycle'
-            elif self.mode == 'exp_range':
-                self.scale_fn = lambda x: gamma**(x)
-                self.scale_mode = 'iterations'
+            if self.mode == "triangular":
+                self.scale_fn = lambda x: 1.0
+                self.scale_mode = "cycle"
+            elif self.mode == "triangular2":
+                self.scale_fn = lambda x: 1 / (2.0 ** (x - 1))
+                self.scale_mode = "cycle"
+            elif self.mode == "exp_range":
+                self.scale_fn = lambda x: gamma ** (x)
+                self.scale_mode = "iterations"
         else:
             self.scale_fn = scale_fn
             self.scale_mode = scale_mode
-        self.clr_iterations = 0.
-        self.trn_iterations = 0.
+        self.clr_iterations = 0.0
+        self.trn_iterations = 0.0
         self.history = {}
 
         self._reset()
 
-    def _reset(self, new_base_lr=None, new_max_lr=None,
-               new_step_size=None):
+    def _reset(self, new_base_lr=None, new_max_lr=None, new_step_size=None):
         """Resets cycle iterations.
         Optional boundary/step size adjustment.
         """
@@ -100,34 +108,38 @@ def _reset(self, new_base_lr=None, new_max_lr=None,
             self.max_lr = new_max_lr
         if new_step_size != None:
             self.step_size = new_step_size
-        self.clr_iterations = 0.
-        
+        self.clr_iterations = 0.0
+
     def clr(self):
-        cycle = np.floor(1+self.clr_iterations/(2*self.step_size))
-        x = np.abs(self.clr_iterations/self.step_size - 2*cycle + 1)
-        if self.scale_mode == 'cycle':
-            return self.base_lr + (self.max_lr-self.base_lr)*np.maximum(0, (1-x))*self.scale_fn(cycle)
+        cycle = np.floor(1 + self.clr_iterations / (2 * self.step_size))
+        x = np.abs(self.clr_iterations / self.step_size - 2 * cycle + 1)
+        if self.scale_mode == "cycle":
+            return self.base_lr + (self.max_lr - self.base_lr) * np.maximum(
+                0, (1 - x)
+            ) * self.scale_fn(cycle)
         else:
-            return self.base_lr + (self.max_lr-self.base_lr)*np.maximum(0, (1-x))*self.scale_fn(self.clr_iterations)
-        
+            return self.base_lr + (self.max_lr - self.base_lr) * np.maximum(
+                0, (1 - x)
+            ) * self.scale_fn(self.clr_iterations)
+
     def on_train_begin(self, logs={}):
         logs = logs or {}
 
         if self.clr_iterations == 0:
             K.set_value(self.model.optimizer.lr, self.base_lr)
         else:
-            K.set_value(self.model.optimizer.lr, self.clr())        
-        
+            K.set_value(self.model.optimizer.lr, self.clr())
+
     def on_batch_end(self, epoch, logs=None):
-        
+
         logs = logs or {}
         self.trn_iterations += 1
         self.clr_iterations += 1
 
-        self.history.setdefault('lr', []).append(K.get_value(self.model.optimizer.lr))
-        self.history.setdefault('iterations', []).append(self.trn_iterations)
+        self.history.setdefault("lr", []).append(K.get_value(self.model.optimizer.lr))
+        self.history.setdefault("iterations", []).append(self.trn_iterations)
 
         for k, v in logs.items():
             self.history.setdefault(k, []).append(v)
-        
+
         K.set_value(self.model.optimizer.lr, self.clr())
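
Since this file is almost entirely reformatting, it is worth checking that the reflowed `clr()` arithmetic is unchanged. Here is a standalone sketch of the triangular schedule it computes, using the exact formulas from the hunk above; the `base_lr`/`max_lr`/`step_size` values are the docstring's example values, not anything this commit changes:

```python
import numpy as np

# Example values from the CyclicLR docstring above.
base_lr, max_lr, step_size = 0.001, 0.006, 2000.0

def triangular_lr(clr_iterations):
    # Same arithmetic as CyclicLR.clr() with mode="triangular",
    # where scale_fn(x) == 1.0 and scale_mode == "cycle".
    cycle = np.floor(1 + clr_iterations / (2 * step_size))
    x = np.abs(clr_iterations / step_size - 2 * cycle + 1)
    return base_lr + (max_lr - base_lr) * np.maximum(0, (1 - x))

# The LR climbs from base_lr to max_lr over step_size iterations, then
# descends back, repeating every 2 * step_size iterations.
for it in (0, 1000, 2000, 3000, 4000):
    print(it, triangular_lr(it))   # 0.001, 0.0035, 0.006, 0.0035, 0.001
```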
Lines changed: 43 additions & 44 deletions
@@ -1,52 +1,51 @@
 {
-    "general": {
-        "use_hvd": true,
-        "batch_size": 64,
-        "epochs": 400,
-        "lr": 0.00000991301767144166,
-        "loss_fn": "mean_squared_error"
-    },
+  "general": {
+    "use_hvd": true,
+    "batch_size": 64,
+    "epochs": 400,
+    "lr": 0.00000991301767144166,
+    "loss_fn": "mean_squared_error"
+  },
 
-    "data_loading": {
-        "data_path": "/lus/grand/projects/datascience/avasan/Data_Docking/2M-flatten",
-        "rec": "3CLPro_7BQY_A_1_F",
-        "pattern": "Orderable_zinc_db_enaHLL.sorted.4col.descriptors.parquet.xform-smiles.csv.reg"
-    },
+  "data_loading": {
+    "data_path": "/lus/grand/projects/datascience/avasan/Data_Docking/2M-flatten",
+    "rec": "3CLPro_7BQY_A_1_F",
+    "pattern": "Orderable_zinc_db_enaHLL.sorted.4col.descriptors.parquet.xform-smiles.csv.reg"
+  },
 
-    "tokenization": {
-        "vocab_size": 3132,
-        "maxlen": 45,
-        "tokenizer": {
-            "category": "smilespair",
-            "spe_file": "VocabFiles/SPE_ChEMBL.txt",
-            "vocab_file": "VocabFiles/vocab_spe.txt"
-        }
-    },
+  "tokenization": {
+    "vocab_size": 3132,
+    "maxlen": 45,
+    "tokenizer": {
+      "category": "smilespair",
+      "spe_file": "VocabFiles/SPE_ChEMBL.txt",
+      "vocab_file": "VocabFiles/vocab_spe.txt"
+    }
+  },
 
-    "architecture": {
-        "embedding": {
-            "embed_dim": 128
-        },
-        "transformer_block": {
-            "num_blocks": 5,
-            "activation": "selu",
-            "ff_dim": 128,
-            "num_heads": 21,
-            "dr1": 0.12717945391278226,
-            "dr2": 0.12717945391278226,
-            "drop_mha": true
-        },
-        "regressor_head": {
-            "activation": "selu",
-            "dr": 0.04990303516069576
-        }
+  "architecture": {
+    "embedding": {
+      "embed_dim": 128
+    },
+    "transformer_block": {
+      "num_blocks": 5,
+      "activation": "selu",
+      "ff_dim": 128,
+      "num_heads": 21,
+      "dr1": 0.12717945391278226,
+      "dr2": 0.12717945391278226,
+      "drop_mha": true
     },
-
-    "callbacks": {
-        "checkpt_file": "smile_regress.autosave.model.h5",
-        "log_csv": "smile_regress.training.log",
-        "patience_red_lr": 20,
-        "patience_early_stop": 100
+    "regressor_head": {
+      "activation": "selu",
+      "dr": 0.04990303516069576
     }
+  },
 
+  "callbacks": {
+    "checkpt_file": "smile_regress.autosave.model.h5",
+    "log_csv": "smile_regress.training.log",
+    "patience_red_lr": 20,
+    "patience_early_stop": 100
+  }
 }
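
The file above (its name is not preserved on this page) is a plain JSON hyperparameter config, and the diff only re-indents it, so consumers are unaffected. A minimal sketch of reading it, with `config.json` as a stand-in for the real filename:

```python
import json

# "config.json" is a placeholder; the commit page above omits the filename.
with open("config.json") as f:
    cfg = json.load(f)

# The top-level sections mirror the training pipeline's stages.
lr = cfg["general"]["lr"]                                          # 9.913e-06
maxlen = cfg["tokenization"]["maxlen"]                             # 45
num_heads = cfg["architecture"]["transformer_block"]["num_heads"]  # 21
ckpt = cfg["callbacks"]["checkpt_file"]   # smile_regress.autosave.model.h5
print(lr, maxlen, num_heads, ckpt)
```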

Pilot1/ST1/polaris_sub_hvd.sh

Lines changed: 0 additions & 1 deletion
@@ -36,4 +36,3 @@ else
 mpiexec --np $NP -ppn $PPN --cpu-bind verbose,list:0,1,2,3,4,5,6,7 -env NCCL_COLLNET_ENABLE=1 -env NCCL_NET_GDR_LEVEL=PHB python smiles_regress_transformer_run_hvd.py --in_train ${DATA_PATH}/${TFIL} --in_vali ${DATA_PATH}/${VFIL} --ep $EP --num_heads $NUMHEAD --DR_TB $DR_TB --DR_ff $DR_ff --activation $ACT --drop_post_MHA $DROP --lr $LR --loss_fn $LOSS --hvd_switch $HVDSWITCH > $OUT
 
 fi
-
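
The `mpiexec` line above launches one Python rank per GPU and forwards `--hvd_switch` to the training script. A hedged sketch of the generic Horovod/Keras setup such a switch typically enables; this is the standard `horovod.tensorflow.keras` pattern, not the script's verbatim code:

```python
import horovod.tensorflow.keras as hvd
import tensorflow as tf

hvd.init()  # one process per MPI rank, as started by mpiexec

# Pin each rank to a single local GPU.
gpus = tf.config.list_physical_devices("GPU")
if gpus:
    tf.config.set_visible_devices(gpus[hvd.local_rank()], "GPU")

# Scale the learning rate by world size and wrap the optimizer so
# gradients are averaged across ranks each step.
opt = hvd.DistributedOptimizer(tf.keras.optimizers.Adam(1e-4 * hvd.size()))

# Keep weights in sync at start; restrict checkpointing to rank 0.
callbacks = [hvd.callbacks.BroadcastGlobalVariablesCallback(0)]
if hvd.rank() == 0:
    callbacks.append(tf.keras.callbacks.ModelCheckpoint("autosave.h5"))
```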

Pilot1/ST1/polaris_sub_smiles_regress_transformer_spe.sh

Lines changed: 1 addition & 1 deletion
@@ -13,7 +13,7 @@
 module load conda/2022-09-08
 conda activate
 
-cd /grand/datascience/avasan/ST_Benchmarks/Test_Tokenizers/SMILESPair_Encoder_continue 
+cd /grand/datascience/avasan/ST_Benchmarks/Test_Tokenizers/SMILESPair_Encoder_continue
 
 NP=16
 PPN=4
