Skip to content

Commit f783eda

Browse files
committed
Renamed run.py to smiles_regress_transformer_run_hvd.py and added a Polaris run script
1 parent 411daee commit f783eda

File tree

3 files changed

+41
-3
lines changed

3 files changed

+41
-3
lines changed

Pilot1/ST1/polaris_sub_hvd.sh

Lines changed: 39 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,39 @@
#!/bin/bash
#PBS -N st_hvd
#PBS -l select=2
#PBS -l walltime=24:00:00
#PBS -q preemptable
#PBS -l filesystems=grand
#PBS -A datascience
#PBS -o logs/
#PBS -e logs/
#PBS -m abe

# PBS batch script that runs smiles_regress_transformer_run_hvd.py, either
# directly with `python` (HVDSWITCH=False) or under `mpiexec` (any other
# value). The Python script is referenced by a relative path, so the job has
# to start in the directory that contains it.

# Directory holding the training and validation files.
DATA_PATH=/grand/datascience/avasan/ST_Benchmarks/Data/1M-flatten

TFIL=ml.3CLPro_7BQY_A_1_F.Orderable_zinc_db_enaHLL.sorted.4col.dd.parquet.xform-smiles.csv.reg.train
VFIL=ml.3CLPro_7BQY_A_1_F.Orderable_zinc_db_enaHLL.sorted.4col.dd.parquet.xform-smiles.csv.reg.val

# Values forwarded unchanged to the Python script's command-line options.
EP=400
NUMHEAD=16
DR_TB=0.1
DR_ff=0.1

ACT=elu
DROP=False
LR=0.0000025
LOSS=mean_squared_error
HVDSWITCH=True

# Options shared by both launch modes. An array keeps every value a single
# word even if a path ever contains whitespace.
train_args=(
  --in_train "${DATA_PATH}/${TFIL}"
  --in_vali "${DATA_PATH}/${VFIL}"
  --ep "$EP"
  --num_heads "$NUMHEAD"
  --DR_TB "$DR_TB"
  --DR_ff "$DR_ff"
  --activation "$ACT"
  --drop_post_MHA "$DROP"
  --lr "$LR"
  --loss_fn "$LOSS"
  --hvd_switch "$HVDSWITCH"
)

# `[` is an ordinary command and needs whitespace on both sides. Written as
# `[$HVDSWITCH = False]`, the shell looks for a command literally named
# "[True" (or "[False"), fails, and always takes the mpiexec branch.
if [ "$HVDSWITCH" = False ]; then
  python smiles_regress_transformer_run_hvd.py "${train_args[@]}"
else
  NP=8             # passed to mpiexec --np
  PPN=4            # passed to mpiexec -ppn
  OUT=logfile.log  # receives stdout of the mpiexec run (stderr is not redirected)
  mpiexec --np "$NP" -ppn "$PPN" --cpu-bind verbose,list:0,1,2,3,4,5,6,7 \
    -env NCCL_COLLNET_ENABLE=1 -env NCCL_NET_GDR_LEVEL=PHB \
    python smiles_regress_transformer_run_hvd.py "${train_args[@]}" > "$OUT"
fi
File renamed without changes.

Pilot1/ST1/sub_hvd.sh

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -20,13 +20,12 @@ LOSS=mean_squared_error
2020
HVDSWITCH=True
2121

2222
# `[` is a command and needs spaces around it; `[$HVDSWITCH` would be run as a command named "[True".
if [ "$HVDSWITCH" = False ]; then
23-
python run.py --in_train ${DATA_PATH}/${TFIL} --in_vali ${DATA_PATH}/${VFIL} --ep $EP --num_heads $NUMHEAD --DR_TB $DR_TB --DR_ff $DR_ff --activation $ACT --drop_post_MHA $DROP --lr $LR --loss_fn $LOSS --hvd_switch $HVDSWITCH
23+
python smiles_regress_transformer_run_hvd.py --in_train ${DATA_PATH}/${TFIL} --in_vali ${DATA_PATH}/${VFIL} --ep $EP --num_heads $NUMHEAD --DR_TB $DR_TB --DR_ff $DR_ff --activation $ACT --drop_post_MHA $DROP --lr $LR --loss_fn $LOSS --hvd_switch $HVDSWITCH
2424

2525
else
2626
NP=8
2727
PPN=4
2828
OUT=logfile.log
29-
mpiexec --np $NP -ppn $PPN --cpu-bind verbose,list:0,1,2,3,4,5,6,7 -env NCCL_COLLNET_ENABLE=1 -env NCCL_NET_GDR_LEVEL=PHB python run.py --in_train ${DATA_PATH}/${TFIL} --in_vali ${DATA_PATH}/${VFIL} --ep $EP --num_heads $NUMHEAD --DR_TB $DR_TB --DR_ff $DR_ff --activation $ACT --drop_post_MHA $DROP --lr $LR --loss_fn $LOSS --hvd_switch $HVDSWITCH > $OUT
29+
mpiexec --np $NP -ppn $PPN --cpu-bind verbose,list:0,1,2,3,4,5,6,7 -env NCCL_COLLNET_ENABLE=1 -env NCCL_NET_GDR_LEVEL=PHB python smiles_regress_transformer_run_hvd.py --in_train ${DATA_PATH}/${TFIL} --in_vali ${DATA_PATH}/${VFIL} --ep $EP --num_heads $NUMHEAD --DR_TB $DR_TB --DR_ff $DR_ff --activation $ACT --drop_post_MHA $DROP --lr $LR --loss_fn $LOSS --hvd_switch $HVDSWITCH > $OUT
3030

3131
fi
32-

0 commit comments

Comments
 (0)