-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathtrain-batch.sh
More file actions
35 lines (25 loc) · 976 Bytes
/
train-batch.sh
File metadata and controls
35 lines (25 loc) · 976 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
#!/bin/bash
#SBATCH -J LP_ResNet_train
#SBATCH -p gpu
#SBATCH --gpus-per-node=1
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1
#SBATCH --time=48:00:00
#SBATCH -o out/LP_ResNet_train/running_jobs/%J_%a.out
#SBATCH -e out/LP_ResNet_train/running_jobs/%J_%a.err
#SBATCH --mail-user=skarukas@iu.edu
#SBATCH --mail-type=ALL,ARRAY_TASKS
#SBATCH --array=0-3
# NOTE: make sure the output/error folders exist before running
module load deeplearning/2.6.0
ParamFiles=(resnet20 resnet32 resnet44 resnet56)
# output dir
ExperimentRelativePath="rotvshn/svhn_std_max"
ParamFile=${ParamFiles[$SLURM_ARRAY_TASK_ID]}
EXPERIMENT_DIR="out/$SLURM_JOB_NAME/${ExperimentRelativePath}_${SLURM_ARRAY_JOB_ID}/${ParamFile}_${SLURM_ARRAY_TASK_ID}"
# path of input YAML file
ParamFile=param-files/LPResNet/RotSVHN/${ParamFile}.yaml
mkdir -p $EXPERIMENT_DIR
echo "Task ID: ${SLURM_ARRAY_TASK_ID}"
echo "Using params from $ParamFile"
python3 train.py --param ${ParamFile} --out_dir $EXPERIMENT_DIR