From a823b0899059844b04fcfb0ba6a42ac7329c8c88 Mon Sep 17 00:00:00 2001
From: Matthieu Dorier
Date: Tue, 28 Jan 2020 15:17:09 +0000
Subject: [PATCH] added scripts that use tensorflow 2.0 for one-shot

---
Review notes (below the "---" marker, so not part of the commit message):
- Variable and command-substitution expansions in the three added scripts
  are double-quoted so that paths containing whitespace or glob characters
  are passed through as single arguments.
- Per-file line counts are unchanged, so the diffstat and hunk headers
  still hold; the "index" blob ids are the ones recorded by the original
  commit and no longer describe the quoted content.

 workflows/one-shot/job-tf2.sh     | 15 +++++++++++++++
 workflows/one-shot/run-nt3-tf2.sh | 24 ++++++++++++++++++++++++
 workflows/one-shot/submit-tf2.sh  | 28 ++++++++++++++++++++++++++++
 3 files changed, 67 insertions(+)
 create mode 100755 workflows/one-shot/job-tf2.sh
 create mode 100755 workflows/one-shot/run-nt3-tf2.sh
 create mode 100755 workflows/one-shot/submit-tf2.sh

diff --git a/workflows/one-shot/job-tf2.sh b/workflows/one-shot/job-tf2.sh
new file mode 100755
index 00000000..d13466ba
--- /dev/null
+++ b/workflows/one-shot/job-tf2.sh
@@ -0,0 +1,15 @@
+#!/bin/bash -l
+set -eu
+
+# JOB SH: job script passed to qsub by submit-tf2.sh; expects THIS in the environment
+
+echo "$( basename "$0" )"
+hostname
+
+source /opt/modules/default/init/bash
+module load modules
+PATH=/opt/cray/elogin/eproxy/2.0.14-4.3/bin:$PATH # For aprun
+module load alps
+
+set -x
+aprun -n 1 -N 1 "$THIS/run-nt3-tf2.sh"
diff --git a/workflows/one-shot/run-nt3-tf2.sh b/workflows/one-shot/run-nt3-tf2.sh
new file mode 100755
index 00000000..e04d8a8a
--- /dev/null
+++ b/workflows/one-shot/run-nt3-tf2.sh
@@ -0,0 +1,24 @@
+#!/bin/bash -l
+# Need -l to reset modules ...
+set -eu
+
+# RUN NT3: run one epoch of the NT3 benchmark with the TensorFlow 2.0 module
+
+echo "$( basename "$0" )"
+hostname
+
+# Modules start
+module unload cray-python/3.6.5.3
+module load datascience/tensorflow-2.0
+# Modules end
+
+which python
+
+# Report original source directory
+echo "THIS=$THIS"
+
+BENCHMARKS=$( readlink --canonicalize "$THIS/../../../Benchmarks" )
+NT3=$BENCHMARKS/Pilot1/NT3/nt3_baseline_keras2.py
+
+set -x
+python "$NT3" --epochs 1
diff --git a/workflows/one-shot/submit-tf2.sh b/workflows/one-shot/submit-tf2.sh
new file mode 100755
index 00000000..eaa64b84
--- /dev/null
+++ b/workflows/one-shot/submit-tf2.sh
@@ -0,0 +1,28 @@
+#!/bin/bash -l
+set -eu
+
+# SUBMIT SH: source settings.sh, then submit job-tf2.sh with qsub
+
+THIS=$( readlink --canonicalize "$( dirname "$0" )" )
+
+DIRECTORY=$THIS
+OUTPUT=$THIS/output.txt
+
+source "$THIS/settings.sh"
+
+if [[ -f "$OUTPUT" ]]
+then
+  mv --backup=numbered "$OUTPUT" "$OUTPUT.bak"
+fi
+
+set -x
+qsub -n "$WORKERS" \
+     -t "$WALLTIME" \
+     -A "$PROJECT" \
+     -q "$QUEUE" \
+     -o "$OUTPUT" \
+     -e "$OUTPUT" \
+     --env THIS="$THIS" \
+     --cwd "$DIRECTORY" \
+     --jobname "$JOBNAME" \
+     "$THIS/job-tf2.sh"