-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathgetAllJobIDs.sh
More file actions
executable file
·77 lines (61 loc) · 2.49 KB
/
getAllJobIDs.sh
File metadata and controls
executable file
·77 lines (61 loc) · 2.49 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
#!/bin/bash
# getAllJobIDs.sh — reconstruct the full grid job ID of every job run by a
# project.py submission.
#
# Usage: getAllJobIDs.sh <project.py output directory>
#
# Reads <dir>/jobids.list (entries look like "14044890.0@fifebatch2.fnal.gov")
# and, for each cluster listed there, enumerates the <cluster>_<process>
# folders project.py creates in <dir> to recover every process ID.
# Writes one full job ID per line to ./jobids.txt (any stale copy is removed).

set -u  # error on unset variables; helps catch typos in var names

# Exactly one argument (the project.py output directory) is required.
if [ -z "${1:-}" ]
then
    echo "$0: No argument passed. Exiting!" >&2
    exit 1
fi
if [ -n "${2:-}" ]
then
    echo "$0: Too many arguments passed. The script takes a single directory as an argument. Exiting!" >&2
    exit 1
fi
OUTPUTDIR="$1"

# This script produces jobids.txt; delete any pre-existing copy so we append
# into a fresh file.
if [ -f jobids.txt ]
then
    echo "$0: jobids.txt already exists. Deleting!"
    rm -- jobids.txt
fi
# Same for jobfolders.txt (only written by the commented-out line below, but
# kept for parity with the original behavior).
if [ -f jobfolders.txt ]
then
    echo "$0: jobfolders.txt already exists. Deleting!"
    rm -- jobfolders.txt
fi

# project.py records the submitted job id(s) in jobids.list.
if [ ! -f "$OUTPUTDIR/jobids.list" ]
then
    echo "$0: no jobids.list found in $OUTPUTDIR" >&2
    echo "Exiting!" >&2
    exit 1
fi

# NOTE (12/16): jobids.list can hold MORE than one entry — a makeup
# resubmission adds its own 0th job — so loop over every id in the file.
# Read line-by-line instead of word-splitting `cat` output so ids can never
# be mangled by IFS or glob expansion; the `|| [ -n ... ]` clause also
# handles a file with no trailing newline.
while IFS= read -r FIRSTJOBID || [ -n "$FIRSTJOBID" ]
do
    [ -n "$FIRSTJOBID" ] || continue   # skip blank lines
    # Example id: 14044890.0@fifebatch2.fnal.gov
    # Cluster ID  = everything before the first '.'
    # Batch addr  = everything after the '@'
    # Parameter expansion avoids the unquoted array-splitting of the
    # original, which was subject to glob expansion.
    CLUSTERID=${FIRSTJOBID%%.*}
    BATCHADDRESS=${FIRSTJOBID#*@}
    # Unless project.py changes, the output directory contains one folder per
    # job named <cluster>_<process>. Glob directly rather than parsing `ls`
    # output (safe for unusual filenames).
    for PATH_CLUSTER_PROCESS in "$OUTPUTDIR/${CLUSTERID}"_*
    do
        [ -e "$PATH_CLUSTER_PROCESS" ] || continue   # glob matched nothing
        # Folder name only, e.g. "14044890_3".
        CLUSTER_PROCESS=$(basename -- "$PATH_CLUSTER_PROCESS")
        # Process ID is the part after the '_'.
        PROCESSID=${CLUSTER_PROCESS#*_}
        JOBID="$CLUSTERID.$PROCESSID@$BATCHADDRESS"
        echo "$JOBID" >> jobids.txt
        #echo "${OUTPUTDIR}/${CLUSTERID}_${PROCESSID}" >> jobfolders.txt
    done
done < "$OUTPUTDIR/jobids.list"