|
| 1 | +#!/usr/bin/env bash |
| 2 | +# Script for a correct pinning w/ regard to hardware threads shared by a process |
| 3 | +# using SLURM variables. Also needs an additional HWT multiplicity set in the |
| 4 | +# environment. |
| 5 | +# To share two hardware threads of each core for a process: |
| 6 | +# ... |
| 7 | +# export HWT=2 |
| 8 | +# export PIN=`correct_pinning.sh` |
| 9 | +# ... |
| 10 | +# srun $PIN ... |
| 11 | +# ... |
| 12 | + |
# Verbose switch: set VERBOSE=true (1, yes and on are accepted as well) to get
# a report of the hardware and job settings in addition to the binding option.
# Caution: whenever that report reaches stdout it ends up inside $PIN and
# breaks the srun call. In that case keep only the binding option:
#   export PIN=`correct_pinning.sh | grep cpu_bind`
#
# ECHO is normalised to the literal words "true" / "false": the rest of the
# script relies on it being exactly one of the two, and an arbitrary value
# (e.g. VERBOSE=yes) must never be passed on.
case "${VERBOSE:-false}" in
  true | 1 | yes | on) ECHO=true ;;
  *) ECHO=false ;;
esac

# Run for the JURECA cluster or the booster?
# JUWELS should be covered anyway.
# Any partition whose name contains "booster" selects the booster layout;
# everything else (including an unset partition) uses the cluster layout.
MCA="CLS"
[[ ${SLURM_JOB_PARTITION:-} == *booster* ]] && MCA="BOO"
| 23 | + |
#######################################
# Report the hardware layout and the job geometry when verbose output is
# enabled; do nothing otherwise.
# Globals (read only):
#   ECHO                   report is printed only if this is the word "true"
#   PHYS_CORES_NODE, SOCKETS, PHYS_CORES_CPU, SMT
#   SLURM_CPUS_ON_NODE, SLURM_NTASKS_PER_NODE, SLURM_CPUS_PER_TASK, HWT
# Outputs:
#   The report on stderr. stdout is left untouched so that the output of the
#   script can be captured and handed to srun without filtering.
# Returns:
#   0 always.
#######################################
print_config() {
  # Compare the flag as a string; never execute its value as a command.
  [[ ${ECHO:-false} == true ]] || return 0

  {
    printf '\nHARDWARE CONFIG:\n'
    printf 'cores per node: %s\n' "${PHYS_CORES_NODE:-}"
    printf 'CPUs per node: %s\n' "${SOCKETS:-}"
    printf 'cores per CPU: %s\n' "${PHYS_CORES_CPU:-}"
    printf 'hardware threads per core: %s\n' "${SMT:-}"
    printf 'hardware threads per node: %s\n' "${SLURM_CPUS_ON_NODE:-}"
    printf '\nJOB CONFIG:\n'
    printf 'tasks per node: %s\n' "${SLURM_NTASKS_PER_NODE:-}"
    printf 'hardware threads per task: %s\n' "${SLURM_CPUS_PER_TASK:-}"
    printf 'shared hardware threads per process: %s\n' "${HWT:-}"
  } >&2
  return 0
}
| 36 | + |
#######################################
# Build the srun CPU binding option for a cluster node (2 sockets, 2 hardware
# threads per core).
#
# Tasks are laid out one after another: every task receives
# SLURM_CPUS_PER_TASK / HWT consecutive physical cores and, on each of them,
# HWT hardware threads. The hardware threads of core c are taken to be the
# logical CPUs c, c + PHYS_CORES_NODE, ... (the numbering this script has
# always assumed; NOTE(review): confirm against the node topology).
#
# Globals read:
#   ECHO                   "true" enables progress messages on stderr
#   HWT                    hardware threads to use per core (1..SMT)
#   SLURM_CPUS_ON_NODE     hardware threads per node
#   SLURM_CPUS_PER_TASK    hardware threads per task, multiple of HWT
#   SLURM_NTASKS_PER_NODE  tasks per node; treated as 1 when unset
# Globals written:
#   SOCKETS, SMT, PHYS_CORES_NODE, PHYS_CORES_CPU (read by print_config)
# Outputs:
#   stdout: a single line "--cpu_bind=mask_cpu:0x<mask>,0x<mask>,..."
#   stderr: error messages and, in verbose mode, the per-task CPU lists
# Exits:
#   1 if an input is missing or not a positive integer, if HWT exceeds the
#   hardware threads per core, or if SLURM_CPUS_PER_TASK is not a multiple
#   of HWT.
#######################################
pin_cluster() {
  local verbose=false
  [[ ${ECHO:-false} == true ]] && verbose=true

  # Validate before any arithmetic: an empty or non-numeric value would
  # otherwise abort with a cryptic arithmetic syntax error.
  local -r uint_re='^[1-9][0-9]*$'
  local var
  for var in SLURM_CPUS_ON_NODE SLURM_CPUS_PER_TASK HWT; do
    if [[ ! ${!var:-} =~ $uint_re ]]; then
      printf 'correct_pinning: %s must be a positive integer (got "%s")\n' \
        "$var" "${!var:-}" >&2
      exit 1
    fi
  done
  local -r tasks=${SLURM_NTASKS_PER_NODE:-1}
  if [[ ! $tasks =~ $uint_re ]]; then
    printf 'correct_pinning: %s must be a positive integer (got "%s")\n' \
      'SLURM_NTASKS_PER_NODE' "$tasks" >&2
    exit 1
  fi

  SOCKETS=2
  SMT=2
  PHYS_CORES_NODE=$((SLURM_CPUS_ON_NODE / SMT))
  PHYS_CORES_CPU=$((PHYS_CORES_NODE / SOCKETS))

  print_config

  if ((HWT > SMT)); then
    printf 'correct_pinning: HWT=%s exceeds the %s hardware threads per core\n' \
      "$HWT" "$SMT" >&2
    exit 1
  fi
  # Exit straight away if the threads cannot be distributed evenly.
  if ((SLURM_CPUS_PER_TASK % HWT != 0)); then
    printf 'No nice distribution of threads possible\n' >&2
    exit 1
  fi

  local -r cores_per_task=$((SLURM_CPUS_PER_TASK / HWT))
  local -a nibbles=()
  local next_core=0 mask_csv=""
  local task core thread cpu cpu_csv idx top hex digit

  # One mask per task on the node.
  for ((task = 1; task <= tasks; task++)); do
    [[ $verbose == true ]] && printf 'process %s\n' "$task" >&2
    cpu_csv=""
    nibbles=()
    top=0
    for ((core = 0; core < cores_per_task; core++)); do
      cpu=$next_core
      for ((thread = 0; thread < HWT; thread++)); do
        cpu_csv+="${cpu_csv:+,}${cpu}"
        # The mask is kept as 4-bit groups so that it may be wider than a
        # 64-bit shell integer (nodes with more than 64 logical CPUs).
        idx=$((cpu / 4))
        nibbles[idx]=$((${nibbles[idx]:-0} | (1 << (cpu % 4))))
        ((idx > top)) && top=$idx
        # Next hardware thread of the same physical core.
        cpu=$((cpu + PHYS_CORES_NODE))
      done
      next_core=$((next_core + 1))
    done

    # Most significant group first; upper-case hex digits, no leading zeros.
    hex=""
    for ((idx = top; idx >= 0; idx--)); do
      printf -v digit '%X' "${nibbles[idx]:-0}"
      hex+=$digit
    done
    [[ $verbose == true ]] \
      && printf 'map for process %s: %s\n' "$task" "$cpu_csv" >&2
    mask_csv+="${mask_csv:+,}0x${hex}"
  done

  printf '%s\n' "--cpu_bind=mask_cpu:${mask_csv}"
}
| 77 | + |
#######################################
# Build the srun CPU binding option for a booster node (1 socket, 4 hardware
# threads per core).
#
# Tasks are laid out one after another: every task receives
# SLURM_CPUS_PER_TASK / HWT physical cores and, on each of them, HWT hardware
# threads. The hardware threads of core c are taken to be the logical CPUs
# c, c + PHYS_CORES_CPU, ... (the numbering this script has always assumed;
# NOTE(review): confirm against the node topology).
#
# Globals read:
#   ECHO                   "true" enables progress messages on stderr
#   HWT                    hardware threads to use per core (1..SMT)
#   SLURM_CPUS_ON_NODE     hardware threads per node
#   SLURM_CPUS_PER_TASK    hardware threads per task, multiple of HWT
#   SLURM_NTASKS_PER_NODE  tasks per node; treated as 1 when unset
# Globals written:
#   SOCKETS, SMT, PHYS_CORES_NODE, PHYS_CORES_CPU (read by print_config)
# Outputs:
#   stdout: a single line "--cpu_bind=mask_cpu:0x<mask>,0x<mask>,..."
#   stderr: error messages and, in verbose mode, the per-task CPU lists
# Exits:
#   1 if an input is missing or not a positive integer, if HWT exceeds the
#   hardware threads per core, or if SLURM_CPUS_PER_TASK is not a multiple
#   of HWT.
#######################################
pin_booster() {
  local verbose=false
  [[ ${ECHO:-false} == true ]] && verbose=true

  # Validate before any arithmetic: an empty or non-numeric value would
  # otherwise abort with a cryptic arithmetic syntax error.
  local -r uint_re='^[1-9][0-9]*$'
  local var
  for var in SLURM_CPUS_ON_NODE SLURM_CPUS_PER_TASK HWT; do
    if [[ ! ${!var:-} =~ $uint_re ]]; then
      printf 'correct_pinning: %s must be a positive integer (got "%s")\n' \
        "$var" "${!var:-}" >&2
      exit 1
    fi
  done
  local -r tasks=${SLURM_NTASKS_PER_NODE:-1}
  if [[ ! $tasks =~ $uint_re ]]; then
    printf 'correct_pinning: %s must be a positive integer (got "%s")\n' \
      'SLURM_NTASKS_PER_NODE' "$tasks" >&2
    exit 1
  fi

  SOCKETS=1
  SMT=4
  PHYS_CORES_NODE=$((SLURM_CPUS_ON_NODE / SMT))
  PHYS_CORES_CPU=$((PHYS_CORES_NODE / SOCKETS))

  print_config

  if ((HWT > SMT)); then
    printf 'correct_pinning: HWT=%s exceeds the %s hardware threads per core\n' \
      "$HWT" "$SMT" >&2
    exit 1
  fi
  # Exit straight away if the threads cannot be distributed evenly.
  if ((SLURM_CPUS_PER_TASK % HWT != 0)); then
    printf 'No nice distribution of threads possible\n' >&2
    exit 1
  fi

  local -r cores_per_task=$((SLURM_CPUS_PER_TASK / HWT))
  local -a nibbles=()
  local next_core=0 mask_csv=""
  local task core thread cpu cpu_csv idx top hex digit

  # One mask per task on the node.
  for ((task = 1; task <= tasks; task++)); do
    [[ $verbose == true ]] && printf 'process %s\n' "$task" >&2
    cpu_csv=""
    nibbles=()
    top=0
    for ((core = 0; core < cores_per_task; core++)); do
      cpu=$next_core
      for ((thread = 0; thread < HWT; thread++)); do
        cpu_csv+="${cpu_csv:+,}${cpu}"
        # The mask is kept as 4-bit groups so that it may be wider than a
        # 64-bit shell integer (nodes with more than 64 logical CPUs).
        idx=$((cpu / 4))
        nibbles[idx]=$((${nibbles[idx]:-0} | (1 << (cpu % 4))))
        ((idx > top)) && top=$idx
        # Next hardware thread of the same physical core.
        cpu=$((cpu + PHYS_CORES_CPU))
      done
      next_core=$((next_core + 1))
      # With two threads per core, the CPU ids PHYS_CORES_CPU ..
      # 2*PHYS_CORES_CPU-1 have already been handed out as second threads of
      # the first pass; jump over them so the second pass pairs the third and
      # fourth hardware threads instead.
      if ((next_core == PHYS_CORES_CPU && HWT == 2)); then
        next_core=$((next_core + PHYS_CORES_CPU))
      fi
    done

    # Most significant group first; upper-case hex digits, no leading zeros.
    hex=""
    for ((idx = top; idx >= 0; idx--)); do
      printf -v digit '%X' "${nibbles[idx]:-0}"
      hex+=$digit
    done
    [[ $verbose == true ]] \
      && printf 'map for process %s: %s\n' "$task" "$cpu_csv" >&2
    mask_csv+="${mask_csv:+,}0x${hex}"
  done

  printf '%s\n' "--cpu_bind=mask_cpu:${mask_csv}"
}
| 122 | + |
# Generate the binding option for the detected machine type. MCA is set near
# the top of the script to either "CLS" (cluster) or "BOO" (booster); any
# other value produces no output.
case "$MCA" in
  CLS)
    pin_cluster
    ;;
  BOO)
    pin_booster
    ;;
esac

exit 0
0 commit comments