Skip to content

Commit 88b1b24

Browse files
committed
improve script
1 parent 46bae3f commit 88b1b24

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

benchmarks/run_input_shard.sh

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -4,8 +4,7 @@
4 4

5 5
# Capture timestamp once for consistent filename
6 6
TIMESTAMP=$(date +%s)
7-
OUTPUT_FILE="benchmarks_autotune_${TIMESTAMP}_input_shard_${SHARD}_of_${WORLD_SIZE}.txt"
8-
CSV_OUTPUT_DIR="benchmarks_autotune_${TIMESTAMP}_input_shard_${SHARD}_of_${WORLD_SIZE}_csv"
7+
OUTPUT_DIR="benchmarks_autotune_${TIMESTAMP}_input_shard_${SHARD}_of_${WORLD_SIZE}"
9 8

10 9
KERNEL_NAME_LIST=(
11 10
"rms_norm"
@@ -30,12 +29,13 @@ for KERNEL_NAME in "${KERNEL_NAME_LIST[@]}"; do
30 29
# TIMESTAMP=$(date +%s)
31 30
# OUTPUT_FILE="benchmarks_autotune_${TIMESTAMP}_input_shard_${SHARD}_of_${WORLD_SIZE}.txt"
32 31

33-
mkdir -p ${CSV_OUTPUT_DIR} || true
34-
CUDA_VISIBLE_DEVICES=$((RANK_OFFSET+SHARD-1)) python benchmarks/run.py --input-shard ${SHARD}/${WORLD_SIZE} --kernel ${KERNEL_NAME} --metrics accuracy,tflops,gbps,speedup --csv --output-dir ${CSV_OUTPUT_DIR} >"$OUTPUT_FILE" 2>&1
32+
mkdir -p ${OUTPUT_DIR} || true
33+
OUTPUT_FILE="${OUTPUT_DIR}/${KERNEL_NAME}.log"
34+
CUDA_VISIBLE_DEVICES=$((RANK_OFFSET+SHARD-1)) python benchmarks/run.py --input-shard ${SHARD}/${WORLD_SIZE} --kernel ${KERNEL_NAME} --metrics accuracy,tflops,gbps,speedup --csv --output-dir ${OUTPUT_DIR} >"${OUTPUT_FILE}" 2>&1
35 35

36 36
exit_code=$?
37 37
# Check for success: exit code 0 AND no exception message in output
38-
if [ $exit_code -eq 0 ] && ! grep -q "Caught exception, terminating early with partial results" "$OUTPUT_FILE"; then
38+
if [ $exit_code -eq 0 ] && ! grep -q "Caught exception, terminating early with partial results" "${OUTPUT_FILE}"; then
39 39
echo "Success! Benchmark completed for shard ${SHARD}/${WORLD_SIZE}"
40 40
break
41 41
else

0 commit comments

Comments
 (0)