Skip to content

Commit b447976

Browse files
committed
use --latency-measure-mode inductor_benchmarker
1 parent 182ce0b commit b447976

File tree

1 file changed: +1 -1 lines changed

1 file changed: +1 -1 lines changed

benchmarks/run_input_shard.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -31,7 +31,7 @@ for KERNEL_NAME in "${KERNEL_NAME_LIST[@]}"; do
31 31 |
32 32 |   mkdir -p ${OUTPUT_DIR} || true
33 33 |   OUTPUT_FILE="${OUTPUT_DIR}/${KERNEL_NAME}.log"
34    | - CUDA_VISIBLE_DEVICES=$((RANK_OFFSET+SHARD-1)) python benchmarks/run.py --input-shard ${SHARD}/${WORLD_SIZE} --kernel ${KERNEL_NAME} --metrics accuracy,tflops,gbps,speedup --csv --output-dir ${OUTPUT_DIR} >"${OUTPUT_FILE}" 2>&1
   34 | + CUDA_VISIBLE_DEVICES=$((RANK_OFFSET+SHARD-1)) python benchmarks/run.py --input-shard ${SHARD}/${WORLD_SIZE} --kernel ${KERNEL_NAME} --metrics accuracy,tflops,gbps,speedup --latency-measure-mode inductor_benchmarker --csv --output-dir ${OUTPUT_DIR} >"${OUTPUT_FILE}" 2>&1
35 35 |
36 36 |   exit_code=$?
37 37 |   # Check for success: exit code 0 AND no exception message in output

0 commit comments

Comments (0)