Skip to content
This repository was archived by the owner on Feb 3, 2025. It is now read-only.

Commit c624e14

Browse files
--no_tf32 added to the benchmark code
1 parent 521deb9 commit c624e14

File tree

5 files changed

+16
-39
lines changed

5 files changed

+16
-39
lines changed

tftrt/examples/benchmark_args.py

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -133,6 +133,13 @@ def __init__(self):
133133
"least as large as the number of samples in the dataset."
134134
)
135135

136+
self._add_bool_argument(
137+
name="no_tf32",
138+
default=False,
139+
required=False,
140+
help="If set to True, the benchmark will force not using TF32."
141+
)
142+
136143
self._add_bool_argument(
137144
name="use_xla",
138145
default=False,

tftrt/examples/benchmark_runner.py

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -61,6 +61,10 @@ def __init__(self, args):
6161
print("[Benchmark] - Activating XLA JIT Auto Clustering")
6262
os.environ["TF_XLA_FLAGS"] = "--tf_xla_auto_jit=2 --tf_xla_cpu_global_jit"
6363

64+
if args.no_tf32:
65+
print("[Benchmark] - Deactivating the use of TF32 format")
66+
os.environ["NVIDIA_TF32_OVERRIDE"] = "0"
67+
6468
logging.getLogger("tensorflow").setLevel(logging.INFO)
6569
logging.disable(logging.WARNING)
6670

tftrt/examples/image_classification/base_run_inference.sh

Lines changed: 1 addition & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -8,8 +8,6 @@ DATA_DIR=""
88
MODEL_DIR=""
99

1010
# Default Argument Values
11-
NVIDIA_TF32_OVERRIDE=""
12-
1311
BYPASS_ARGUMENTS=""
1412

1513
# Loop through arguments and process them
@@ -20,10 +18,6 @@ do
2018
MODEL_NAME="${arg#*=}"
2119
shift # Remove --model_name from processing
2220
;;
23-
--no_tf32)
24-
NVIDIA_TF32_OVERRIDE="NVIDIA_TF32_OVERRIDE=0"
25-
shift # Remove --no_tf32 from processing
26-
;;
2721
--data_dir=*)
2822
DATA_DIR="${arg#*=}"
2923
shift # Remove --data_dir= from processing
@@ -100,8 +94,6 @@ echo ""
10094
echo "[*] DATA_DIR: ${DATA_DIR}"
10195
echo "[*] MODEL_DIR: ${MODEL_DIR}"
10296
echo ""
103-
echo "[*] NVIDIA_TF32_OVERRIDE: ${NVIDIA_TF32_OVERRIDE}"
104-
echo ""
10597
# Custom Image Classification Task Flags
10698
echo "[*] INPUT_SIZE: ${INPUT_SIZE}"
10799
echo "[*] PREPROCESS_METHOD: ${PREPROCESS_METHOD}"
@@ -151,10 +143,7 @@ BENCH_DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )" >/dev/null 2>&1 && pwd )"
151143
cd ${BENCH_DIR}
152144

153145
# Execute the example
154-
155-
PREPEND_COMMAND="${NVIDIA_TF32_OVERRIDE}"
156-
157-
COMMAND="${PREPEND_COMMAND} python image_classification.py \
146+
COMMAND="python image_classification.py \
158147
--data_dir ${DATA_DIR} \
159148
--calib_data_dir ${DATA_DIR} \
160149
--input_saved_model_dir ${INPUT_SAVED_MODEL_DIR} \

tftrt/examples/object_detection/base_run_inference.sh

Lines changed: 1 addition & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -8,8 +8,6 @@ DATA_DIR=""
88
MODEL_DIR=""
99

1010
# Default Argument Values
11-
NVIDIA_TF32_OVERRIDE=""
12-
1311
BYPASS_ARGUMENTS=""
1412
BATCH_SIZE=8
1513

@@ -21,10 +19,6 @@ do
2119
MODEL_NAME="${arg#*=}"
2220
shift # Remove --model_name from processing
2321
;;
24-
--no_tf32)
25-
NVIDIA_TF32_OVERRIDE="NVIDIA_TF32_OVERRIDE=0"
26-
shift # Remove --no_tf32 from processing
27-
;;
2822
--batch_size=*)
2923
BATCH_SIZE="${arg#*=}"
3024
shift # Remove --batch_size= from processing
@@ -70,8 +64,6 @@ echo ""
7064
echo "[*] DATA_DIR: ${DATA_DIR}"
7165
echo "[*] MODEL_DIR: ${MODEL_DIR}"
7266
echo ""
73-
echo "[*] NVIDIA_TF32_OVERRIDE: ${NVIDIA_TF32_OVERRIDE}"
74-
echo ""
7567
# Custom Object Detection Task Flags
7668
echo "[*] BATCH_SIZE: ${BATCH_SIZE}"
7769
echo "[*] INPUT_SIZE: ${INPUT_SIZE}"
@@ -142,10 +134,7 @@ if [[ ${DEPENDENCIES_STATUS} != 0 ]]; then
142134
fi
143135

144136
# Step 2: Execute the example
145-
146-
PREPEND_COMMAND="${NVIDIA_TF32_OVERRIDE}"
147-
148-
COMMAND="${PREPEND_COMMAND} python object_detection.py \
137+
COMMAND="python object_detection.py \
149138
--data_dir ${VAL_DATA_DIR} \
150139
--calib_data_dir ${VAL_DATA_DIR} \
151140
--annotation_path ${ANNOTATIONS_DATA_FILE} \

tftrt/examples/transformers/base_run_inference.sh

Lines changed: 3 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -7,14 +7,11 @@ MODEL_NAME=""
77
MODEL_DIR=""
88

99
# Default Argument Values
10-
NVIDIA_TF32_OVERRIDE=""
11-
12-
# TODO: remove when real dataloader is implemented
13-
DATA_DIR="/tmp"
14-
1510
BYPASS_ARGUMENTS=""
1611
BATCH_SIZE=32
1712
SEQ_LEN=128
13+
# TODO: remove when real dataloader is implemented
14+
DATA_DIR="/tmp"
1815

1916
# Loop through arguments and process them
2017
for arg in "$@"
@@ -24,10 +21,6 @@ do
2421
MODEL_NAME="${arg#*=}"
2522
shift # Remove --model_name from processing
2623
;;
27-
--no_tf32)
28-
NVIDIA_TF32_OVERRIDE="NVIDIA_TF32_OVERRIDE=0"
29-
shift # Remove --no_tf32 from processing
30-
;;
3124
--batch_size=*)
3225
BATCH_SIZE="${arg#*=}"
3326
shift # Remove --batch_size= from processing
@@ -90,8 +83,6 @@ echo ""
9083
echo "[*] DATA_DIR: ${DATA_DIR}"
9184
echo "[*] MODEL_DIR: ${MODEL_DIR}"
9285
echo ""
93-
echo "[*] NVIDIA_TF32_OVERRIDE: ${NVIDIA_TF32_OVERRIDE}"
94-
echo ""
9586
# Custom Transformer Task Flags
9687
echo "[*] VOCAB_SIZE: ${VOCAB_SIZE}"
9788
echo "[*] SEQ_LEN: ${SEQ_LEN}"
@@ -142,10 +133,7 @@ BENCH_DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )/" >/dev/null 2>&1 && pwd )"
142133
cd ${BENCH_DIR}
143134

144135
# Execute the example
145-
146-
PREPEND_COMMAND="${NVIDIA_TF32_OVERRIDE}"
147-
148-
COMMAND="${PREPEND_COMMAND} python transformers.py \
136+
COMMAND="python transformers.py \
149137
--data_dir ${DATA_DIR} \
150138
--calib_data_dir ${DATA_DIR} \
151139
--input_saved_model_dir ${INPUT_SAVED_MODEL_DIR} \

0 commit comments

Comments
 (0)