This repository was archived by the owner on Feb 3, 2025. It is now read-only.
5 files changed: 16 additions (+16) and 39 deletions (-39).
@@ -133,6 +133,13 @@ def __init__(self):
133133 "least as large as the number of samples in the dataset."
134134 )
135135
136+ self ._add_bool_argument (
137+ name = "no_tf32" ,
138+ default = False ,
139+ required = False ,
140+ help = "If set to True, the benchmark will force not using TF32."
141+ )
142+
136143 self ._add_bool_argument (
137144 name = "use_xla" ,
138145 default = False ,
Original file line number Diff line number Diff line change @@ -61,6 +61,10 @@ def __init__(self, args):
6161 print ("[Benchmark] - Activating XLA JIT Auto Clustering" )
6262 os .environ ["TF_XLA_FLAGS" ] = "--tf_xla_auto_jit=2 --tf_xla_cpu_global_jit"
6363
64+ if args .no_tf32 :
65+ print ("[Benchmark] - Deactivating the use of TF32 format" )
66+ os .environ ["NVIDIA_TF32_OVERRIDE" ] = "0"
67+
6468 logging .getLogger ("tensorflow" ).setLevel (logging .INFO )
6569 logging .disable (logging .WARNING )
6670
Original file line number Diff line number Diff line change @@ -8,8 +8,6 @@ DATA_DIR=""
88MODEL_DIR=" "
99
1010# Default Argument Values
11- NVIDIA_TF32_OVERRIDE=" "
12-
1311BYPASS_ARGUMENTS=" "
1412
1513# Loop through arguments and process them
2018 MODEL_NAME=" ${arg#* =} "
2119 shift # Remove --model_name from processing
2220 ;;
23- --no_tf32)
24- NVIDIA_TF32_OVERRIDE=" NVIDIA_TF32_OVERRIDE=0"
25- shift # Remove --no_tf32 from processing
26- ;;
2721 --data_dir=* )
2822 DATA_DIR=" ${arg#* =} "
2923 shift # Remove --data_dir= from processing
@@ -100,8 +94,6 @@ echo ""
10094echo " [*] DATA_DIR: ${DATA_DIR} "
10195echo " [*] MODEL_DIR: ${MODEL_DIR} "
10296echo " "
103- echo " [*] NVIDIA_TF32_OVERRIDE: ${NVIDIA_TF32_OVERRIDE} "
104- echo " "
10597# Custom Image Classification Task Flags
10698echo " [*] INPUT_SIZE: ${INPUT_SIZE} "
10799echo " [*] PREPROCESS_METHOD: ${PREPROCESS_METHOD} "
@@ -151,10 +143,7 @@ BENCH_DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )" >/dev/null 2>&1 && pwd )"
151143cd ${BENCH_DIR}
152144
153145# Execute the example
154-
155- PREPEND_COMMAND=" ${NVIDIA_TF32_OVERRIDE} "
156-
157- COMMAND=" ${PREPEND_COMMAND} python image_classification.py \
146+ COMMAND=" python image_classification.py \
158147 --data_dir ${DATA_DIR} \
159148 --calib_data_dir ${DATA_DIR} \
160149 --input_saved_model_dir ${INPUT_SAVED_MODEL_DIR} \
Original file line number Diff line number Diff line change @@ -8,8 +8,6 @@ DATA_DIR=""
88MODEL_DIR=" "
99
1010# Default Argument Values
11- NVIDIA_TF32_OVERRIDE=" "
12-
1311BYPASS_ARGUMENTS=" "
1412BATCH_SIZE=8
1513
2119 MODEL_NAME=" ${arg#* =} "
2220 shift # Remove --model_name from processing
2321 ;;
24- --no_tf32)
25- NVIDIA_TF32_OVERRIDE=" NVIDIA_TF32_OVERRIDE=0"
26- shift # Remove --no_tf32 from processing
27- ;;
2822 --batch_size=* )
2923 BATCH_SIZE=" ${arg#* =} "
3024 shift # Remove --batch_size= from processing
@@ -70,8 +64,6 @@ echo ""
7064echo " [*] DATA_DIR: ${DATA_DIR} "
7165echo " [*] MODEL_DIR: ${MODEL_DIR} "
7266echo " "
73- echo " [*] NVIDIA_TF32_OVERRIDE: ${NVIDIA_TF32_OVERRIDE} "
74- echo " "
7567# Custom Object Detection Task Flags
7668echo " [*] BATCH_SIZE: ${BATCH_SIZE} "
7769echo " [*] INPUT_SIZE: ${INPUT_SIZE} "
@@ -142,10 +134,7 @@ if [[ ${DEPENDENCIES_STATUS} != 0 ]]; then
142134fi
143135
144136# Step 2: Execute the example
145-
146- PREPEND_COMMAND=" ${NVIDIA_TF32_OVERRIDE} "
147-
148- COMMAND=" ${PREPEND_COMMAND} python object_detection.py \
137+ COMMAND=" python object_detection.py \
149138 --data_dir ${VAL_DATA_DIR} \
150139 --calib_data_dir ${VAL_DATA_DIR} \
151140 --annotation_path ${ANNOTATIONS_DATA_FILE} \
Original file line number Diff line number Diff line change @@ -7,14 +7,11 @@ MODEL_NAME=""
77MODEL_DIR=" "
88
99# Default Argument Values
10- NVIDIA_TF32_OVERRIDE=" "
11-
12- # TODO: remove when real dataloader is implemented
13- DATA_DIR=" /tmp"
14-
1510BYPASS_ARGUMENTS=" "
1611BATCH_SIZE=32
1712SEQ_LEN=128
13+ # TODO: remove when real dataloader is implemented
14+ DATA_DIR=" /tmp"
1815
1916# Loop through arguments and process them
2017for arg in " $@ "
2421 MODEL_NAME=" ${arg#* =} "
2522 shift # Remove --model_name from processing
2623 ;;
27- --no_tf32)
28- NVIDIA_TF32_OVERRIDE=" NVIDIA_TF32_OVERRIDE=0"
29- shift # Remove --no_tf32 from processing
30- ;;
3124 --batch_size=* )
3225 BATCH_SIZE=" ${arg#* =} "
3326 shift # Remove --batch_size= from processing
@@ -90,8 +83,6 @@ echo ""
9083echo " [*] DATA_DIR: ${DATA_DIR} "
9184echo " [*] MODEL_DIR: ${MODEL_DIR} "
9285echo " "
93- echo " [*] NVIDIA_TF32_OVERRIDE: ${NVIDIA_TF32_OVERRIDE} "
94- echo " "
9586# Custom Transformer Task Flags
9687echo " [*] VOCAB_SIZE: ${VOCAB_SIZE} "
9788echo " [*] SEQ_LEN: ${SEQ_LEN} "
@@ -142,10 +133,7 @@ BENCH_DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )/" >/dev/null 2>&1 && pwd )"
142133cd ${BENCH_DIR}
143134
144135# Execute the example
145-
146- PREPEND_COMMAND=" ${NVIDIA_TF32_OVERRIDE} "
147-
148- COMMAND=" ${PREPEND_COMMAND} python transformers.py \
136+ COMMAND=" python transformers.py \
149137 --data_dir ${DATA_DIR} \
150138 --calib_data_dir ${DATA_DIR} \
151139 --input_saved_model_dir ${INPUT_SAVED_MODEL_DIR} \
You can’t perform that action at this time.
0 commit comments