You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
"disable_tf32": disable_tf32, # Force FP32 layers to use traditional as FP32 format vs the default behavior of rounding the inputs to 10-bit mantissas before multiplying, but accumulates the sum using 23-bit mantissas
310
-
"sparse_weights": sparse_weights, #Enable sparsity for convolution and fully connected layers.
"strict_types": strict_types, # kernels should strictly run in operating precision
315
-
"capability": capability, # Restrict kernel selection to safe gpu kernels or safe dla kernels
316
-
"num_min_timing_iters": num_min_timing_iters, # Number of minimization timing iterations used to select kernels
317
-
"num_avg_timing_iters": num_avg_timing_iters, # Number of averaging timing iterations used to select kernels
318
-
"workspace_size": workspace_size, # Maximum size of workspace given to TensorRT
319
-
"max_batch_size": max_batch_size, # Maximum batch size (must be >= 1 to be set, 0 means not set)
309
+
"disable_tf32":
310
+
disable_tf32, # Force FP32 layers to use the traditional FP32 format instead of the default TF32 behavior, which rounds the inputs to 10-bit mantissas before multiplying but accumulates the sum using 23-bit mantissas
311
+
"sparse_weights": sparse_weights, #Enable sparsity for convolution and fully connected layers.
0 commit comments