We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 1ac0566 commit 5e272eeCopy full SHA for 5e272ee
tests/unittest/attention/test_gpt_attention.py
@@ -754,7 +754,9 @@ def _construct_execution(
754
precision=dtype,
755
int8=int8_trt_flag,
756
quant_mode=quant_mode)
757
-
+ # Reduce the TRT engine build time by setting the max allowed number of tactics in builder tactic profiling.
758
+ if builder_config.trt_builder_config.max_num_tactics == -1:
759
+ builder_config.trt_builder_config.max_num_tactics = 30
760
if session is None:
761
engine = builder.build_engine(net, builder_config)
762
session = tensorrt_llm.runtime.Session.from_serialized_engine(
0 commit comments