We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 2ce535f, commit 743ae21 (Copy full SHA for 743ae21)
deepseek/engine-deepseek-r1-distill-qwen-14b/config.yaml
@@ -38,7 +38,7 @@ trt_llm:
38
tensor_parallel_count: 1
39
plugin_configuration:
40
use_paged_context_fmha: true
41
- use_fp8_context_fmha: true
+ use_fp8_context_fmha: false
42
paged_kv_cache: true
43
runtime:
44
batch_scheduler_policy: max_utilization
deepseek/engine-deepseek-r1-distill-qwen-32b/config.yaml
0 commit comments