We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 3ef13a3 commit ddd2386 Copy full SHA for ddd2386
docs/source/llm/export-llm.md
@@ -114,7 +114,7 @@ base:
114
metadata: '{"get_bos_id":128000, "get_eos_ids":[128009, 128001]}'
115
model:
116
use_kv_cache: True
117
- use_sdpa_withp_kv_cache: True
+ use_sdpa_with_kv_cache: True
118
quantization:
119
embedding_quantize: 4,32
120
qmode: 8da4w
@@ -144,7 +144,7 @@ base:
144
145
146
147
148
149
150
0 commit comments