We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 69bb9d6, commit 9cacd66 (Copy full SHA for 9cacd66)
exllamav2/model.py
@@ -954,7 +954,7 @@ def forward_chunk(
954
seq_len <= self.config.max_output_len, \
955
"seq_len exceeds max_output_len"
956
957
- if self.config.arch.lm.mrope and "indexed_embeddings" in kwargs:
+ if self.config.arch.lm.mrope and kwargs.get("indexed_embeddings"):
958
assert attn_params is not None and (
959
attn_params.rope_offsets is not None or
960
attn_params.get_alt_rope_embed("cpu") is not None
0 commit comments