We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent e224184, commit a328124 (Copy full SHA for a328124)
tests/unittest/_torch/modules/test_mla_helix.py
@@ -80,7 +80,7 @@ class Scenario:
80
rope_original_max_position_embeddings: int = 4096
81
rope_type: str = "yarn"
82
model_type: str = "deepseek_v3"
83
- kv_cache_tokens_per_block: int = 64
+ kv_cache_tokens_per_block: int = 32
84
# TODO only 1 is supported for now here
85
predicted_tokens_per_seq: int = 1
86
bias: bool = False
0 commit comments