We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 00dedb3 · commit 7faf6b2 (Copy full SHA for 7faf6b2)
examples/models/llama/model_args.py
@@ -66,6 +66,9 @@ class ModelArgs:
66
target_modules: Optional[list] = None
67
peft_type: Optional[str] = None # PEFT type.
68
base_model_name_or_path: Optional[str] = None # Base model name or path.
69
+ kv_io_bit_width: Optional[int] = (
70
+ None # KV cache bit width. This is for QNN backend only for now.
71
+ )
72
73
def __post_init__(self):
74
if self.n_kv_heads is None:
0 commit comments