Skip to content

Commit 7faf6b2

Browse files
authored
forward fix
Differential Revision: D80281988. Pull Request resolved: #13429.
1 parent 00dedb3 commit 7faf6b2

File tree

1 file changed

+3
-0
lines changed

1 file changed

+3
-0
lines changed

examples/models/llama/model_args.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -66,6 +66,9 @@ class ModelArgs:
66 66
target_modules: Optional[list] = None
67 67
peft_type: Optional[str] = None # PEFT type.
68 68
base_model_name_or_path: Optional[str] = None # Base model name or path.
69+
kv_io_bit_width: Optional[int] = (
70+
None # KV cache bit width. This is for QNN backend only for now.
71+
)
69 72

70 73
def __post_init__(self):
71 74
if self.n_kv_heads is None:

0 commit comments

Comments
 (0)