Skip to content

Commit 480eea1

Browse files
authored
Add quantization config for open_llama_3b_v2 (#803)
1 parent 67f9ec1 commit 480eea1

File tree

1 file changed

+1 −0 lines changed

1 file changed

+1
-0
lines changed

optimum/intel/openvino/configuration.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -70,6 +70,7 @@
70 70
"THUDM/chatglm2-6b": {"bits": 4, "sym": True, "group_size": 128, "ratio": 0.72},
71 71
"Qwen/Qwen-7B-Chat": {"bits": 4, "sym": True, "group_size": 128, "ratio": 0.6},
72 72
"openlm-research/open_llama_3b": {"bits": 4, "sym": True, "group_size": 64, "all_layers": True},
73 +
"openlm-research/open_llama_3b_v2": {"bits": 4, "sym": True, "group_size": 64, "all_layers": True},
73 74
"tiiuae/falcon-7b-instruct": {"bits": 4, "sym": True, "group_size": 64, "all_layers": True},
74 75
"psmathur/orca_mini_3b": {
75 76
"bits": 4,

0 commit comments

Comments (0)