Skip to content

Commit eeb1df0

Browse files
OV configurations alignment (#787)
* Align with genai
* Added stable-code-3b
* Change order
* Update configuration.py
1 parent 1d29904 commit eeb1df0

File tree

1 file changed

+35
-6
lines changed

1 file changed

+35
-6
lines changed

optimum/intel/openvino/configuration.py

Lines changed: 35 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -46,18 +46,47 @@
4646
"dataset": "wikitext2",
4747
"awq": True,
4848
},
49-
"meta-llama/Llama-2-7b": {"bits": 4, "sym": True, "group_size": 128, "ratio": 0.7},
49+
"meta-llama/Llama-2-7b": {"bits": 4, "sym": True, "group_size": 128, "ratio": 0.6},
5050
"meta-llama/Llama-2-7b-chat": {"bits": 4, "sym": True, "group_size": 128, "ratio": 0.8},
5151
"meta-llama/Llama-2-13b-chat": {"bits": 4, "sym": True, "group_size": 64, "ratio": 0.8},
52-
"stabilityai/stablelm-3b-4e1t": {"bits": 4, "sym": True, "group_size": 64, "ratio": 0.8},
53-
"stablelm-epoch-3b-preview": {"bits": 4, "sym": True, "group_size": 64, "ratio": 0.8},
54-
"stabilityai/stablelm-zephyr-3b": {"bits": 4, "sym": False, "group_size": 128, "ratio": 1.0},
52+
"stabilityai/stablelm-3b-4e1t": {
53+
"bits": 4,
54+
"sym": True,
55+
"group_size": 64,
56+
"ratio": 0.8,
57+
"dataset": "wikitext2",
58+
"awq": True,
59+
},
60+
"stabilityai/stablelm-zephyr-3b": {
61+
"bits": 4,
62+
"sym": False,
63+
"group_size": 128,
64+
"ratio": 1.0,
65+
"dataset": "wikitext2",
66+
"awq": True,
67+
},
68+
"stabilityai/stable-code-3b": {"bits": 4, "sym": True, "group_size": 64, "ratio": 0.8},
5569
"pansophic/rocket-3B": {"bits": 4, "sym": True, "group_size": 128, "ratio": 0.8},
5670
"THUDM/chatglm2-6b": {"bits": 4, "sym": True, "group_size": 128, "ratio": 0.72},
5771
"Qwen/Qwen-7B-Chat": {"bits": 4, "sym": True, "group_size": 128, "ratio": 0.6},
5872
"openlm-research/open_llama_3b": {"bits": 4, "sym": True, "group_size": 64, "all_layers": True},
59-
"tiiuae/falcon-7b": {"bits": 4, "sym": True, "group_size": 64, "all_layers": True},
60-
"psmathur/orca_mini_3b": {"bits": 4, "sym": True, "group_size": 64, "all_layers": True},
73+
"tiiuae/falcon-7b-instruct": {"bits": 4, "sym": True, "group_size": 64, "all_layers": True},
74+
"psmathur/orca_mini_3b": {
75+
"bits": 4,
76+
"sym": True,
77+
"group_size": 64,
78+
"all_layers": True,
79+
"dataset": "wikitext2",
80+
"awq": True,
81+
},
82+
"bigscience/bloomz-560m": {
83+
"bits": 4,
84+
"sym": True,
85+
"group_size": 64,
86+
"ratio": 0.8,
87+
"dataset": "wikitext2",
88+
"awq": True,
89+
},
6190
"mistralai/Mixtral-8x7B-v0.1": {"bits": 4, "sym": True, "group_size": 128, "ratio": 0.8},
6291
"facebook/opt-2.7b": {"bits": 4, "sym": True, "group_size": 128, "ratio": 0.7},
6392
"togethercomputer/RedPajama-INCITE-Chat-3B-v1": {"bits": 4, "sym": False, "group_size": 128, "ratio": 0.8},

0 commit comments

Comments
 (0)