Skip to content

Commit c9629e8

Browse files
authored
1) Updated compression config for tiiuae/falcon-7b-instruct. (#903)
2) Added compression configs for Llama-3-8B and Llama-3-8B-Instruct.
1 parent b760a1d commit c9629e8

File tree

1 file changed

+17
-1
lines changed

1 file changed

+17
-1
lines changed

optimum/intel/openvino/configuration.py

Lines changed: 17 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -92,7 +92,7 @@ class OVQuantizationMethod(str, Enum):
9292
"dataset": "wikitext2",
9393
"quant_method": OVQuantizationMethod.AWQ,
9494
},
95-
"tiiuae/falcon-7b-instruct": {"bits": 4, "sym": True, "group_size": 64, "all_layers": True},
95+
"tiiuae/falcon-7b-instruct": {"bits": 4, "sym": False, "group_size": 64},
9696
"psmathur/orca_mini_3b": {
9797
"bits": 4,
9898
"sym": True,
@@ -164,6 +164,22 @@ class OVQuantizationMethod(str, Enum):
164164
"dataset": "wikitext2",
165165
"scale_estimation": True,
166166
},
167+
"meta-llama/Meta-Llama-3-8B-Instruct": {
168+
"bits": 4,
169+
"sym": False,
170+
"group_size": 64,
171+
"ratio": 0.9,
172+
"dataset": "wikitext2",
173+
"scale_estimation": True,
174+
},
175+
"meta-llama/Meta-Llama-3-8B": {
176+
"bits": 4,
177+
"sym": False,
178+
"group_size": 64,
179+
"ratio": 0.9,
180+
"dataset": "wikitext2",
181+
"scale_estimation": True,
182+
},
167183
}
168184

169185
_DEFAULT_4BIT_CONFIG = {

0 commit comments

Comments
 (0)