Skip to content

Commit d4bd848

Browse files
Update default int4 config for llama-2-7b-chat-hf (#1216)
* Update default int4 config for llama-2-7b-chat-hf
* Update configuration.py
1 parent 8fa4ebd commit d4bd848

File tree

1 file changed

+9
-1
lines changed

1 file changed

+9
-1
lines changed

optimum/intel/openvino/configuration.py

Lines changed: 9 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -67,7 +67,15 @@ class OVQuantizationMethod(str, Enum):
6767
"quant_method": OVQuantizationMethod.AWQ,
6868
},
6969
"meta-llama/Llama-2-7b-hf": {"bits": 4, "sym": True, "group_size": 128, "ratio": 0.6},
70-
"meta-llama/Llama-2-7b-chat-hf": {"bits": 4, "sym": True, "group_size": 128, "ratio": 0.8},
70+
"meta-llama/Llama-2-7b-chat-hf": {
71+
"bits": 4,
72+
"sym": True,
73+
"group_size": 128,
74+
"ratio": 1.0,
75+
"dataset": "wikitext2",
76+
"quant_method": OVQuantizationMethod.AWQ,
77+
"scale_estimation": True,
78+
},
7179
"meta-llama/Llama-2-13b-chat-hf": {"bits": 4, "sym": True, "group_size": 64, "ratio": 0.8},
7280
"stabilityai/stablelm-3b-4e1t": {
7381
"bits": 4,

0 commit comments

Comments
 (0)