From 7ba906b7893ad94e03e75ffce7fd75e92723875c Mon Sep 17 00:00:00 2001 From: Nikolay Date: Thu, 30 Oct 2025 18:24:02 +0100 Subject: [PATCH 1/2] common params attempt #1 --- optimum/intel/openvino/configuration.py | 50 ++++++++++++++++++++----- 1 file changed, 40 insertions(+), 10 deletions(-) diff --git a/optimum/intel/openvino/configuration.py b/optimum/intel/openvino/configuration.py index 1bff6d2822..cd91bd3b55 100644 --- a/optimum/intel/openvino/configuration.py +++ b/optimum/intel/openvino/configuration.py @@ -100,7 +100,7 @@ class OVQuantizationMethod(str, Enum): "Qwen/Qwen-7B-Chat": {"bits": 4, "sym": True, "group_size": 128, "ratio": 0.6}, "Qwen/Qwen2.5-1.5B-Instruct": { "bits": 4, - "sym": False, + "sym": True, "group_size": 128, "ratio": 0.9, "dataset": "wikitext2", @@ -140,7 +140,7 @@ class OVQuantizationMethod(str, Enum): }, "Qwen/Qwen3-8B": { "bits": 4, - "sym": False, + "sym": True, "group_size": 128, "ratio": 1.0, "dataset": "wikitext2", @@ -233,8 +233,8 @@ class OVQuantizationMethod(str, Enum): }, "meta-llama/Meta-Llama-3.1-8B-Instruct": { "bits": 4, - "sym": False, - "group_size": 64, + "sym": True, + "group_size": 128, "ratio": 0.8, "quant_method": OVQuantizationMethod.AWQ, }, @@ -262,11 +262,42 @@ class OVQuantizationMethod(str, Enum): }, "microsoft/Phi-3.5-mini-instruct": { "bits": 4, - "sym": False, - "group_size": 64, + "sym": True, + "group_size": 128, "ratio": 1.0, "quant_method": OVQuantizationMethod.AWQ, }, + "microsoft/Phi-4-reasoning": { + "bits": 4, + "sym": True, + "group_size": 128, + "ratio": 1.0, + "quant_method": OVQuantizationMethod.AWQ, + }, + "google/gemma-3-4b-it": { + "bits": 4, + "sym": True, + "group_size": 128, + "ratio": 1.0, + }, + "Mistral-7B-Instruct-v0.2": { + "bits": 4, + "sym": True, + "group_size": 128, + "ratio": 1.0, + }, + "openbmb/MiniCPM4-0.5B": { + "bits": 4, + "sym": True, + "group_size": 128, + "ratio": 1.0, + }, + "openbmb/MiniCPM4-8B": { + "bits": 4, + "sym": True, + "group_size": 128, + "ratio": 1.0, + }, "microsoft/Phi-4-mini-instruct": { "bits": 4, "sym": False, @@ -290,10 +321,9 @@ class OVQuantizationMethod(str, Enum): }, "deepseek-ai/DeepSeek-R1-Distill-Llama-8B": { "bits": 4, - "sym": False, - "group_size": 64, - "ratio": 0.8, - "quant_method": OVQuantizationMethod.AWQ, + "sym": True, + "group_size": 128, + "ratio": 1, }, "microsoft/Phi-4-multimodal-instruct": { "quantization_configs": { From e34e54d90f9a61ff9dbc60304ce13fcc7ced3bb6 Mon Sep 17 00:00:00 2001 From: Nikita Savelyev Date: Fri, 31 Oct 2025 12:57:08 +0100 Subject: [PATCH 2/2] Update optimum/intel/openvino/configuration.py --- optimum/intel/openvino/configuration.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/optimum/intel/openvino/configuration.py b/optimum/intel/openvino/configuration.py index cd91bd3b55..5db7a33f22 100644 --- a/optimum/intel/openvino/configuration.py +++ b/optimum/intel/openvino/configuration.py @@ -280,7 +280,7 @@ class OVQuantizationMethod(str, Enum): "group_size": 128, "ratio": 1.0, }, - "Mistral-7B-Instruct-v0.2": { + "mistralai/Mistral-7B-Instruct-v0.2": { "bits": 4, "sym": True, "group_size": 128,