Skip to content
Draft
Show file tree
Hide file tree
Changes from 9 commits
Commits
Show all changes
31 commits
Select commit Hold shift + click to select a range
9e80aba
add tests
echarlaix Oct 1, 2025
563de33
reorder
echarlaix Oct 1, 2025
e280b28
rename
echarlaix Oct 1, 2025
252368c
add olmo and smollm3
echarlaix Oct 1, 2025
e8ad17d
fix
echarlaix Oct 1, 2025
f978fce
add llama4 test
echarlaix Oct 2, 2025
226df98
add min deepseek transformers version
echarlaix Oct 2, 2025
7a8a1d7
remove min transformers constraint
echarlaix Oct 2, 2025
9b4b2e9
add tiny llama4 model
echarlaix Oct 2, 2025
9559e2f
add gpt-oss to documentation
echarlaix Oct 2, 2025
2389be1
remove reorder as it makes things less clear for review
echarlaix Oct 2, 2025
1819b85
add tests expected sdpa
echarlaix Oct 2, 2025
586d2e5
add model doc
echarlaix Oct 3, 2025
e9a7c7c
merge main
echarlaix Oct 3, 2025
65ce535
add ov attribute check for tests
echarlaix Oct 3, 2025
34ec242
style
echarlaix Oct 3, 2025
9c30790
style
echarlaix Oct 3, 2025
206246e
add vlm check_openvino_model_attributes
echarlaix Oct 3, 2025
a6035e9
set back img size
echarlaix Oct 3, 2025
a2cbaed
fix longt5
echarlaix Oct 3, 2025
11cf624
marian should not be tested depending on openvino version
echarlaix Oct 3, 2025
76b3405
add untested architectures for vision2seq models
echarlaix Oct 6, 2025
a44664e
phi4_multimodal
echarlaix Oct 6, 2025
21689cb
add phi4_multimodal tiny model for test
echarlaix Oct 6, 2025
6c4f99d
style
echarlaix Oct 6, 2025
63f22a9
add helium and nemotron
echarlaix Oct 6, 2025
0e382c6
merge main in branch
echarlaix Oct 21, 2025
b96d316
fix doc
echarlaix Oct 22, 2025
f0f15d3
fix nemotron
echarlaix Oct 22, 2025
9c3e916
merge main in branch
echarlaix Oct 22, 2025
d67b8c4
revert
echarlaix Oct 22, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions optimum/exporters/openvino/model_configs.py
Original file line number Diff line number Diff line change
Expand Up @@ -3969,6 +3969,7 @@ class M2M100OpenVINOConfig(BartOpenVINOConfig):
)
@register_in_tasks_manager("deepseek", *["text-generation", "text-generation-with-past"], library_name="transformers")
class DeepseekOpenVINOConfig(MiniCPM3OpenVINOConfig):
MIN_TRANSFORMERS_VERSION = "4.46.0"
Copy link
Collaborator Author

@echarlaix echarlaix Oct 2, 2025

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

MAX_TRANSFORMERS_VERSION = "4.54.0"

def patch_model_for_export(
Expand Down
112 changes: 75 additions & 37 deletions tests/openvino/test_decoder.py
Original file line number Diff line number Diff line change
Expand Up @@ -16,10 +16,13 @@
pipeline,
set_seed,
)
from transformers.models.auto.configuration_auto import CONFIG_MAPPING_NAMES
from transformers.testing_utils import slow
from utils_tests import MODEL_NAMES, get_num_sdpa, mock_torch_cuda_is_available, patch_awq_for_inference

from optimum.exporters.openvino.model_configs import DeepseekOpenVINOConfig
from optimum.exporters.openvino.model_patcher import patch_update_causal_mask
from optimum.exporters.tasks import TasksManager
from optimum.intel import OVModelForCausalLM, OVModelForSequenceClassification
from optimum.intel.openvino.utils import _print_compiled_model_properties
from optimum.intel.pipelines import pipeline as optimum_pipeline
Expand All @@ -36,67 +39,71 @@

class OVModelForCausalLMIntegrationTest(unittest.TestCase):
SUPPORTED_ARCHITECTURES = (
"bart",
"aquila",
"aquila2",
"arctic",
"baichuan2",
"baichuan2-13b",
"gpt_bigcode",
"bart",
"bigbird_pegasus",
"biogpt",
"blenderbot",
"blenderbot-small",
"bloom",
"chatglm",
"chatglm4",
"codegen",
"codegen2",
"cohere",
"dbrx",
"decilm",
"exaone",
"falcon",
"falcon-40b",
"gemma",
"gemma2",
"gpt2",
"gptj",
"gpt_bigcode",
"gpt_neo",
"gpt_neox",
"gpt_neox_japanese",
"gptj",
"granite",
"granitemoe",
"internlm",
"internlm2",
"jais",
"llama",
"llama4",
"llama4_text",
"marian",
"mbart",
"minicpm",
"mistral",
"mixtral",
"mpt",
"olmo",
"opt",
"pegasus",
"qwen",
"phi",
"internlm2",
"orion",
"falcon",
"falcon-40b",
"pegasus",
"persimmon",
"biogpt",
"gpt_neox_japanese",
"xglm",
"aquila",
"aquila2",
"xverse",
"internlm",
"jais",
"chatglm4",
"decilm",
"gemma",
"olmo",
"stablelm",
"starcoder2",
"dbrx",
"cohere",
"phi",
"phi3",
"qwen",
"qwen2",
"qwen2_moe",
"arctic",
"phi3",
"gemma2",
"exaone",
"granite",
"granite-moe",
"stablelm",
"starcoder2",
"xglm",
"xverse",
)

SUPPORTED_SSM_ARCHITECTURES = ("mamba", "falcon-mamba")
SUPPORTED_SSM_ARCHITECTURES = ("mamba", "falcon_mamba")

SUPPORTED_ARCHITECTURES += SUPPORTED_SSM_ARCHITECTURES

if is_transformers_version(">=", "4.46.0"):
SUPPORTED_ARCHITECTURES += ("glm", "mistral-nemo", "minicpm3", "phi3-moe")
SUPPORTED_ARCHITECTURES += ("glm", "mistral-nemo", "minicpm3", "phimoe")
# openvino 2025.0 required for disabling check_trace
if is_openvino_version(">=", "2025.0"):
SUPPORTED_ARCHITECTURES += ("deepseek",)
Expand All @@ -109,6 +116,9 @@ class OVModelForCausalLMIntegrationTest(unittest.TestCase):
if is_openvino_version(">=", "2024.6.0") and platform.system() != "Windows":
SUPPORTED_ARCHITECTURES += ("mixtral_awq",)

if is_transformers_version(">", "4.47"):
SUPPORTED_ARCHITECTURES += ("olmo2",)

if is_transformers_version(">", "4.49"):
SUPPORTED_ARCHITECTURES += ("gemma3_text",)

Expand All @@ -119,7 +129,7 @@ class OVModelForCausalLMIntegrationTest(unittest.TestCase):
SUPPORTED_ARCHITECTURES += ("glm4",)

if is_transformers_version(">=", "4.53.0"):
SUPPORTED_ARCHITECTURES += ("arcee",)
SUPPORTED_ARCHITECTURES += ("arcee", "smollm3")

if is_transformers_version(">=", "4.54.0"):
# remote code models differs after transformers v4.54
Expand Down Expand Up @@ -167,6 +177,8 @@ class OVModelForCausalLMIntegrationTest(unittest.TestCase):
"gpt_neo": 4,
"gpt_neox": 5,
"llama": 2,
"llama4": 5,
"llama4_text": 2,
"marian": 2,
"minicpm": 4,
"mistral": 2,
Expand Down Expand Up @@ -201,11 +213,11 @@ class OVModelForCausalLMIntegrationTest(unittest.TestCase):
"gemma2": 4,
"exaone": 8,
"granite": 6,
"granite-moe": 6,
"granitemoe": 6,
"glm": 28,
"mistral-nemo": 8,
"minicpm3": 6,
"phi3-moe": 2,
"phimoe": 2,
"deepseek": 2,
"opt_gptq": 12,
"mixtral_awq": 2,
Expand All @@ -214,9 +226,35 @@ class OVModelForCausalLMIntegrationTest(unittest.TestCase):
"qwen3": 2,
"qwen3_moe": 2,
"mamba": 0,
"falcon-mamba": 0,
"falcon_mamba": 0,
"arcee": 2,
}
TASK = "text-generation"

def test_find_untested_architectures(self):
    """Fail if SUPPORTED_ARCHITECTURES has duplicates or misses an architecture
    that both transformers and the OpenVINO exporter support for this task."""
    # Guard against accidental duplicate entries in the tested list.
    if len(set(self.SUPPORTED_ARCHITECTURES)) != len(self.SUPPORTED_ARCHITECTURES):
        raise ValueError(
            f"For the task `{self.TASK}`, some architectures are duplicated in the list of tested architectures: "
            f"{self.SUPPORTED_ARCHITECTURES}.\n"
        )

    tested = set(self.SUPPORTED_ARCHITECTURES)
    # Architectures known to transformers, intersected with what the
    # OpenVINO exporter registers for this task.
    exportable = set(
        TasksManager.get_supported_model_type_for_task(task=self.TASK, exporter="openvino")
    ) & set(CONFIG_MAPPING_NAMES.keys())

    # Deepseek export is capped at a maximum transformers version; past that
    # cap the deepseek variants are expected to be untested, so exclude them.
    if is_transformers_version(">=", str(DeepseekOpenVINOConfig.MAX_TRANSFORMERS_VERSION)):
        exportable.discard("deepseek_v2")
        exportable.discard("deepseek_v3")

    untested = exportable - tested

    if untested:
        raise ValueError(
            f"For the task `{self.TASK}`, the OpenVINO exporter supports {untested} which are not tested"
        )

# TODO: remove gptq/awq from here
@parameterized.expand(SUPPORTED_ARCHITECTURES)
Expand Down
2 changes: 1 addition & 1 deletion tests/openvino/test_export.py
Original file line number Diff line number Diff line change
Expand Up @@ -81,7 +81,7 @@ class ExportModelTest(unittest.TestCase):
"speecht5": OVModelForTextToSpeechSeq2Seq,
"clip": OVModelForZeroShotImageClassification,
"mamba": OVModelForCausalLM,
"falcon-mamba": OVModelForCausalLM,
"falcon_mamba": OVModelForCausalLM,
"stable-diffusion-3": OVStableDiffusion3Pipeline,
"flux": OVFluxPipeline,
"ltx-video": OVLTXPipeline,
Expand Down
4 changes: 2 additions & 2 deletions tests/openvino/test_exporters_cli.py
Original file line number Diff line number Diff line change
Expand Up @@ -84,7 +84,7 @@ class OVCLIExportTestCase(unittest.TestCase):
("text2text-generation", "t5"),
("text2text-generation-with-past", "t5"),
("text-generation-with-past", "mamba"),
("text-generation-with-past", "falcon-mamba"),
("text-generation-with-past", "falcon_mamba"),
("text-classification", "albert"),
("question-answering", "distilbert"),
("token-classification", "roberta"),
Expand Down Expand Up @@ -127,7 +127,7 @@ class OVCLIExportTestCase(unittest.TestCase):
"speecht5": 2,
"clip": 2 if is_tokenizers_version("<", "0.20.0") or is_openvino_version(">=", "2024.5") else 0,
"mamba": 2,
"falcon-mamba": 2,
"falcon_mamba": 2,
"qwen3": 2,
}

Expand Down
14 changes: 7 additions & 7 deletions tests/openvino/utils_tests.py
Original file line number Diff line number Diff line change
Expand Up @@ -75,7 +75,7 @@
"gemma3": "katuni4ka/tiny-random-gemma3",
"falcon": "fxmarty/really-tiny-falcon-testing",
"falcon-40b": "katuni4ka/tiny-random-falcon-40b",
"falcon-mamba": "rkazants/tiny-falcon-mamba",
"falcon_mamba": "rkazants/tiny-falcon-mamba",
"flaubert": "hf-internal-testing/tiny-random-flaubert",
"flux": "katuni4ka/tiny-random-flux",
"flux-fill": "katuni4ka/tiny-random-flux-fill",
Expand All @@ -88,7 +88,7 @@
"gpt_oss_mxfp4": "echarlaix/tiny-random-gpt-oss-mxfp4",
"gptj": "hf-internal-testing/tiny-random-GPTJModel",
"granite": "katuni4ka/tiny-random-granite",
"granite-moe": "katuni4ka/tiny-random-granite-moe",
"granitemoe": "katuni4ka/tiny-random-granite-moe",
"hubert": "hf-internal-testing/tiny-random-HubertModel",
"ibert": "hf-internal-testing/tiny-random-ibert",
"idefics3": "hf-internal-testing/tiny-random-Idefics3ForConditionalGeneration",
Expand All @@ -101,11 +101,13 @@
"llama": "HuggingFaceM4/tiny-random-LlamaForCausalLM",
"llama_awq": "HuggingFaceH4/tiny-random-LlamaForCausalLM",
"llama4": "hf-internal-testing/tiny-random-llama4",
"llama4_text": "trl-internal-testing/tiny-Llama4ForCausalLM",
"llava": "katuni4ka/tiny-random-llava",
"llava_next": "katuni4ka/tiny-random-llava-next",
"llava_next_mistral": "optimum-internal-testing/tiny-random-llava-next-mistral",
"llava_next_video": "katuni4ka/tiny-random-llava-next-video",
"m2m_100": "hf-internal-testing/tiny-random-m2m_100",
"olmo2": "hf-internal-testing/tiny-random-Olmo2ForCausalLM",
"opt": "hf-internal-testing/tiny-random-OPTModel",
"opt125m": "facebook/opt-125m",
"opt_gptq": "ybelkada/opt-125m-gptq-4bit",
Expand Down Expand Up @@ -139,7 +141,7 @@
"pix2struct": "fxmarty/pix2struct-tiny-random",
"phi": "echarlaix/tiny-random-PhiForCausalLM",
"phi3": "Xenova/tiny-random-Phi3ForCausalLM",
"phi3-moe": "katuni4ka/phi-3.5-moe-tiny-random",
"phimoe": "katuni4ka/phi-3.5-moe-tiny-random",
"phi3_v": "katuni4ka/tiny-random-phi3-vision",
"phi4mm": "katuni4ka/tiny-random-phi-4-multimodal",
"poolformer": "hf-internal-testing/tiny-random-PoolFormerModel",
Expand All @@ -156,6 +158,7 @@
"segformer": "hf-internal-testing/tiny-random-SegformerModel",
"sentence-transformers-bert": "sentence-transformers-testing/stsb-bert-tiny-safetensors",
"sam": "fxmarty/sam-vit-tiny-random",
"smollm3": "optimum-internal-testing/tiny-random-SmolLM3ForCausalLM",
"smolvlm": "katuni4ka/tiny-random-smolvlm2",
"speecht5": "hf-internal-testing/tiny-random-SpeechT5ForTextToSpeech",
"speech_to_text": "hf-internal-testing/tiny-random-Speech2TextModel",
Expand Down Expand Up @@ -326,7 +329,7 @@
},
"clip": {"model": 130},
"mamba": {"model": 386},
"falcon-mamba": {"model": 194},
"falcon_mamba": {"model": 194},
}

TEST_IMAGE_URL = "http://images.cocodataset.org/val2017/000000039769.jpg"
Expand Down Expand Up @@ -457,10 +460,8 @@ def get_num_sdpa(model):
"baichuan2-13b": "baichuan",
"chatglm4": "chatglm",
"codegen2": "codegen",
"falcon-mamba": "falcon_mamba",
"falcon-40b": "falcon",
"gpt_oss_mxfp4": "gpt_oss",
"granite-moe": "granitemoe",
"llama_awq": "llama",
"llava_next_mistral": "llava_next",
"mistral-nemo": "mistral",
Expand All @@ -470,7 +471,6 @@ def get_num_sdpa(model):
"opt_gptq": "opt",
"perceiver_text": "perceiver",
"perceiver_vision": "perceiver",
"phi3-moe": "phimoe",
"swin-window": "swin",
"vit-with-attentions": "vit",
"vit-with-hidden-states": "vit",
Expand Down
Loading