Look into models from huggingface (#22)

xadupre · web-flow · commit dd5d08fb332c · 2025-03-27T16:39:53.000+01:00
* hub

* bb

* black

* data

* mypy

* doc

* add tiny

* fix dummy inputs

* dd

* doc

* fix llm

* fix issues
diff --git a/.github/workflows/spell-check.yml b/.github/workflows/spell-check.yml
@@ -21,4 +21,4 @@ jobs:
 
       # Run codespell
       - name: Run codespell
-        run: codespell --skip="*.png,*.jpg,*.jpeg,*.gif,*.svg,*.ico,*.pdf,*.js" --ignore-words-list="nd,te,OT" --check-filenames
+        run: codespell --skip="*.png,*.jpg,*.jpeg,*.gif,*.svg,*.ico,*.pdf,*.js,*.css,*.map" --ignore-words-list="nd,te,OT" --check-filenames
diff --git a/_doc/api/torch_models/hghub/hub_api.rst b/_doc/api/torch_models/hghub/hub_api.rst
@@ -0,0 +1,7 @@
+
+onnx_diagnostic.torch_models.hghub.hub_api
+==========================================
+
+.. automodule:: onnx_diagnostic.torch_models.hghub.hub_api
+    :members:
+    :no-undoc-members:
diff --git a/_doc/api/torch_models/hghub/hub_data.rst b/_doc/api/torch_models/hghub/hub_data.rst
@@ -0,0 +1,7 @@
+
+onnx_diagnostic.torch_models.hghub.hub_data
+===========================================
+
+.. automodule:: onnx_diagnostic.torch_models.hghub.hub_data
+    :members:
+    :no-undoc-members:
diff --git a/_doc/api/torch_models/hghub/index.rst b/_doc/api/torch_models/hghub/index.rst
@@ -0,0 +1,16 @@
+onnx_diagnostic.torch_models.hghub
+==================================
+
+.. toctree::
+    :maxdepth: 1
+    :caption: submodules
+
+    hub_api
+    hub_data
+    model_inputs
+
+.. autofunction:: onnx_diagnostic.torch_models.hghub.get_untrained_model_with_inputs
+
+.. automodule:: onnx_diagnostic.torch_models.hghub
+    :members:
+    :no-undoc-members:
diff --git a/_doc/api/torch_models/hghub/model_inputs.rst b/_doc/api/torch_models/hghub/model_inputs.rst
@@ -0,0 +1,8 @@
+
+onnx_diagnostic.torch_models.hghub.model_inputs
+===============================================
+
+.. automodule:: onnx_diagnostic.torch_models.hghub.model_inputs
+    :members:
+    :no-undoc-members:
+    :exclude-members: get_untrained_model_with_inputs
diff --git a/_doc/api/torch_models/index.rst b/_doc/api/torch_models/index.rst
@@ -5,6 +5,7 @@ onnx_diagnostic.torch_models
     :maxdepth: 1
     :caption: submodules
 
+    hghub/index
     llms
 
 .. automodule:: onnx_diagnostic.torch_models
diff --git a/_doc/conf.py b/_doc/conf.py
@@ -124,6 +124,7 @@
     ("py:class", "transformers.cache_utils.MambaCache"),
     ("py:func", "torch.export._draft_export.draft_export"),
     ("py:func", "torch._export.tools.report_exportability"),
+    ("py:meth", "huggingface_hub.HfApi.list_models"),
     ("py:meth", "transformers.GenerationMixin.generate"),
 ]
 
@@ -182,6 +183,7 @@
     "graph break": "https://pytorch.org/docs/stable/torch.compiler_faq.html#graph-breaks",
     "GraphModule": "https://pytorch.org/docs/stable/fx.html#torch.fx.GraphModule",
     "HuggingFace": "https://huggingface.co/docs/hub/en/index",
+    "huggingface_hub": "https://github.com/huggingface/huggingface_hub",
     "Linux": "https://www.linux.org/",
     "ml_dtypes": "https://github.com/jax-ml/ml_dtypes",
     "monai": "https://monai.io/",
@@ -224,3 +226,13 @@
     "vocos": "https://github.com/gemelo-ai/vocos",
     "Windows": "https://www.microsoft.com/windows",
 }
+
+# links to the HuggingFace model pages referenced with :epkg: in the documentation
+epkg_dictionary.update(
+    {
+        "arnir0/Tiny-LLM": "https://huggingface.co/arnir0/Tiny-LLM",
+        "microsoft/phi-2": "https://huggingface.co/microsoft/phi-2",
+        "microsoft/Phi-3.5-mini-instruct": "https://huggingface.co/microsoft/Phi-3.5-mini-instruct",
+        "microsoft/Phi-3.5-vision-instruct": "https://huggingface.co/microsoft/Phi-3.5-vision-instruct",
+    }
+)
diff --git a/_doc/examples/plot_export_tiny_llm.py b/_doc/examples/plot_export_tiny_llm.py
@@ -13,8 +13,7 @@
 That example shows to guess the inputs of this method even though the model
 is executed through meth ``generate``.
 
-We focus on the model
-`Tiny-LLM <https://huggingface.co/arnir0/Tiny-LLM>`_.
+We focus on the model :epkg:`arnir0/Tiny-LLM`.
 To avoid downloading any weights, we write a function creating a
 random model based on the same architecture.
 
diff --git a/_doc/examples/plot_export_tiny_llm_patched.py b/_doc/examples/plot_export_tiny_llm_patched.py
@@ -6,8 +6,7 @@
 
 Many models from :epkg:`transformers` cannot be converted because
 the implementation uses cache classes. Let's see how to get around that.
-We focus on the model
-`Tiny-LLM <https://huggingface.co/arnir0/Tiny-LLM>`_.
+We focus on the model :epkg:`arnir0/Tiny-LLM`.
 To avoid downloading any weights, we write a function creating a
 random model based on the same architecture.
 This continues example :ref:`l-plot-tiny-llm-export`.
diff --git a/_unittests/ut_torch_models/test_hghub_api.py b/_unittests/ut_torch_models/test_hghub_api.py
@@ -0,0 +1,116 @@
+import unittest
+import pandas
+from onnx_diagnostic.ext_test_case import (
+    ExtTestCase,
+    hide_stdout,
+    never_test,
+    requires_torch,
+    requires_transformers,
+)
+from onnx_diagnostic.torch_models.hghub.hub_api import (
+    enumerate_model_list,
+    get_model_info,
+    get_pretrained_config,
+    task_from_id,
+    task_from_arch,
+    task_from_tags,
+)
+from onnx_diagnostic.torch_models.hghub.hub_data import load_architecture_task
+
+
+class TestHuggingFaceHubApi(ExtTestCase):  # exercises hghub.hub_api and hghub.hub_data
+
+    @requires_transformers("4.50")  # restricts this test to some of the CI configurations
+    @requires_torch("2.7")
+    def test_enumerate_model_list(self):
+        models = list(
+            enumerate_model_list(
+                2,  # the assertion below expects exactly two models
+                verbose=1,
+                dump="test_enumerate_model_list.csv",  # read back with pandas below
+                filter="text-generation",
+                library="transformers",
+            )
+        )
+        self.assertEqual(len(models), 2)
+        df = pandas.read_csv("test_enumerate_model_list.csv")
+        self.assertEqual(df.shape, (2, 12))  # 2 rows, 12 columns
+        tasks = [task_from_id(c) for c in df.id]
+        self.assertEqual(["text-generation", "text-generation"], tasks)
+
+    @requires_transformers("4.50")
+    @requires_torch("2.7")
+    def test_task_from_id(self):
+        for name, etask in [  # (model id, expected task)
+            ("arnir0/Tiny-LLM", "text-generation"),
+            ("microsoft/phi-2", "text-generation"),
+        ]:
+            with self.subTest(name=name, task=etask):
+                task = task_from_id(name, True)
+                self.assertEqual(etask, task)
+
+    @requires_transformers("4.50")
+    @requires_torch("2.7")
+    @never_test()  # NOTE(review): presumably keeps this test out of regular runs - confirm
+    def test_task_from_id_long(self):
+        for name, etask in [  # (model id, expected task)
+            ("microsoft/Phi-3.5-mini-instruct", "text-generation"),
+            ("microsoft/Phi-3.5-vision-instruct", "text-generation"),  # NOTE(review): test_get_model_info expects pipeline_tag "image-text-to-text" for this id
+        ]:
+            with self.subTest(name=name, task=etask):
+                task = task_from_id(name, True)
+                self.assertEqual(etask, task)
+
+    @requires_transformers("4.50")
+    @requires_torch("2.7")
+    @hide_stdout()
+    def test_get_pretrained_config(self):
+        conf = get_pretrained_config("microsoft/phi-2")
+        self.assertNotEmpty(conf)
+        print(conf)
+
+    @requires_transformers("4.50")
+    @requires_torch("2.7")
+    @hide_stdout()
+    def test_get_model_info(self):
+        info = get_model_info("microsoft/phi-2")
+        self.assertEqual(info.pipeline_tag, "text-generation")
+
+        info = get_model_info("microsoft/Phi-3.5-vision-instruct")
+        self.assertEqual(info.pipeline_tag, "image-text-to-text")
+
+        info = get_model_info("microsoft/Phi-4-multimodal-instruct")
+        self.assertEqual(info.pipeline_tag, "automatic-speech-recognition")
+
+    def test_task_from_arch(self):
+        task = task_from_arch("LlamaForCausalLM")
+        self.assertEqual("text-generation", task)
+
+    @never_test()  # NOTE(review): presumably keeps this test out of regular runs - confirm
+    def test_hf_all_models(self):
+        list(enumerate_model_list(-1, verbose=1, dump="test_hf_all_models.csv"))
+
+    def test_load_architecture_task(self):
+        data = load_architecture_task()
+        print(set(data.values()))  # no assertion: only checks that the call does not raise
+
+    def test_task_from_tags(self):
+        _tags = [  # (tags joined with "|", expected task)
+            ("text-generation|nlp|code|en|text-generation-inference", "text-generation"),
+            (
+                "text-generation|nlp|code|vision|image-text-to-text|conversational",
+                "image-text-to-text",
+            ),
+            (
+                "text-generation|nlp|code|audio|automatic-speech-recognition|speech-summarization|speech-translation|visual-question-answering",
+                "automatic-speech-recognition",
+            ),
+        ]
+        for tags, etask in _tags:
+            with self.subTest(tags=tags, task=etask):
+                task = task_from_tags(tags)
+                self.assertEqual(etask, task)
+
+
+if __name__ == "__main__":
+    unittest.main(verbosity=2)
diff --git a/_unittests/ut_torch_models/test_hghub_model.py b/_unittests/ut_torch_models/test_hghub_model.py
@@ -0,0 +1,60 @@
+import unittest
+import transformers
+from onnx_diagnostic.ext_test_case import (
+    ExtTestCase,
+    hide_stdout,
+    requires_torch,
+    requires_transformers,
+)
+from onnx_diagnostic.torch_models.hghub.model_inputs import (
+    config_class_from_architecture,
+    get_untrained_model_with_inputs,
+)
+
+
+class TestHuggingFaceHubModel(ExtTestCase):  # exercises hghub.model_inputs
+    @requires_transformers("4.50")  # restricts this test to some of the CI configurations
+    @requires_torch("2.7")
+    def test_config_class_from_architecture(self):
+        config = config_class_from_architecture("LlamaForCausalLM")
+        self.assertEqual(config, transformers.LlamaConfig)
+
+    @hide_stdout()
+    def test_get_untrained_model_with_inputs_tiny_llm(self):
+        mid = "arnir0/Tiny-LLM"
+        data = get_untrained_model_with_inputs(mid, verbose=1)
+        model, inputs = data["model"], data["inputs"]
+        model(**inputs)  # the model must accept the inputs returned with it
+        self.assertEqual((1858125824, 464531456), (data["size"], data["n_weights"]))  # size == 4 * n_weights (presumably float32 bytes, TODO confirm)
+
+    @hide_stdout()
+    def test_get_untrained_model_with_inputs_tiny_xlm_roberta(self):
+        mid = "hf-internal-testing/tiny-xlm-roberta"  # XLMRobertaConfig
+        data = get_untrained_model_with_inputs(mid, verbose=1)
+        model, inputs = data["model"], data["inputs"]
+        model(**inputs)  # the model must accept the inputs returned with it
+        self.assertEqual((126190824, 31547706), (data["size"], data["n_weights"]))  # size == 4 * n_weights
+
+    @hide_stdout()
+    def test_get_untrained_model_with_inputs_tiny_gpt_neo(self):
+        mid = "hf-internal-testing/tiny-random-GPTNeoXForCausalLM"
+        data = get_untrained_model_with_inputs(mid, verbose=1)
+        model, inputs = data["model"], data["inputs"]
+        model(**inputs)  # the model must accept the inputs returned with it
+        self.assertEqual((4291141632, 1072785408), (data["size"], data["n_weights"]))  # size == 4 * n_weights
+
+    @hide_stdout()
+    def test_get_untrained_model_with_inputs_phi_2(self):
+        mid = "microsoft/phi-2"
+        data = get_untrained_model_with_inputs(mid, verbose=1)
+        model, inputs = data["model"], data["inputs"]
+        model(**inputs)  # the model must accept the inputs returned with it
+        # the expected values depend on the installed version of transformers
+        self.assertIn(
+            (data["size"], data["n_weights"]),
+            [(1040293888, 260073472), (1040498688, 260124672)],
+        )
+
+
+if __name__ == "__main__":
+    unittest.main(verbosity=2)
diff --git a/onnx_diagnostic/__init__.py b/onnx_diagnostic/__init__.py
@@ -3,5 +3,5 @@
 Functions, classes to dig into a model when this one is right, slow, wrong...
 """
 
-__version__ = "0.2.2"
+__version__ = "0.3.0"
 __author__ = "Xavier Dupré"
diff --git a/onnx_diagnostic/torch_export_patches/patches/patch_torch.py b/onnx_diagnostic/torch_export_patches/patches/patch_torch.py
@@ -131,7 +131,7 @@ def patched__broadcast_shapes(*_shapes):
         assert isinstance(shape, Sequence)
 
     # Computes common shape
-    common_shape: List[Union[int, torch.SymInt]] = [
+    common_shape = [  # List[Union[int, torch.SymInt]]
         1,
     ] * reduce(max, (len(shape) for shape in shapes))
     for _arg_idx, shape in enumerate(shapes):
diff --git a/onnx_diagnostic/torch_models/hghub/__init__.py b/onnx_diagnostic/torch_models/hghub/__init__.py
@@ -0,0 +1 @@
+from .model_inputs import get_untrained_model_with_inputs
diff --git a/onnx_diagnostic/torch_models/hghub/hub_api.py b/onnx_diagnostic/torch_models/hghub/hub_api.py
diff --git a/onnx_diagnostic/torch_models/hghub/hub_data.py b/onnx_diagnostic/torch_models/hghub/hub_data.py
diff --git a/onnx_diagnostic/torch_models/hghub/model_inputs.py b/onnx_diagnostic/torch_models/hghub/model_inputs.py
diff --git a/onnx_diagnostic/torch_models/untrained/llm_phi2.py b/onnx_diagnostic/torch_models/untrained/llm_phi2.py
diff --git a/onnx_diagnostic/torch_models/untrained/llm_tiny_llm.py b/onnx_diagnostic/torch_models/untrained/llm_tiny_llm.py
diff --git a/pyproject.toml b/pyproject.toml
diff --git a/requirements-dev.txt b/requirements-dev.txt