sdpython
diff --git a/‎_unittests/ut_helpers/test_config_helper.py‎
Lines changed: 20 additions & 0 deletions b/‎_unittests/ut_helpers/test_config_helper.py‎
Lines changed: 20 additions & 0 deletions
diff --git a/‎_unittests/ut_tasks/test_tasks.py‎
Lines changed: 105 additions & 0 deletions b/‎_unittests/ut_tasks/test_tasks.py‎
Lines changed: 105 additions & 0 deletions
diff --git a/‎_unittests/ut_torch_models/try_tasks.py‎ renamed to ‎_unittests/ut_tasks/try_tasks.py‎
Lines changed: 22 additions & 6 deletions b/‎_unittests/ut_torch_models/try_tasks.py‎ renamed to ‎_unittests/ut_tasks/try_tasks.py‎
Lines changed: 22 additions & 6 deletions
diff --git a/‎_unittests/ut_torch_models/test_hghub_model.py‎
Lines changed: 1 addition & 99 deletions b/‎_unittests/ut_torch_models/test_hghub_model.py‎
Lines changed: 1 addition & 99 deletions
diff --git a/‎onnx_diagnostic/_command_lines_parser.py‎
Lines changed: 2 additions & 2 deletions b/‎onnx_diagnostic/_command_lines_parser.py‎
Lines changed: 2 additions & 2 deletions
@@ -0,0 +1,20 @@
+import unittest
+import transformers
+from onnx_diagnostic.ext_test_case import (
+    ExtTestCase,
+    requires_torch,
+    requires_transformers,
+)
+from onnx_diagnostic.helpers.config_helper import config_class_from_architecture
+
+
+class TestConfigHelper(ExtTestCase):
+    @requires_transformers("4.50")  # we limit to some versions of the CI
+    @requires_torch("2.7")
+    def test_config_class_from_architecture(self):
+        config = config_class_from_architecture("LlamaForCausalLM")
+        self.assertEqual(config, transformers.LlamaConfig)
+
+
+if __name__ == "__main__":
+    unittest.main(verbosity=2)
@@ -0,0 +1,105 @@
+import unittest
+import torch
+from onnx_diagnostic.ext_test_case import ExtTestCase, hide_stdout
+from onnx_diagnostic.torch_models.hghub.model_inputs import get_untrained_model_with_inputs
+from onnx_diagnostic.torch_export_patches import bypass_export_some_errors
+
+
+class TestTasks(ExtTestCase):
+    @hide_stdout()
+    def test_text2text_generation(self):
+        mid = "sshleifer/tiny-marian-en-de"
+        # mid = "Salesforce/codet5-small"
+        data = get_untrained_model_with_inputs(mid, verbose=1)
+        self.assertIn((data["size"], data["n_weights"]), [(473928, 118482)])
+        model, inputs = data["model"], data["inputs"]
+        raise unittest.SkipTest(f"not working for {mid!r}")
+        model(**inputs)
+
+    @hide_stdout()
+    def test_automatic_speech_recognition(self):
+        mid = "openai/whisper-tiny"
+        data = get_untrained_model_with_inputs(mid, verbose=1)
+        self.assertIn((data["size"], data["n_weights"]), [(132115968, 33028992)])
+        model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
+        Dim = torch.export.Dim
+        self.maxDiff = None
+        self.assertIn("{0:Dim(batch),1:Dim(seq_length)}", self.string_type(ds))
+        self.assertEqualAny(
+            {
+                "decoder_input_ids": {
+                    0: Dim("batch", min=1, max=1024),
+                    1: Dim("seq_length", min=1, max=4096),
+                },
+                "cache_position": {0: Dim("seq_length", min=1, max=4096)},
+                "encoder_outputs": [{0: Dim("batch", min=1, max=1024)}],
+                "past_key_values": [
+                    [
+                        [
+                            {0: Dim("batch", min=1, max=1024)},
+                            {0: Dim("batch", min=1, max=1024)},
+                        ],
+                        [
+                            {0: Dim("batch", min=1, max=1024)},
+                            {0: Dim("batch", min=1, max=1024)},
+                        ],
+                    ],
+                    [
+                        [
+                            {0: Dim("batch", min=1, max=1024)},
+                            {0: Dim("batch", min=1, max=1024)},
+                        ],
+                        [
+                            {0: Dim("batch", min=1, max=1024)},
+                            {0: Dim("batch", min=1, max=1024)},
+                        ],
+                    ],
+                ],
+            },
+            ds,
+        )
+        model(**inputs)
+        self.assertEqual(
+            "#1[T1r3]",
+            self.string_type(torch.utils._pytree.tree_flatten(inputs["encoder_outputs"])[0]),
+        )
+        with bypass_export_some_errors(patch_transformers=True, verbose=10):
+            flat = torch.utils._pytree.tree_flatten(inputs["past_key_values"])[0]
+            self.assertIsInstance(flat, list)
+            self.assertIsInstance(flat[0], torch.Tensor)
+            self.assertEqual(
+                "#8[T1r4,T1r4,T1r4,T1r4,T1r4,T1r4,T1r4,T1r4]",
+                self.string_type(flat),
+            )
+            torch.export.export(model, (), kwargs=inputs, dynamic_shapes=ds, strict=False)
+        with bypass_export_some_errors(patch_transformers=True, verbose=10):
+            flat = torch.utils._pytree.tree_flatten(inputs["past_key_values"])[0]
+            self.assertIsInstance(flat, list)
+            self.assertIsInstance(flat[0], torch.Tensor)
+            self.assertEqual(
+                "#8[T1r4,T1r4,T1r4,T1r4,T1r4,T1r4,T1r4,T1r4]",
+                self.string_type(flat),
+            )
+            torch.export.export(model, (), kwargs=inputs, dynamic_shapes=ds, strict=False)
+
+    @hide_stdout()
+    def test_imagetext2text_generation(self):
+        mid = "HuggingFaceM4/tiny-random-idefics"
+        # mid = "Salesforce/codet5-small"
+        data = get_untrained_model_with_inputs(mid, verbose=1)
+        self.assertIn((data["size"], data["n_weights"]), [(12742888, 3185722)])
+        model, inputs = data["model"], data["inputs"]
+        model(**inputs)
+
+    @hide_stdout()
+    def test_fill_mask(self):
+        mid = "google-bert/bert-base-multilingual-cased"
+        # mid = "Salesforce/codet5-small"
+        data = get_untrained_model_with_inputs(mid, verbose=1)
+        self.assertIn((data["size"], data["n_weights"]), [(12742888, 3185722)])
+        model, inputs = data["model"], data["inputs"]
+        model(**inputs)
+
+
+if __name__ == "__main__":
+    unittest.main(verbosity=2)
@@ -7,7 +7,7 @@
 class TestHuggingFaceHubModel(ExtTestCase):
     @never_test()
     def test_image_classification(self):
-        # clear&&NEVERTEST=1 python _unittests/ut_torch_models/try_tasks.py -k image_c
+        # clear&&NEVERTEST=1 python _unittests/ut_tasks/try_tasks.py -k image_c
 
         from transformers import ViTImageProcessor, ViTModel
         from PIL import Image
@@ -27,7 +27,7 @@ def test_image_classification(self):
 
     @never_test()
     def test_image_classification_resnet(self):
-        # clear&&NEVERTEST=1 python _unittests/ut_torch_models/try_tasks.py -k resnet
+        # clear&&NEVERTEST=1 python _unittests/ut_tasks/try_tasks.py -k resnet
 
         from transformers import ViTImageProcessor, ViTModel
         from PIL import Image
@@ -47,7 +47,7 @@ def test_image_classification_resnet(self):
 
     @never_test()
     def test_zero_shot_image_classification(self):
-        # clear&&NEVERTEST=1 python _unittests/ut_torch_models/try_tasks.py -k zero
+        # clear&&NEVERTEST=1 python _unittests/ut_tasks/try_tasks.py -k zero
         from PIL import Image
         import requests
         from transformers import CLIPProcessor, CLIPModel
@@ -74,7 +74,7 @@ def test_zero_shot_image_classification(self):
 
     @never_test()
     def test_text2text_generation(self):
-        # clear&&NEVERTEST=1 python _unittests/ut_torch_models/try_tasks.py -k text2t
+        # clear&&NEVERTEST=1 python _unittests/ut_tasks/try_tasks.py -k text2t
 
         import torch
         from transformers import RobertaTokenizer, T5ForConditionalGeneration
@@ -100,7 +100,7 @@ def test_text2text_generation(self):
 
     @never_test()
     def test_imagetext2text_generation(self):
-        # clear&&NEVERTEST=1 python _unittests/ut_torch_models/try_tasks.py -k etext2t
+        # clear&&NEVERTEST=1 python _unittests/ut_tasks/try_tasks.py -k etext2t
         # https://huggingface.co/docs/transformers/main/en/tasks/idefics
 
         import torch
@@ -131,7 +131,7 @@ def test_imagetext2text_generation(self):
 
     @never_test()
     def test_automatic_speech_recognition(self):
-        # clear&&NEVERTEST=1 python _unittests/ut_torch_models/try_tasks.py -k automatic_speech
+        # clear&&NEVERTEST=1 python _unittests/ut_tasks/try_tasks.py -k automatic_speech
         # https://huggingface.co/openai/whisper-tiny
 
         from transformers import WhisperProcessor, WhisperForConditionalGeneration
@@ -195,6 +195,22 @@ def test_automatic_speech_recognition(self):
         transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)
         print("--", transcription)
 
+    @never_test()
+    def test_fill_mask(self):
+        # clear&&NEVERTEST=1 python _unittests/ut_tasks/try_tasks.py -k fill
+        # https://huggingface.co/google-bert/bert-base-multilingual-cased
+
+        from transformers import BertTokenizer, BertModel
+
+        tokenizer = BertTokenizer.from_pretrained("bert-base-multilingual-cased")
+        model = BertModel.from_pretrained("bert-base-multilingual-cased")
+        text = "Replace me by any text you'd like."
+        encoded_input = tokenizer(text, return_tensors="pt")
+        print()
+        print("-- inputs", string_type(encoded_input, with_shape=True, with_min_max=True))
+        output = model(**encoded_input)
+        print("-- outputs", string_type(output, with_shape=True, with_min_max=True))
+
 
 if __name__ == "__main__":
     unittest.main(verbosity=2)
@@ -1,30 +1,19 @@
 import pprint
 import unittest
-import torch
-import transformers
 from onnx_diagnostic.ext_test_case import (
     ExtTestCase,
     hide_stdout,
     requires_torch,
     requires_transformers,
     ignore_errors,
 )
-from onnx_diagnostic.torch_models.hghub.model_inputs import (
-    config_class_from_architecture,
-    get_untrained_model_with_inputs,
-)
+from onnx_diagnostic.torch_models.hghub.model_inputs import get_untrained_model_with_inputs
 from onnx_diagnostic.torch_models.hghub.hub_api import get_pretrained_config
 from onnx_diagnostic.torch_models.hghub.hub_data import load_models_testing
 from onnx_diagnostic.torch_export_patches import bypass_export_some_errors
 
 
 class TestHuggingFaceHubModel(ExtTestCase):
-    @requires_transformers("4.50")  # we limit to some versions of the CI
-    @requires_torch("2.7")
-    def test_config_class_from_architecture(self):
-        config = config_class_from_architecture("LlamaForCausalLM")
-        self.assertEqual(config, transformers.LlamaConfig)
-
     @hide_stdout()
     def test_get_untrained_model_with_inputs_tiny_llm(self):
         mid = "arnir0/Tiny-LLM"
@@ -107,91 +96,6 @@ def test_get_untrained_model_with_inputs_clip_vit(self):
         # different expected value for different version of transformers
         self.assertIn((data["size"], data["n_weights"]), [(188872708, 47218177)])
 
-    @hide_stdout()
-    def test_get_untrained_model_with_inputs_text2text_generation(self):
-        mid = "sshleifer/tiny-marian-en-de"
-        # mid = "Salesforce/codet5-small"
-        data = get_untrained_model_with_inputs(mid, verbose=1)
-        self.assertIn((data["size"], data["n_weights"]), [(473928, 118482)])
-        model, inputs = data["model"], data["inputs"]
-        raise unittest.SkipTest(f"not working for {mid!r}")
-        model(**inputs)
-
-    @hide_stdout()
-    def test_get_untrained_model_with_inputs_automatic_speech_recognition(self):
-        mid = "openai/whisper-tiny"
-        data = get_untrained_model_with_inputs(mid, verbose=1)
-        self.assertIn((data["size"], data["n_weights"]), [(132115968, 33028992)])
-        model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
-        Dim = torch.export.Dim
-        self.maxDiff = None
-        self.assertIn("{0:Dim(batch),1:Dim(seq_length)}", self.string_type(ds))
-        self.assertEqualAny(
-            {
-                "decoder_input_ids": {
-                    0: Dim("batch", min=1, max=1024),
-                    1: Dim("seq_length", min=1, max=4096),
-                },
-                "cache_position": {0: Dim("seq_length", min=1, max=4096)},
-                "encoder_outputs": [{0: Dim("batch", min=1, max=1024)}],
-                "past_key_values": [
-                    [
-                        [
-                            {0: Dim("batch", min=1, max=1024)},
-                            {0: Dim("batch", min=1, max=1024)},
-                        ],
-                        [
-                            {0: Dim("batch", min=1, max=1024)},
-                            {0: Dim("batch", min=1, max=1024)},
-                        ],
-                    ],
-                    [
-                        [
-                            {0: Dim("batch", min=1, max=1024)},
-                            {0: Dim("batch", min=1, max=1024)},
-                        ],
-                        [
-                            {0: Dim("batch", min=1, max=1024)},
-                            {0: Dim("batch", min=1, max=1024)},
-                        ],
-                    ],
-                ],
-            },
-            ds,
-        )
-        model(**inputs)
-        self.assertEqual(
-            "#1[T1r3]",
-            self.string_type(torch.utils._pytree.tree_flatten(inputs["encoder_outputs"])[0]),
-        )
-        with bypass_export_some_errors(patch_transformers=True, verbose=10):
-            flat = torch.utils._pytree.tree_flatten(inputs["past_key_values"])[0]
-            self.assertIsInstance(flat, list)
-            self.assertIsInstance(flat[0], torch.Tensor)
-            self.assertEqual(
-                "#8[T1r4,T1r4,T1r4,T1r4,T1r4,T1r4,T1r4,T1r4]",
-                self.string_type(flat),
-            )
-            torch.export.export(model, (), kwargs=inputs, dynamic_shapes=ds, strict=False)
-        with bypass_export_some_errors(patch_transformers=True, verbose=10):
-            flat = torch.utils._pytree.tree_flatten(inputs["past_key_values"])[0]
-            self.assertIsInstance(flat, list)
-            self.assertIsInstance(flat[0], torch.Tensor)
-            self.assertEqual(
-                "#8[T1r4,T1r4,T1r4,T1r4,T1r4,T1r4,T1r4,T1r4]",
-                self.string_type(flat),
-            )
-            torch.export.export(model, (), kwargs=inputs, dynamic_shapes=ds, strict=False)
-
-    @hide_stdout()
-    def test_get_untrained_model_with_inputs_imagetext2text_generation(self):
-        mid = "HuggingFaceM4/tiny-random-idefics"
-        # mid = "Salesforce/codet5-small"
-        data = get_untrained_model_with_inputs(mid, verbose=1)
-        self.assertIn((data["size"], data["n_weights"]), [(12742888, 3185722)])
-        model, inputs = data["model"], data["inputs"]
-        model(**inputs)
-
     @hide_stdout()
     @requires_torch("2.7", "reduce test time")
     @requires_transformers("4.50", "reduce test time")
@@ -210,11 +114,9 @@ def _diff(c1, c2):
         for mid in load_models_testing():
             with self.subTest(mid=mid):
                 if mid in {
-                    "hf-internal-testing/tiny-random-BeitForImageClassification",
                     "hf-internal-testing/tiny-random-MaskFormerForInstanceSegmentation",
                     "hf-internal-testing/tiny-random-MoonshineForConditionalGeneration",
                     "fxmarty/pix2struct-tiny-random",
-                    "hf-internal-testing/tiny-random-ViTMSNForImageClassification",
                     "hf-internal-testing/tiny-random-YolosModel",
                 }:
                     print(f"-- not implemented yet for {mid!r}")
 
@@ -303,13 +303,13 @@ def get_parser_validate() -> ArgumentParser:
 def _cmd_validate(argv: List[Any]):
     from .helpers import string_type
     from .torch_models.test_helper import get_inputs_for_task, validate_model, _ds_clean
-    from .torch_models.hghub.model_inputs import get_get_inputs_function_for_tasks
+    from .tasks import supported_tasks
 
     parser = get_parser_validate()
     args = parser.parse_args(argv[1:])
     if not args.task and not args.mid:
         print("-- list of supported tasks:")
-        print("\n".join(sorted(get_get_inputs_function_for_tasks())))
+        print("\n".join(supported_tasks()))
     elif not args.mid:
         data = get_inputs_for_task(args.task)
         if args.verbose: