Enables export with fake tensors (#273)

xadupre · web-flow · commit 3f08c5f8f0a9 · 2025-10-24T23:25:46.000+02:00
* enables export with fake tensors

* improves tests

* fix

* fix fake export

* fix

* fix

* push

* doc

* doc

* foc

* fix index
diff --git a/CHANGELOGS.rst b/CHANGELOGS.rst
@@ -4,6 +4,7 @@ Change Logs
 0.7.16
 ++++++
 
+* :pr:`273`: enables export with FakeTensor
 * :pr:`272`: makes patches work with FakeTensor
 * :pr:`270`: add export sample code to export a specific model id with the appropriate inputs
 * :pr:`269`: adds one unit test to track a patch fixing broadcast output shape
diff --git a/_doc/conf.py b/_doc/conf.py
@@ -119,6 +119,8 @@ def linkcode_resolve(domain, info):
     ("py:class", "ast.Node"),
     ("py:class", "dtype"),
     ("py:class", "False"),
+    ("py:class", "FakeTensor"),
+    ("py:class", "FakeTensorMode"),
     ("py:class", "True"),
     ("py:class", "Argument"),
     ("py:class", "CacheProcessor"),
diff --git a/_doc/index.rst b/_doc/index.rst
@@ -135,7 +135,7 @@ See :func:`onnx_diagnostic.torch_export_patches.torch_export_rewrite`.
       # ...
 
 all_dynamic_shapes_from_inputs
-+++++++++++++++++++++++++++++
+++++++++++++++++++++++++++++++
 
 See :func:`onnx_diagnostic.export.shape_helper.all_dynamic_shapes_from_inputs`.
 
diff --git a/_unittests/ut_tasks/test_tasks_image_classification.py b/_unittests/ut_tasks/test_tasks_image_classification.py
@@ -14,14 +14,15 @@ def test_image_classification(self):
         self.assertEqual(data["task"], "image-classification")
         self.assertIn((data["size"], data["n_weights"]), [(56880, 14220)])
         model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
-        model(**inputs)
+        expected = model(**inputs)
         model(**data["inputs2"])
         if not has_transformers("4.52.999"):
             raise unittest.SkipTest("Requires transformers>=4.52")
         with torch_export_patches(patch_transformers=True, verbose=10):
-            torch.export.export(
+            ep = torch.export.export(
                 model, (), kwargs=inputs, dynamic_shapes=use_dyn_not_str(ds), strict=False
             )
+            self.assertEqualAny(expected, ep.module()(**inputs))
 
 
 if __name__ == "__main__":
diff --git a/_unittests/ut_tasks/test_tasks_image_text_to_text.py b/_unittests/ut_tasks/test_tasks_image_text_to_text.py
@@ -14,19 +14,21 @@
 
 class TestTasksImageTextToText(ExtTestCase):
     @hide_stdout()
-    @requires_transformers("4.53")
+    @requires_transformers("4.56")
     @requires_torch("2.7.99")
     def test_image_text_to_text_idefics(self):
         mid = "HuggingFaceM4/tiny-random-idefics"
         data = get_untrained_model_with_inputs(mid, verbose=1, add_second_input=True)
         self.assertEqual(data["task"], "image-text-to-text")
         model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
-        model(**torch_deepcopy(inputs))
+        expected = model(**torch_deepcopy(inputs))
         model(**data["inputs2"])
         with torch_export_patches(patch_transformers=True, verbose=10, patch_torch=False):
-            torch.export.export(
+            ep = torch.export.export(
                 model, (), kwargs=inputs, dynamic_shapes=use_dyn_not_str(ds), strict=False
             )
+            # The conversion does not work. Tolerance is set to 1.
+            self.assertEqualAny(expected, ep.module()(**inputs), atol=1)
 
     @hide_stdout()
     @requires_transformers("5.0.99")
@@ -44,12 +46,13 @@ def test_image_text_to_text_tiny_gemma3(self):
         # self.assertIn((data["size"], data["n_weights"]), [(17248576, 4312144)])
         model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
         print("--", self.string_type(data["inputs"], with_shape=True))
-        model(**torch_deepcopy(inputs))
+        expected = model(**torch_deepcopy(inputs))
         model(**data["inputs2"])
         with torch_export_patches(patch_transformers=True, verbose=10):
-            torch.export.export(
+            ep = torch.export.export(
                 model, (), kwargs=inputs, dynamic_shapes=use_dyn_not_str(ds), strict=False
             )
+            self.assertEqualAny(expected, ep.module()(**inputs))
 
     @hide_stdout()
     @requires_transformers("4.56.99")
@@ -72,11 +75,13 @@ def test_image_text_to_text_gemma3_4b_it(self):
         model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
         # inputs.pop("attention_mask")
         # ds.pop("attention_mask")
-        model(**torch_deepcopy(inputs))
+        expected = model(**torch_deepcopy(inputs))
         with torch_export_patches(patch_transformers=True, verbose=10):
-            torch.export.export(
+            ep = torch.export.export(
                 model, (), kwargs=inputs, dynamic_shapes=use_dyn_not_str(ds), strict=False
             )
+            # The conversion does not work. Tolerance is set to 1.
+            self.assertEqualAny(expected, ep.module()(**inputs))
 
     @hide_stdout()
     @requires_transformers("5.0.99")
@@ -93,12 +98,13 @@ def test_image_text_to_text_zai_glm(self):
         self.assertEqual(data["task"], "image-text-to-text")
         model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
         print("--", self.string_type(data["inputs"], with_shape=True))
-        model(**torch_deepcopy(inputs))
+        expected = model(**torch_deepcopy(inputs))
         model(**data["inputs2"])
         with torch_export_patches(patch_transformers=True, verbose=10):
-            torch.export.export(
+            ep = torch.export.export(
                 model, (), kwargs=inputs, dynamic_shapes=use_dyn_not_str(ds), strict=False
             )
+            self.assertEqualAny(expected, ep.module()(**inputs))
 
 
 if __name__ == "__main__":
diff --git a/_unittests/ut_tasks/test_tasks_mask_generation.py b/_unittests/ut_tasks/test_tasks_mask_generation.py
@@ -21,12 +21,13 @@ def test_mask_generation(self):
         data = get_untrained_model_with_inputs(mid, verbose=1, add_second_input=True)
         self.assertEqual(data["task"], "mask-generation")
         model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
-        model(**torch_deepcopy(inputs))
+        expected = model(**torch_deepcopy(inputs))
         model(**data["inputs2"])
         with torch_export_patches(patch_torch=False, patch_transformers=True, verbose=1):
-            torch.export.export(
+            ep = torch.export.export(
                 model, (), kwargs=inputs, dynamic_shapes=use_dyn_not_str(ds), strict=False
             )
+            self.assertEqualAny(expected, ep.module()(**inputs))
 
     @hide_stdout()
     @requires_transformers("4.53")
@@ -36,14 +37,15 @@ def test_mask_generation_with_torch_patches(self):
         data = get_untrained_model_with_inputs(mid, verbose=1, add_second_input=True)
         self.assertEqual(data["task"], "mask-generation")
         model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
-        model(**torch_deepcopy(inputs))
+        expected = model(**torch_deepcopy(inputs))
         model(**data["inputs2"])
         with torch_export_patches(
             patch_torch=True, patch_sympy=True, patch_transformers=True, verbose=1
         ):
-            torch.export.export(
+            ep = torch.export.export(
                 model, (), kwargs=inputs, dynamic_shapes=use_dyn_not_str(ds), strict=False
             )
+            self.assertEqualAny(expected, ep.module()(**inputs))
 
 
 if __name__ == "__main__":
diff --git a/_unittests/ut_tasks/test_tasks_object_detection.py b/_unittests/ut_tasks/test_tasks_object_detection.py
@@ -14,14 +14,15 @@ def test_object_detection(self):
         self.assertEqual(data["task"], "object-detection")
         self.assertIn((data["size"], data["n_weights"]), [(8160384, 2040096)])
         model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
-        model(**inputs)
+        expected = model(**inputs)
         model(**data["inputs2"])
         if not has_transformers("4.51.999"):
             raise unittest.SkipTest("Requires transformers>=4.52")
         with torch_export_patches(patch_transformers=True, verbose=10):
-            torch.export.export(
+            ep = torch.export.export(
                 model, (), kwargs=inputs, dynamic_shapes=use_dyn_not_str(ds), strict=False
             )
+            self.assertEqualAny(expected, ep.module()(**inputs))
 
 
 if __name__ == "__main__":
diff --git a/_unittests/ut_tasks/test_tasks_text_generation.py b/_unittests/ut_tasks/test_tasks_text_generation.py
@@ -10,40 +10,62 @@
 from onnx_diagnostic.torch_models.hghub.model_inputs import get_untrained_model_with_inputs
 from onnx_diagnostic.torch_export_patches import torch_export_patches
 from onnx_diagnostic.torch_export_patches.patch_inputs import use_dyn_not_str
+from onnx_diagnostic.export.shape_helper import make_fake_with_dynamic_dimensions
 
 
 class TestTasksTextGeneration(ExtTestCase):
     @hide_stdout()
     @requires_transformers("4.53")
     @requires_torch("2.7.99")
-    def test_tet_generation_gemma3_for_causallm(self):
+    def test_text_generation_gemma3_for_causallm(self):
         mid = "hf-internal-testing/tiny-random-Gemma3ForCausalLM"
         data = get_untrained_model_with_inputs(mid, verbose=1, add_second_input=True)
         self.assertEqual(data["task"], "text-generation")
         model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
-        model(**torch_deepcopy(inputs))
+        expected = model(**torch_deepcopy(inputs))
         model(**data["inputs2"])
         with torch_export_patches(patch_transformers=True, verbose=10, patch_torch=False):
-            torch.export.export(
+            ep = torch.export.export(
                 model, (), kwargs=inputs, dynamic_shapes=use_dyn_not_str(ds), strict=False
             )
+            self.assertEqualAny(expected, ep.module()(**inputs))
 
     @hide_stdout()
     @requires_transformers("4.53")
     @requires_torch("2.7.99")
-    def test_itext_generation_phi_3_mini_128k_instruct(self):
+    def test_text_generation_phi_3_mini_128k_instruct(self):
         mid = "microsoft/Phi-3-mini-128k-instruct"
         data = get_untrained_model_with_inputs(mid, verbose=1, add_second_input=True)
         self.assertEqual(data["task"], "text-generation")
         model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
-        print("--", self.string_type(inputs, with_shape=True))
-        print("--", self.string_type(ds))
-        model(**torch_deepcopy(inputs))
+        expected = model(**torch_deepcopy(inputs))
         model(**data["inputs2"])
         with torch_export_patches(patch_transformers=True, verbose=10, patch_torch=False):
-            torch.export.export(
+            ep = torch.export.export(
                 model, (), kwargs=inputs, dynamic_shapes=use_dyn_not_str(ds), strict=False
             )
+            self.assertEqualAny(expected, ep.module()(**inputs))
+
+    @hide_stdout()
+    @requires_transformers("4.53")
+    @requires_torch("2.7.99")
+    def test_text_generation_tiny_llm(self):
+        mid = "arnir0/Tiny-LLM"
+        data = get_untrained_model_with_inputs(mid, verbose=1, add_second_input=True)
+        self.assertEqual(data["task"], "text-generation")
+        model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
+        inputs_copied = torch_deepcopy(inputs)
+        expected = model(**torch_deepcopy(inputs))
+        model(**data["inputs2"])
+        fake = make_fake_with_dynamic_dimensions(inputs, dynamic_shapes=ds)[0]
+        with torch_export_patches(patch_transformers=True, verbose=10, patch_torch=False):
+            ep = torch.export.export(
+                model, (), kwargs=fake, dynamic_shapes=use_dyn_not_str(ds), strict=False
+            )
+            # print(ep)
+        got = ep.module()(**inputs_copied)
+        self.assertEqualAny(expected.past_key_values, got.past_key_values)
+        self.assertEqualArray(expected.logits, got.logits)
 
 
 if __name__ == "__main__":
diff --git a/_unittests/ut_tasks/test_tasks_text_to_image.py b/_unittests/ut_tasks/test_tasks_text_to_image.py
@@ -23,12 +23,13 @@ def test_text_to_image(self):
         self.assertEqual(data["task"], "text-to-image")
         self.assertIn((data["size"], data["n_weights"]), [(5708048, 1427012)])
         model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
-        model(**inputs)
+        expected = model(**inputs)
         model(**data["inputs2"])
         with torch_export_patches(patch_transformers=True, verbose=10, stop_if_static=1):
-            torch.export.export(
+            ep = torch.export.export(
                 model, (), kwargs=inputs, dynamic_shapes=use_dyn_not_str(ds), strict=False
             )
+            self.assertEqualAny(expected, ep.module()(**inputs))
 
 
 if __name__ == "__main__":
diff --git a/_unittests/ut_tasks/test_tasks_zero_shot_image_classification.py b/_unittests/ut_tasks/test_tasks_zero_shot_image_classification.py
@@ -15,12 +15,13 @@ def test_zero_shot_image_classification(self):
         self.assertEqual(data["task"], "zero-shot-image-classification")
         self.assertIn((data["size"], data["n_weights"]), [(188872708, 47218177)])
         model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
-        model(**inputs)
+        expected = model(**inputs)
         model(**data["inputs2"])
         with torch_export_patches(patch_transformers=True, verbose=10):
-            torch.export.export(
+            ep = torch.export.export(
                 model, (), kwargs=inputs, dynamic_shapes=use_dyn_not_str(ds), strict=False
             )
+            self.assertEqualAny(expected, ep.module()(**inputs))
 
 
 if __name__ == "__main__":
diff --git a/onnx_diagnostic/export/dynamic_shapes.py b/onnx_diagnostic/export/dynamic_shapes.py
@@ -226,7 +226,7 @@ def _valid_shapes_tensor(cls, inputs, ds):
         for i, d in enumerate(inputs.shape):
             if i in ds and not isinstance(ds[i], int):
                 # dynamic then
-                if d in {0, 1}:
+                if isinstance(d, int) and d in {0, 1}:
                     # export issues for sure
                     issues[i] = f"d=[{d}]"
         return issues if issues else None
diff --git a/onnx_diagnostic/export/shape_helper.py b/onnx_diagnostic/export/shape_helper.py
@@ -215,7 +215,10 @@ def make_fake_with_dynamic_dimensions(
     .. runpython::
         :showcode:
 
-        from onnx_diagnostic.export.dynamic_shapes import make_fake_with_dynamic_dimensions
+        import pprint
+        import torch
+        from onnx_diagnostic.helpers.cache_helper import make_dynamic_cache
+        from onnx_diagnostic.export.shape_helper import make_fake_with_dynamic_dimensions
 
         inputs, _ = make_fake_with_dynamic_dimensions(
             dict(
@@ -245,7 +248,7 @@ def make_fake_with_dynamic_dimensions(
                 ],
             },
         )
-        print(inputs)
+        pprint.pprint(inputs)
     """
     if x is None:
         return None, None
@@ -306,6 +309,8 @@ def make_fake_with_dynamic_dimensions(
         return x, fake_mode
     if hasattr(x, "shape"):
         t = fake_reshape(x, dynamic_shapes, fake_mode=fake_mode)
+        assert t.device == x.device, f"device mismatch {x.device} -> {t.device}"
+        assert t.dtype == x.dtype, f"dtype mismatch {x.dtype} -> {t.dtype}"
         return t, fake_mode
     from ..helpers import string_type
 
diff --git a/onnx_diagnostic/ext_test_case.py b/onnx_diagnostic/ext_test_case.py
@@ -979,7 +979,11 @@ def assertEqualAny(
             else:
                 for e, g in zip(expected, value):
                     self.assertEqualAny(e, g, msg=msg, atol=atol, rtol=rtol)
-        elif expected.__class__.__name__ in ("DynamicCache", "SlidingWindowCache"):
+        elif expected.__class__.__name__ in (
+            "DynamicCache",
+            "SlidingWindowCache",
+            "HybridCache",
+        ):
             self.assertEqual(type(expected), type(value), msg=msg)
             atts = ["key_cache", "value_cache"]
             self.assertEqualAny(
diff --git a/onnx_diagnostic/helpers/cache_helper.py b/onnx_diagnostic/helpers/cache_helper.py
diff --git a/onnx_diagnostic/helpers/fake_tensor_helper.py b/onnx_diagnostic/helpers/fake_tensor_helper.py
diff --git a/onnx_diagnostic/helpers/helper.py b/onnx_diagnostic/helpers/helper.py
diff --git a/onnx_diagnostic/torch_export_patches/patches/patch_torch.py b/onnx_diagnostic/torch_export_patches/patches/patch_torch.py
diff --git a/onnx_diagnostic/torch_models/validate.py b/onnx_diagnostic/torch_models/validate.py