@@ -1,8 +1,7 @@
 from typing import Any, Dict, List, Set, Optional, Tuple, Union
-from ..helpers import flatten_object
 from ..helpers.cache_helper import flatten_unflatten_for_dynamic_shapes
-from ..helpers.fake_tensor_helper import make_fake
-from .dynamic_shapes import ModelInputs, _flatten_dynamic_shapes
+from ..helpers.fake_tensor_helper import fake_reshape
+from .dynamic_shapes import ModelInputs
 
 
 def all_dynamic_shapes_from_inputs(inputs: Any, dim_prefix: Any = "d") -> Any:
@@ -204,10 +203,10 @@ def guess_dynamic_shapes_from_inputs( |
 
 
 def make_fake_with_dynamic_dimensions(
-    inputs: Any,
+    x: Any,
     dynamic_shapes: Any,
     fake_mode: Optional["FakeTensorMode"] = None,  # noqa: F821
-) -> Any:  # noqa: F821
+) -> Tuple[Any, "FakeTensorMode"]:  # noqa: F821
     """
     Replaces all tensors with fake tensors respecting the same
     constraints as the given dynamic shapes.
@@ -235,19 +234,81 @@ def make_fake_with_dynamic_dimensions( |
                         ),
                     ]
                 ),
-        )
+        ),
+        dynamic_shapes={
+            "input_ids": {0: "batch", 1: "seq_length"},
+            "attention_mask": {0: "batch", 1: "cache+seq"},
+            "position_ids": {0: "batch", 1: "seq_length"},
+            "past_key_values": [
+                [{0: "batch", 2: "cache_length"}, {0: "batch", 2: "cache_length"}],
+                [{0: "batch", 2: "cache_length"}, {0: "batch", 2: "cache_length"}],
+            ],
+        },
     )
     print(inputs)
     """
-    flat_inputs = flatten_object(inputs, drop_keys=True)
-    flat_fake, fake_mode = make_fake(flat_inputs, fake_mode=fake_mode)
-    flat_ds = _flatten_dynamic_shapes(dynamic_shapes)
-    assert len(flat_inputs) == len(flat_ds), (
-        f"Mismatch between the number of input tensor {len(flat_inputs)} "
-        f"and the number of dynamic_shapes {len(flat_ds)}"
+    if x is None:
+        return None, None
+    if fake_mode is None:
+        from torch.fx.experimental.symbolic_shapes import ShapeEnv
+        from torch._subclasses.fake_tensor import FakeTensorMode
+
+        shape_env = ShapeEnv()
+        fake_mode = FakeTensorMode(shape_env=shape_env)
+
+    if isinstance(x, (list, tuple)):
+        return (
+            x.__class__(
+                [
+                    make_fake_with_dynamic_dimensions(
+                        i, fake_mode=fake_mode, dynamic_shapes=ds
+                    )[0]
+                    for i, ds in zip(x, dynamic_shapes)
+                ]
+            ),
+            fake_mode,
+        )
+    if isinstance(x, dict):
+        return {
+            k: make_fake_with_dynamic_dimensions(
+                v, fake_mode=fake_mode, dynamic_shapes=dynamic_shapes[k]
+            )[0]
+            for k, v in x.items()
+        }, fake_mode
+
+    if x.__class__.__name__ in {"DynamicCache", "StaticCache", "HybridCache"}:
+        assert hasattr(x, "layers"), (
+            f"Use a more recent version of transformers (>=4.55), "
+            f"'layers' not found in class {type(x)}"
+        )
+        assert (
+            isinstance(dynamic_shapes, list) and len(dynamic_shapes) == 2
+        ), f"Unexpected dynamic_shapes={dynamic_shapes} for a DynamicCache"
+        for il, layer in enumerate(x.layers):
+            assert hasattr(layer, "keys") and hasattr(layer, "values"), (
+                f"Use a more recent version of transformers (>=4.55), "
+                f"'keys' or 'values' not found in class {type(layer)} ({dir(layer)})"
+            )
+            layer.keys = make_fake_with_dynamic_dimensions(
+                layer.keys, fake_mode=fake_mode, dynamic_shapes=dynamic_shapes[0][il]
+            )[0]
+            layer.values = make_fake_with_dynamic_dimensions(
+                layer.values, fake_mode=fake_mode, dynamic_shapes=dynamic_shapes[1][il]
+            )[0]
+        return x, fake_mode
+    if x.__class__.__name__ == "EncoderDecoderCache":
+        make_fake_with_dynamic_dimensions(
+            x.self_attention_cache, fake_mode=fake_mode, dynamic_shapes=dynamic_shapes[0]
+        )
+        make_fake_with_dynamic_dimensions(
+            x.cross_attention_cache, fake_mode=fake_mode, dynamic_shapes=dynamic_shapes[1]
+        )
+        return x, fake_mode
+    if hasattr(x, "shape"):
+        t = fake_reshape(x, dynamic_shapes, fake_mode=fake_mode)
+        return t, fake_mode
+    from . import string_type
+
+    raise TypeError(
+        f"Unexpected type {type(x)} for x, content is {string_type(x, with_shape=True)}"
     )
-    flat_reshaped = [
-        make_fake_with_dynamic_dimensions(t, sh, true_tensor=t, fake_mode=fake_mode)
-        for t, sh in zip(flat_inputs, flat_fake, flat_ds)
-    ]
-    return flat_reshaped
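
A minimal usage sketch of the rewritten function, which now returns both the faked structure and the FakeTensorMode it used. The import path, shapes, and variable names below are assumptions for illustration, not taken from the diff:

    import torch

    # Hypothetical import path; use the module this diff modifies.
    from dynamic_shapes_module import make_fake_with_dynamic_dimensions

    inputs = {
        "input_ids": torch.randint(0, 1024, (2, 8)),
        "attention_mask": torch.ones((2, 8), dtype=torch.int64),
    }
    dynamic_shapes = {
        "input_ids": {0: "batch", 1: "seq_length"},
        "attention_mask": {0: "batch", 1: "seq_length"},
    }

    # Returns the same nested structure with fake tensors plus the FakeTensorMode used.
    fake_inputs, fake_mode = make_fake_with_dynamic_dimensions(inputs, dynamic_shapes)
    print(fake_inputs)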