Skip to content

Commit 3ab855c

Browse files
committed
fix dynamic shapes
1 parent e16edae commit 3ab855c

File tree

7 files changed

+229
-8
lines changed

7 files changed

+229
-8
lines changed

CHANGELOGS.rst

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@ Change Logs
44
0.7.4
55
+++++
66

7-
* :pr:`174`: changes for the next version of onnx
7+
* :pr:`174`: changes for the next version of onnx, fixes all_dynamic_shape_from_inputs
88

99
0.7.3
1010
+++++

_doc/index.rst

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,8 @@ onnx-diagnostic: investigate onnx models
2121
The main feature is about `patches <https://github.com/sdpython/onnx-diagnostic/tree/main/onnx_diagnostic/torch_export_patches>`_:
2222
it helps export **pytorch models into ONNX**, mostly designed for LLMs using dynamic caches.
2323
Sources available at `github/onnx-diagnostic <https://github.com/sdpython/onnx-diagnostic/>`_.
24-
Patches can be enabled as follows:
24+
Patches can be enabled as follows with the function
25+
:func:`onnx_diagnostic.torch_export_patches.torch_export_patches`:
2526

2627
.. code-block:: python
2728
@@ -31,7 +32,8 @@ Patches can be enabled as follows:
3132
ep = torch.export.export(model, args, kwargs=kwargs, dynamic_shapes=dynamic_shapes)
3233
# ...
3334
34-
Dynamic shapes are difficult to guess for caches, one function
35+
Dynamic shapes are difficult to guess for caches; the function
36+
:func:`onnx_diagnostic.export.shape_helper.all_dynamic_shape_from_inputs`
3537
returns a structure defining all dimensions as dynamic.
3638
You need then to remove those which are not dynamic in your model.
3739

_scripts/test_backend_onnxruntime.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -56,7 +56,7 @@ def supports_device(cls, device: str) -> bool:
5656
d = Device(device)
5757
if d == DeviceType.CPU:
5858
return True
59-
if d == DeviceType.GPU:
59+
if d == DeviceType.CUDA:
6060
import torch
6161

6262
return torch.cuda.is_available()
@@ -65,7 +65,7 @@ def supports_device(cls, device: str) -> bool:
6565
@classmethod
6666
def create_inference_session(cls, model, device):
6767
d = Device(device)
68-
if d == DeviceType.GPU:
68+
if d == DeviceType.CUDA:
6969
providers = ["CUDAExecutionProvider"]
7070
elif d == DeviceType.CPU:
7171
providers = ["CPUExecutionProvider"]

_unittests/ut_export/test_shape_helper.py

Lines changed: 138 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -5,10 +5,148 @@
55
all_dynamic_shape_from_inputs,
66
guess_dynamic_shapes_from_inputs,
77
)
8+
from onnx_diagnostic.helpers.cache_helper import (
9+
make_dynamic_cache,
10+
make_sliding_window_cache,
11+
make_encoder_decoder_cache,
12+
make_static_cache,
13+
make_mamba_cache,
14+
)
815
from onnx_diagnostic.torch_models.hghub import get_untrained_model_with_inputs
16+
from onnx_diagnostic.torch_export_patches import torch_export_patches
917

1018

1119
class TestShapeHelper(ExtTestCase):
20+
21+
@requires_transformers("4.52")
22+
@requires_torch("2.7.99")
23+
def test_all_dynamic_shape_from_cache(self):
24+
cache = make_dynamic_cache([(torch.ones((2, 2)), (torch.ones((2, 2)) * 2))])
25+
ds = all_dynamic_shape_from_inputs(cache)
26+
self.assertEqual([[{0: "d_0_0", 1: "d_0_1"}], [{0: "d_1_0", 1: "d_1_1"}]], ds)
27+
28+
@requires_torch("2.7.99")
29+
def test_all_dynamic_shape_all_transformers_cache(self):
30+
caches = [
31+
(
32+
make_dynamic_cache([(torch.ones((2, 2)), (torch.ones((2, 2)) * 2))]),
33+
[[{0: "d_0_0", 1: "d_0_1"}], [{0: "d_1_0", 1: "d_1_1"}]],
34+
),
35+
(
36+
make_encoder_decoder_cache(
37+
make_dynamic_cache(
38+
[
39+
(torch.rand((4, 4, 4)), torch.rand((4, 4, 4))),
40+
(torch.rand((4, 4, 4)), torch.rand((4, 4, 4))),
41+
(torch.rand((4, 4, 4)), torch.rand((4, 4, 4))),
42+
]
43+
),
44+
make_dynamic_cache(
45+
[
46+
(torch.rand((5, 5, 5)), torch.rand((5, 5, 5))),
47+
(torch.rand((5, 5, 5)), torch.rand((5, 5, 5))),
48+
(torch.rand((5, 5, 5)), torch.rand((5, 5, 5))),
49+
]
50+
),
51+
),
52+
[
53+
[
54+
[
55+
{0: "d_0_0", 1: "d_0_1", 2: "d_0_2"},
56+
{0: "d_1_0", 1: "d_1_1", 2: "d_1_2"},
57+
{0: "d_2_0", 1: "d_2_1", 2: "d_2_2"},
58+
],
59+
[
60+
{0: "d_3_0", 1: "d_3_1", 2: "d_3_2"},
61+
{0: "d_4_0", 1: "d_4_1", 2: "d_4_2"},
62+
{0: "d_5_0", 1: "d_5_1", 2: "d_5_2"},
63+
],
64+
],
65+
[
66+
[
67+
{0: "d_6_0", 1: "d_6_1", 2: "d_6_2"},
68+
{0: "d_7_0", 1: "d_7_1", 2: "d_7_2"},
69+
{0: "d_8_0", 1: "d_8_1", 2: "d_8_2"},
70+
],
71+
[
72+
{0: "d_9_0", 1: "d_9_1", 2: "d_9_2"},
73+
{0: "d_10_0", 1: "d_10_1", 2: "d_10_2"},
74+
{0: "d_11_0", 1: "d_11_1", 2: "d_11_2"},
75+
],
76+
],
77+
],
78+
),
79+
(
80+
make_sliding_window_cache(
81+
[
82+
(torch.rand((4, 5, 6, 7)), torch.rand((4, 5, 6, 7))),
83+
(torch.rand((4, 5, 6, 7)), torch.rand((4, 5, 6, 7))),
84+
(torch.rand((4, 5, 6, 7)), torch.rand((4, 5, 6, 7))),
85+
]
86+
),
87+
[
88+
[
89+
{0: "d_0_0", 1: "d_0_1", 2: "d_0_2", 3: "d_0_3"},
90+
{0: "d_1_0", 1: "d_1_1", 2: "d_1_2", 3: "d_1_3"},
91+
{0: "d_2_0", 1: "d_2_1", 2: "d_2_2", 3: "d_2_3"},
92+
],
93+
[
94+
{0: "d_3_0", 1: "d_3_1", 2: "d_3_2", 3: "d_3_3"},
95+
{0: "d_4_0", 1: "d_4_1", 2: "d_4_2", 3: "d_4_3"},
96+
{0: "d_5_0", 1: "d_5_1", 2: "d_5_2", 3: "d_5_3"},
97+
],
98+
],
99+
),
100+
(
101+
make_static_cache(
102+
[
103+
(torch.rand((4, 5, 6, 7)), torch.rand((4, 5, 6, 7))),
104+
(torch.rand((4, 5, 6, 7)), torch.rand((4, 5, 6, 7))),
105+
(torch.rand((4, 5, 6, 7)), torch.rand((4, 5, 6, 7))),
106+
],
107+
max_cache_len=15,
108+
),
109+
[
110+
[
111+
{0: "d_0_0", 1: "d_0_1", 2: "d_0_2", 3: "d_0_3"},
112+
{0: "d_1_0", 1: "d_1_1", 2: "d_1_2", 3: "d_1_3"},
113+
{0: "d_2_0", 1: "d_2_1", 2: "d_2_2", 3: "d_2_3"},
114+
],
115+
[
116+
{0: "d_3_0", 1: "d_3_1", 2: "d_3_2", 3: "d_3_3"},
117+
{0: "d_4_0", 1: "d_4_1", 2: "d_4_2", 3: "d_4_3"},
118+
{0: "d_5_0", 1: "d_5_1", 2: "d_5_2", 3: "d_5_3"},
119+
],
120+
],
121+
),
122+
(
123+
make_mamba_cache(
124+
[
125+
(torch.rand((4, 4, 4)), torch.rand((4, 4, 4))),
126+
(torch.rand((4, 4, 4)), torch.rand((4, 4, 4))),
127+
(torch.rand((4, 4, 4)), torch.rand((4, 4, 4))),
128+
]
129+
),
130+
[
131+
[
132+
{0: "d_0_0", 1: "d_0_1", 2: "d_0_2"},
133+
{0: "d_1_0", 1: "d_1_1", 2: "d_1_2"},
134+
{0: "d_2_0", 1: "d_2_1", 2: "d_2_2"},
135+
],
136+
[
137+
{0: "d_3_0", 1: "d_3_1", 2: "d_3_2"},
138+
{0: "d_4_0", 1: "d_4_1", 2: "d_4_2"},
139+
{0: "d_5_0", 1: "d_5_1", 2: "d_5_2"},
140+
],
141+
],
142+
),
143+
]
144+
with torch_export_patches(patch_transformers=True):
145+
for cache, exds in caches:
146+
with self.subTest(cache=type(cache)):
147+
ds = all_dynamic_shape_from_inputs(cache)
148+
self.assertEqual(exds, ds)
149+
12150
@requires_transformers("4.52")
13151
@requires_torch("2.7.99")
14152
def test_all_dynamic_shape_from_inputs(self):

_unittests/ut_reference/test_backend_onnxruntime_evaluator.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -52,7 +52,7 @@ def supports_device(cls, device: str) -> bool:
5252
d = Device(device)
5353
if d == DeviceType.CPU:
5454
return True
55-
if d == DeviceType.GPU:
55+
if d == DeviceType.CUDA:
5656
import torch
5757

5858
return torch.cuda.is_available()
@@ -61,7 +61,7 @@ def supports_device(cls, device: str) -> bool:
6161
@classmethod
6262
def create_inference_session(cls, model, device):
6363
d = Device(device)
64-
if d == DeviceType.GPU:
64+
if d == DeviceType.CUDA:
6565
providers = ["CUDAExecutionProvider"]
6666
elif d == DeviceType.CPU:
6767
providers = ["CPUExecutionProvider"]

onnx_diagnostic/export/shape_helper.py

Lines changed: 71 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -30,6 +30,77 @@ def all_dynamic_shape_from_inputs(inputs: Any, dim_prefix: Any = "d") -> Any:
3030
)
3131
ds = all_dynamic_shape_from_inputs(inputs)
3232
pprint.pprint(ds)
33+
34+
For this function to work, patches must be enabled if :epkg:`transformers`
35+
does not implement the serialization functions.
36+
37+
.. runpython::
38+
:showcode:
39+
40+
import pprint
41+
import torch
42+
from onnx_diagnostic.helpers.cache_helper import (
43+
make_dynamic_cache,
44+
make_encoder_decoder_cache,
45+
make_mamba_cache,
46+
make_sliding_window_cache,
47+
make_static_cache,
48+
)
49+
from onnx_diagnostic.export.shape_helper import all_dynamic_shape_from_inputs
50+
from onnx_diagnostic.torch_export_patches import torch_export_patches
51+
52+
caches = [
53+
make_dynamic_cache(
54+
[
55+
(torch.rand((4, 4, 4)), torch.rand((4, 4, 4))),
56+
(torch.rand((4, 4, 4)), torch.rand((4, 4, 4))),
57+
(torch.rand((4, 4, 4)), torch.rand((4, 4, 4))),
58+
]
59+
),
60+
make_encoder_decoder_cache(
61+
make_dynamic_cache(
62+
[
63+
(torch.rand((4, 4, 4)), torch.rand((4, 4, 4))),
64+
(torch.rand((4, 4, 4)), torch.rand((4, 4, 4))),
65+
(torch.rand((4, 4, 4)), torch.rand((4, 4, 4))),
66+
]
67+
),
68+
make_dynamic_cache(
69+
[
70+
(torch.rand((5, 5, 5)), torch.rand((5, 5, 5))),
71+
(torch.rand((5, 5, 5)), torch.rand((5, 5, 5))),
72+
(torch.rand((5, 5, 5)), torch.rand((5, 5, 5))),
73+
]
74+
),
75+
),
76+
make_sliding_window_cache(
77+
[
78+
(torch.rand((4, 5, 6, 7)), torch.rand((4, 5, 6, 7))),
79+
(torch.rand((4, 5, 6, 7)), torch.rand((4, 5, 6, 7))),
80+
(torch.rand((4, 5, 6, 7)), torch.rand((4, 5, 6, 7))),
81+
]
82+
),
83+
make_static_cache(
84+
[
85+
(torch.rand((4, 5, 6, 7)), torch.rand((4, 5, 6, 7))),
86+
(torch.rand((4, 5, 6, 7)), torch.rand((4, 5, 6, 7))),
87+
(torch.rand((4, 5, 6, 7)), torch.rand((4, 5, 6, 7))),
88+
],
89+
max_cache_len=15,
90+
),
91+
make_mamba_cache(
92+
[
93+
(torch.rand((4, 4, 4)), torch.rand((4, 4, 4))),
94+
(torch.rand((4, 4, 4)), torch.rand((4, 4, 4))),
95+
(torch.rand((4, 4, 4)), torch.rand((4, 4, 4))),
96+
]
97+
),
98+
]
99+
100+
with torch_export_patches(patch_transformers=True):
101+
for cache in caches:
102+
print(f"-- {cache.__class__.__name__}")
103+
pprint.pprint(all_dynamic_shape_from_inputs(cache))
33104
"""
34105
if isinstance(dim_prefix, str):
35106
prefixes: Set[str] = set()

onnx_diagnostic/helpers/cache_helper.py

Lines changed: 11 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -39,11 +39,21 @@ def flatten_unflatten_for_dynamic_shapes(
3939
subtrees.append(value)
4040
start = end
4141
if use_dict:
42-
if spec.type is dict or spec.context:
42+
if spec.type is dict:
4343
# This a dictionary.
4444
return dict(zip(spec.context, subtrees))
4545
if spec.type is tuple:
4646
return tuple(subtrees)
47+
if spec.type is list:
48+
return list(subtrees)
49+
if spec.context:
50+
# This is a custom class with attributes.
51+
# It is returned as a list.
52+
return list(subtrees)
53+
raise ValueError(
54+
f"Unable to interpret spec type {spec.type} "
55+
f"(type is {type(spec.type)}, context is {spec.context})."
56+
)
4757
# This is a list.
4858
return subtrees
4959

0 commit comments

Comments
 (0)