fix registration issue

xadupre · xadupre · commit 8cb8ec5d1a57 · 2025-03-29T19:23:37.000+01:00
diff --git a/_unittests/ut_torch_export_patches/test_dynamic_class.py b/_unittests/ut_torch_export_patches/test_dynamic_class.py
@@ -1,7 +1,14 @@
 import copy
+import os
 import unittest
+from typing import Any, Dict, List, Tuple
 import torch
-from onnx_diagnostic.ext_test_case import ExtTestCase, ignore_warnings, hide_stdout
+from onnx_diagnostic.ext_test_case import (
+    ExtTestCase,
+    ignore_warnings,
+    hide_stdout,
+    requires_torch,
+)
 from onnx_diagnostic.helpers import string_type
 from onnx_diagnostic.cache_helpers import make_dynamic_cache
 from onnx_diagnostic.torch_export_patches.onnx_export_errors import (
@@ -45,21 +52,12 @@ def forward(self, x, cache):
             expected = model(*inputs)
 
             DYN = torch.export.Dim.DYNAMIC
-            ep = torch.export.export(
-                model,
-                inputs,
-                dynamic_shapes=({0: DYN, 2: DYN}, [[{0: DYN, 2: DYN}], [{0: DYN, 2: DYN}]]),
-                strict=strict,
-            )
-            mod = ep.module()
-            got = mod(*inputs)
-            self.assertEqualArray(expected, got)
 
             # patching
             with bypass_export_some_errors(patch_transformers=True):
                 got = model(*inputs)
                 self.assertEqualArray(expected, got)
-                ep2 = torch.export.export(
+                ep = torch.export.export(
                     model,
                     inputs,
                     dynamic_shapes=(
@@ -68,11 +66,201 @@ def forward(self, x, cache):
                     ),
                     strict=strict,
                 )
-                mod = ep2.module()
+                mod = ep.module()
                 got = mod(*inputs)
                 self.assertEqualArray(expected, got)
 
+                class MyInterpreter(torch.fx.Interpreter):
+                    def call_function(self, target, args, kwargs):
+                        res = super().call_function(target, args, kwargs)
+                        return res
+
+                args, _spec = torch.utils._pytree.tree_flatten(inputs)
+                got = MyInterpreter(ep.module()).run(*args)
+                self.assertEqualAny(expected, got)
+
+    @ignore_warnings(UserWarning)
+    def test_export_mycache_list_cat(self):
+        TreeContext = torch.utils._pytree.Context
+        MappingKey = torch.utils._pytree.MappingKey
+        KeyEntry = torch.utils._pytree.KeyEntry
+
+        class MyCache77:
+            def __init__(self, key=None, value=None):
+                self.key_cache = [key] if key is not None else []
+                self.value_cache = [value] if value is not None else []
+
+        class ModelMyCache(torch.nn.Module):
+            def forward(self, x, dc):
+                y = (
+                    (
+                        torch.cat(dc.key_cache, axis=1) + torch.cat(dc.value_cache, axis=1)
+                    ).reshape((-1, x.shape[1]))
+                ).transpose(1, 0)
+                return x @ y
+
+        inputs = {
+            "x": torch.randn(3, 8),
+            "dc": MyCache77(torch.ones((3, 8, 3, 8)), torch.ones((3, 8, 3, 8))),
+        }
+        model = ModelMyCache()
+        expected = model(**inputs)
+
+        def flatten_my_cache77(cache: MyCache77) -> Tuple[List[Any], TreeContext]:
+            flat = [
+                (k, getattr(cache, k))
+                for k in ["key_cache", "value_cache"]
+                if hasattr(cache, k)
+            ]
+            return [f[1] for f in flat], [f[0] for f in flat]
+
+        def flatten_with_keys_my_cache77(
+            d: Dict[Any, Any],
+        ) -> Tuple[List[Tuple[KeyEntry, Any]], TreeContext]:
+            values, context = flatten_my_cache77(d)
+            return [(MappingKey(k), v) for k, v in zip(context, values)], context
+
+        def unflatten_my_cache_77(
+            values: List[Any], context: TreeContext, output_type=None
+        ) -> MyCache77:
+            cache = MyCache77()
+            values = dict(zip(context, values))
+            for k, v in values.items():
+                setattr(cache, k, v)
+            return cache
+
+        torch.utils._pytree.register_pytree_node(
+            MyCache77,
+            flatten_my_cache77,
+            unflatten_my_cache_77,
+            serialized_type_name="MyCache77",
+            flatten_with_keys_fn=flatten_with_keys_my_cache77,
+        )
+
+        # DYN = torch.export.Dim.DYNAMIC
+        ep = torch.export.export(model, (), kwargs=inputs)
+
+        args, _spec = torch.utils._pytree.tree_flatten(inputs)
+        got = torch.fx.Interpreter(ep.module()).run(*args)
+        self.assertEqualAny(expected, got)
+
+        mod = ep.module()
+        got = mod(**inputs)
+        self.assertEqualArray(expected, got)
+
+    @ignore_warnings(UserWarning)
+    def test_export_mycache_dict_cat(self):
+        TreeContext = torch.utils._pytree.Context
+
+        class MyCache78:
+            def __init__(self, key=None, value=None):
+                self.key_cache = [key] if key is not None else []
+                self.value_cache = [value] if value is not None else []
+
+        class ModelMyCache(torch.nn.Module):
+            def forward(self, x, dc):
+                y = (
+                    (
+                        torch.cat(dc.key_cache, axis=1) + torch.cat(dc.value_cache, axis=1)
+                    ).reshape((-1, x.shape[1]))
+                ).transpose(1, 0)
+                return x @ y
+
+        inputs = {
+            "x": torch.randn(3, 8),
+            "dc": MyCache78(torch.ones((3, 8, 3, 8)), torch.ones((3, 8, 3, 8))),
+        }
+        model = ModelMyCache()
+        expected = model(**inputs)
+
+        def flatten_my_cache78(cache: MyCache78):
+            dictionary = {
+                "key_cache": cache.key_cache,
+                "value_cache": cache.value_cache,
+            }
+            return torch.utils._pytree._dict_flatten(dictionary)
+
+        def flatten_with_keys_my_cache78(cache: MyCache78):
+            dictionary = {
+                "key_cache": cache.key_cache,
+                "value_cache": cache.value_cache,
+            }
+            return torch.utils._pytree._dict_flatten_with_keys(dictionary)
+
+        def unflatten_my_cache_78(values, context: TreeContext, output_type=None) -> MyCache78:
+            dictionary = torch.utils._pytree._dict_unflatten(values, context)
+            cache = MyCache78()
+            for k, v in dictionary.items():
+                setattr(cache, k, v)
+            return cache
+
+        torch.utils._pytree.register_pytree_node(
+            MyCache78,
+            flatten_my_cache78,
+            unflatten_my_cache_78,
+            serialized_type_name="MyCache78",
+            flatten_with_keys_fn=flatten_with_keys_my_cache78,
+        )
+
+        # DYN = torch.export.Dim.DYNAMIC
+        ep = torch.export.export(model, (), kwargs=inputs)
+
+        args, _spec = torch.utils._pytree.tree_flatten(inputs)
+        got = torch.fx.Interpreter(ep.module()).run(*args)
+        self.assertEqualAny(expected, got)
+
+        mod = ep.module()
+        got = mod(**inputs)
+        self.assertEqualArray(expected, got)
+
     @ignore_warnings(UserWarning)
+    def test_export_dynamic_cache_cat(self):
+
+        class ModelDynamicCache(torch.nn.Module):
+            def forward(self, x, dc):
+                y = (
+                    (
+                        torch.cat(dc.key_cache, axis=1) + torch.cat(dc.value_cache, axis=1)
+                    ).reshape((-1, x.shape[1]))
+                ).transpose(1, 0)
+                return x @ y
+
+        inputs = {
+            "x": torch.randn(3, 8),
+            "dc": make_dynamic_cache(
+                [(torch.ones((3, 8, 3, 8)), (torch.ones((3, 8, 3, 8)) * 2))]
+            ),
+        }
+        model = ModelDynamicCache()
+        expected = model(**inputs)
+
+        # DYN = torch.export.Dim.DYNAMIC
+        NOBYPASS = int(os.environ.get("NOBYBASS", "0"))
+        if NOBYPASS:
+            ep = torch.export.export(model, (), kwargs=inputs)
+
+            args, _spec = torch.utils._pytree.tree_flatten(inputs)
+            got = torch.fx.Interpreter(ep.module()).run(*args)
+            self.assertEqualAny(expected, got)
+
+            mod = ep.module()
+            got = mod(**inputs)
+            self.assertEqualArray(expected, got)
+            return
+
+        with bypass_export_some_errors(patch_transformers=True):
+            ep = torch.export.export(model, (), kwargs=inputs)
+
+            args, _spec = torch.utils._pytree.tree_flatten(inputs)
+            got = torch.fx.Interpreter(ep.module()).run(*args)
+            self.assertEqualAny(expected, got)
+
+            mod = ep.module()
+            got = mod(**inputs)
+            self.assertEqualArray(expected, got)
+
+    @ignore_warnings(UserWarning)
+    @requires_torch("2.9")
     def test_phi2_export_module(self):
         data = get_untrained_model_with_inputs("microsoft/phi-2")
         model, inputs, dyn_shapes = data["model"], data["inputs"], data["dynamic_shapes"]
@@ -100,6 +288,7 @@ def test_phi2_export_module(self):
                 dynamic_shapes=dyn_shapes,
                 strict=False,  # True works but then the it fails during the execution
             )
+            # ep = ep.run_decompositions()
             mod = ep.module()
             inputs_copied = copy.deepcopy(inputs)
             self.assertEqual(
@@ -108,15 +297,8 @@ def test_phi2_export_module(self):
             got = mod(**inputs_copied)
             self.assertEqualAny(expected, got)
 
-        inputs_copied = copy.deepcopy(inputs)
-        self.assertEqual(
-            str_inputs, string_type(inputs_copied, with_shape=True, with_min_max=True)
-        )
-        mod = ep.module()
-        got = mod(**inputs_copied)
-        self.assertEqualAny(expected, got)
-
     @ignore_warnings(UserWarning)
+    @requires_torch("2.9")
     def test_phi2_export_interpreter(self):
         data = get_untrained_model_with_inputs("microsoft/phi-2")
         model, inputs, dyn_shapes = data["model"], data["inputs"], data["dynamic_shapes"]
@@ -144,6 +326,7 @@ def test_phi2_export_interpreter(self):
                 dynamic_shapes=dyn_shapes,
                 strict=False,  # True works but then the it fails during the execution
             )
+            # ep = ep.run_decompositions()
 
             # from experimental_experiment.torch_interpreter.tracing import CustomTracer
             # CustomTracer.remove_unnecessary_slices(ep.graph)
diff --git a/onnx_diagnostic/torch_export_patches/onnx_export_errors.py b/onnx_diagnostic/torch_export_patches/onnx_export_errors.py
@@ -100,7 +100,19 @@ def _register_cache_serialization(verbose: int = 0) -> Dict[str, bool]:
             flatten_with_keys_fn=flatten_with_keys_mamba_cache,
         )
 
-    # DynamicCache
+    # DynamicCache serialization is different in transformers and does not
+    # play well with torch.export.export.
+    # See test test_export_dynamic_cache_cat run with NOBYBASS=1 (the variable the test reads)
+    # :: NOBYBASS=1 python _unittests/ut_torch_export_patches/test_dynamic_class.py -k e_c
+    # This is caused by this line:
+    # torch.fx._pytree.register_pytree_flatten_spec(
+    #           DynamicCache, _flatten_dynamic_cache_for_fx)
+    # so DynamicCache is unregistered first if that registration is present.
+    if DynamicCache in torch.fx._pytree.SUPPORTED_NODES:
+        if verbose:
+            print("[_register_cache_serialization] DynamicCache is unregistered first.")
+        _unregister(DynamicCache)
+
     unregistered_dynamic_cache = True
     if DynamicCache is not None and DynamicCache in torch.utils._pytree.SUPPORTED_NODES:
         if verbose > 1: