sdpython · sdpython · Mar 24, 2025 · Mar 24, 2025 · Mar 24, 2025 · Mar 24, 2025
diff --git a/CHANGELOGS.rst b/CHANGELOGS.rst
@@ -4,6 +4,7 @@ Change Logs
 0.2.0
 +++++
 
+* :pr:`11`: adds ``ModelInputs`` to guess dynamic shapes
 * :pr:`9`: adds ``OnnxruntimeEvaluator``
 * :pr:`8`: adds ``ExtendedReferenceEvaluator``
 * :pr:`7`: improves function ``investigate_onnxruntime_issue``

diff --git a/README.rst b/README.rst
@@ -25,6 +25,9 @@ onnx-diagnostic: investigate onnx models
 .. image:: https://codecov.io/gh/sdpython/onnx-diagnostic/branch/main/graph/badge.svg?token=Wb9ZGDta8J 
     :target: https://codecov.io/gh/sdpython/onnx-diagnostic
 
+Helps investigating onnx models, exporting modes into onnx.
+See :epkg:`documentation of onnx-diagnostic <https://sdpython.github.io/doc/onnx-diagnostic/dev/>`_.
+
 Getting started
 +++++++++++++++
 
@@ -42,8 +45,10 @@ or
 
 **Enlightening Examples**
 
-* `Use DYNAMIC or AUTO when dynamic shapes has constraints
+* `Use DYNAMIC or AUTO when exporting if dynamic shapes has constraints
   <https://sdpython.github.io/doc/onnx-diagnostic/dev/auto_examples/plot_export_with_dynamic_shapes_auto.html>`_
+* `Export with DynamicCache and dynamic shapes
+  <https://sdpython.github.io/doc/onnx-diagnostic/dev/auto_examples/plot_export_with_dynamic_cache.html>`_
 * `Steel method forward to guess the dynamic shapes
   <https://sdpython.github.io/doc/onnx-diagnostic/dev/auto_examples/plot_export_tiny_llm.html>`_
 * `Running ReferenceEvaluator on a failing model
@@ -95,8 +100,3 @@ Snapshot of usefuls tools
 **max_diff**
 
 Returns the maximum discrancies accross nested containers containing tensors.
-
-Documentation
-+++++++++++++
-
-See `onnx-diagnostic <https://sdpython.github.io/doc/onnx-diagnostic/dev/>`_.
diff --git a/_doc/api/export/dynamic_shapes.rst b/_doc/api/export/dynamic_shapes.rst
@@ -0,0 +1,8 @@
+
+onnx_diagnostic.export.dynamic_shapes
+=====================================
+
+.. automodule:: onnx_diagnostic.export.dynamic_shapes
+    :members:
+    :no-undoc-members:
+    :exclude-members: onnx_diagnostic.export.dynamic_shapes
diff --git a/_doc/api/export/index.rst b/_doc/api/export/index.rst
@@ -0,0 +1,21 @@
+onnx_diagnostic.export
+======================
+
+.. toctree::
+    :maxdepth: 1
+    :caption: modules
+
+    dynamic_shapes
+
+ModelInputs
++++++++++++
+
+.. autoclass:: onnx_diagnostic.dyanmic_shapes.ModelInputs
+    :members:
+
+Other functions
++++++++++++++++
+
+.. automodule:: onnx_diagnostic.export
+    :members:
+    :no-undoc-members:
diff --git a/_doc/api/index.rst b/_doc/api/index.rst
@@ -7,6 +7,7 @@ API of onnx_diagnostic
     :maxdepth: 1
     :caption: submodules
 
+    export/index
     reference/index
     torch_export_patches/index
     torch_models/index

diff --git a/_doc/examples/plot_export_with_dynamic_cache.py b/_doc/examples/plot_export_with_dynamic_cache.py
@@ -0,0 +1,206 @@
+"""
+.. _l-plot-export-with-dynamic-shape:
+
+===========================================
+Export with DynamicCache and dynamic shapes
+===========================================
+
+Every LLMs implemented in :epkg:`trasnformers` use cache.
+One of the most used is :class:`transformers.cache_utils.DynamicCache`.
+The cache size is dynamic to cope with the growing context.
+The example shows a tool which determines the dynamic shapes
+for :func:`torch.export.export` based on a set of valid inputs.
+
+Simple Examples
+===============
+
+We first look at examples playing positional and names parameters
+to understand how :func:`torch.export.export` works.
+
+args
+++++
+"""
+
+import pprint
+import torch
+from onnx_diagnostic.cache_helpers import make_dynamic_cache
+from onnx_diagnostic.helpers import string_type
+from onnx_diagnostic.export import ModelInputs
+
+
+class Model(torch.nn.Module):
+    def forward(self, x, y):
+        return x + y
+
+
+model = Model()
+x = torch.randn((5, 6))
+y = torch.randn((1, 6))
+model(x, y)  # to check it works
+
+ep = torch.export.export(model, (x, y))
+print(ep)
+
+# %%
+# As expected there is no dynamic shapes.
+# We use :class:`onnx_diagnostic.export.ModelInputs`
+# to define them from two set of valid inputs.
+# These inputs must have different value for the dynamic
+# dimensions.
+
+inputs = [(x, y), (torch.randn((7, 8)), torch.randn((1, 8)))]
+mi = ModelInputs(Model(), inputs)
+ds = mi.guess_dynamic_shapes()
+pprint.pprint(ds)
+
+# %%
+# The function returns a tuple with two objets.
+# The first one for the positional arguments, the other one
+# for the named arguments. There is no named argements. We
+# we used the first result to export.
+
+ep = torch.export.export(model, (x, y), dynamic_shapes=ds[0])
+print(ep)
+
+# %%
+# kwargs
+# ++++++
+#
+# We do the same with named argments.
+
+
+class Model(torch.nn.Module):
+    def forward(self, x, y):
+        return x + y
+
+
+model = Model()
+x = torch.randn((5, 6))
+y = torch.randn((1, 6))
+model(x=x, y=y)  # to check it works
+
+# %%
+# Two sets of valid inputs.
+inputs = [dict(x=x, y=y), dict(x=torch.randn((7, 8)), y=torch.randn((1, 8)))]
+mi = ModelInputs(Model(), inputs)
+ds = mi.guess_dynamic_shapes()
+pprint.pprint(ds)
+
+# %%
+# And we export.
+ep = torch.export.export(model, (), kwargs=dict(x=x, y=y), dynamic_shapes=ds[1])
+print(ep)
+
+# %%
+# args and kwargs
+# +++++++++++++++
+#
+# :func:`torch.export.export` does not like having dynami shapes
+# for both args and kwargs. We need to define them using one mechanism.
+
+
+class Model(torch.nn.Module):
+    def forward(self, x, y):
+        return x + y
+
+
+model = Model()
+x = torch.randn((5, 6))
+y = torch.randn((1, 6))
+model(x, y=y)  # to check it works
+
+# %%
+# Two sets of valid inputs with positional and names arguments.
+
+inputs = [((x,), dict(y=y)), ((torch.randn((7, 8)),), dict(y=torch.randn((1, 8))))]
+mi = ModelInputs(Model(), inputs)
+ds = mi.guess_dynamic_shapes()
+pprint.pprint(ds)
+
+# %%
+# This does not work with :func:`torch.export.export` so
+# we use a method to move the positional dynamic shapes to
+# named one. The method relies on the signature of the
+# forward method.
+
+new_args, new_kwargs, new_ds = mi.move_to_kwargs(*mi.inputs[0], ds)
+pprint.pprint(new_ds)
+
+# %%
+# And we export.
+
+ep = torch.export.export(model, new_args, kwargs=new_kwargs, dynamic_shapes=new_ds[1])
+print(ep)
+
+# %%
+# DynamicCache
+# ============
+#
+# :func:`torch.export.export` serializes caches and any custom class
+# if these serialization functions are provided with is the case for
+# :class:`transformers.cache_utils.DynamicCache` and ``transformers>=4.50``.
+# The dynamic shapes must be provided following the serialized form.
+
+
+class Model(torch.nn.Module):
+    def forward(self, cache, z):
+        return (
+            z
+            + cache.key_cache[0]
+            + cache.key_cache[1]
+            + cache.value_cache[0]
+            + cache.value_cache[1]
+        )
+
+
+model = Model()
+
+n_layers = 2
+bsize, nheads, slen, dim = 2, 4, 3, 7
+cache = make_dynamic_cache(
+    [
+        (torch.randn(bsize, nheads, slen, dim), torch.randn(bsize, nheads, slen, dim))
+        for i in range(n_layers)
+    ]
+)
+z = torch.randn((1, 1, 1, 7))
+model(cache, z)  # to check it works.
+
+# %%
+# The cache looks like this:
+
+print(string_type(cache, with_shape=True))
+
+
+# %% Let's create another set of inputs.
+
+cache2 = make_dynamic_cache(
+    [
+        (
+            torch.randn(bsize + 1, nheads, slen + 1, dim + 1),
+            torch.randn(bsize + 1, nheads, slen + 1, dim + 1),
+        )
+        for i in range(n_layers)
+    ]
+)
+inputs = [
+    (cache, z),
+    (cache2, torch.randn((1, 1, 1, 8))),
+]
+
+# %%
+# And the first set of inputs looks like:
+print(string_type(inputs[0], with_shape=True))
+
+# %%
+# We can now compute the dynamic shapes.
+
+mi = ModelInputs(Model(), inputs)
+ds = mi.guess_dynamic_shapes()
+pprint.pprint(ds)
+
+# %%
+# And finally the export.
+
+ep = torch.export.export(model, inputs[0], dynamic_shapes=ds[0], strict=False)
+print(ep)
diff --git a/_doc/examples/plot_export_with_dynamic_shapes_auto.py b/_doc/examples/plot_export_with_dynamic_shapes_auto.py
@@ -1,8 +1,8 @@
 """
 .. _l-plot-sxport-with-dynamio-shapes-auto:
 
-Use DYNAMIC or AUTO when dynamic shapes has constraints
-=======================================================
+Use DYNAMIC or AUTO when exporting if dynamic shapes has constraints
+====================================================================
 
 Settings the dynamic shapes is not always easy.
 Here are a few tricks to make it work.

diff --git a/_doc/index.rst b/_doc/index.rst
@@ -42,6 +42,7 @@ Source are `sdpython/onnx-diagnostic
 
 * :ref:`l-plot-export-cond`
 * :ref:`l-plot-sxport-with-dynamio-shapes-auto`
+* :ref:`l-plot-export-with-dynamic-shape`
 * :ref:`l-plot-tiny-llm-export`
 * :ref:`l-plot-failing-reference-evaluator`
 * :ref:`l-plot-failing-onnxruntime-evaluator`