better doc

xadupre · xadupre · commit 4ed5d8c16532 · 2025-05-20T15:00:59.000+02:00
diff --git a/CHANGELOGS.rst b/CHANGELOGS.rst
@@ -4,6 +4,7 @@ Change Logs
 0.5.0
 +++++
 
+* :pr:`105`: more options to tune control flow rewriting
 * :pr:`104`: add summarization task, add rewrite to command line validate
 * :pr:`101`: first draft to rewrite loops
 * :pr:`100`: implements a context to automatically rewrite methods or function with control flows
diff --git a/_doc/api/torch_export_patches/index.rst b/_doc/api/torch_export_patches/index.rst
@@ -5,6 +5,8 @@ onnx_diagnostic.torch_export_patches
     :maxdepth: 1
     :caption: submodules
 
+    onnx_export_errors
+    onnx_export_serialization
     patches/index
     patch_expressions
     patch_inputs
diff --git a/_doc/api/torch_export_patches/onnx_export_errors.rst b/_doc/api/torch_export_patches/onnx_export_errors.rst
@@ -0,0 +1,8 @@
+
+onnx_diagnostic.torch_export_patches.onnx_export_errors
+=======================================================
+
+.. automodule:: onnx_diagnostic.torch_export_patches.onnx_export_errors
+    :members:
+    :no-undoc-members:
+    :exclude-members: torch_export_patches, register_additional_serialization_functions
diff --git a/_doc/api/torch_export_patches/onnx_export_serialization.rst b/_doc/api/torch_export_patches/onnx_export_serialization.rst
@@ -0,0 +1,7 @@
+
+onnx_diagnostic.torch_export_patches.onnx_export_serialization
+==============================================================
+
+.. automodule:: onnx_diagnostic.torch_export_patches.onnx_export_serialization
+    :members:
+    :no-undoc-members:
diff --git a/_doc/api/torch_export_patches/patch_module_helper.rst b/_doc/api/torch_export_patches/patch_module_helper.rst
@@ -1,8 +1,7 @@
 
-onnx_diagnostic.torch_export_patches.patch_module
-=================================================
+onnx_diagnostic.torch_export_patches.patch_module_helper
+========================================================
 
-.. automodule:: onnx_diagnostic.torch_export_patches.patch_module
+.. automodule:: onnx_diagnostic.torch_export_patches.patch_module_helper
     :members:
     :no-undoc-members:
-    :exclude-members: torch_export_rewrite
diff --git a/_doc/conf.py b/_doc/conf.py
@@ -125,19 +125,22 @@ def linkcode_resolve(domain, info):
     ("py:class", "torch.utils._pytree.Context"),
     ("py:class", "torch.utils._pytree.KeyEntry"),
     ("py:class", "torch.utils._pytree.TreeSpec"),
+    ("py:class", "transformers.BartForConditionalGeneration"),
     ("py:class", "transformers.LlamaConfig"),
     ("py:class", "transformers.cache_utils.Cache"),
     ("py:class", "transformers.cache_utils.DynamicCache"),
     ("py:class", "transformers.cache_utils.EncoderDecoderCache"),
     ("py:class", "transformers.cache_utils.MambaCache"),
     ("py:class", "transformers.cache_utils.SlidingWindowCache"),
     ("py:class", "transformers.configuration_utils.PretrainedConfig"),
+    ("py:class", "transformers.modeling_outputs.BaseModelOutput"),
     ("py:func", "torch.export._draft_export.draft_export"),
     ("py:func", "torch._export.tools.report_exportability"),
     ("py:func", "torch.utils._pytree.register_pytree_node"),
     ("py:meth", "huggingface_hub.HfApi.list_models"),
     ("py:meth", "transformers.AutoConfig.from_pretrained"),
     ("py:meth", "transformers.GenerationMixin.generate"),
+    ("py:meth", "transformers.models.bart.modeling_bart.BartEncoderLayer.forward"),
     ("py:meth", "unittests.TestCase.subTest"),
 ]
 
diff --git a/_doc/index.rst b/_doc/index.rst
@@ -35,6 +35,7 @@ It also implements tools to investigate, validate exported models (ExportedProgr
     :maxdepth: 1
     :caption: Contents
 
+    patches
     api/index
     cmds/index
     auto_examples/index
diff --git a/_doc/patches.rst b/_doc/patches.rst
@@ -0,0 +1,172 @@
+.. _l-patches-explained:
+
+=================
+Patches Explained
+=================
+
+Function :func:`onnx_diagnostic.torch_export_patches.torch_export_patches`
+implements four kinds of patches to make it easier to export a model, usually coming
+from :epkg:`transformers`. All patches take place in :mod:`onnx_diagnostic.torch_export_patches`.
+
+.. code-block:: python
+
+    with torch_export_patches(...) as f:
+        ep = torch.export.export(model, args, kwargs=kwargs, dynamic_shapes=dynamic_shapes)
+
+1. **torch fixes**:
+   it disables some exceptions or improves some functions related to dynamic shapes
+   until :epkg:`torch` addresses the issues
+   (see `mostly exporter issues
+   <https://github.com/pytorch/pytorch/issues?q=is%3Aissue%20state%3Aopen%20author%3Axadupre>`_)
+2. **transformers rewriting**:
+   some methods are replaced with a version :func:`torch.export.export` can understand,
+   some rewriting may migrate to :epkg:`transformers`, others are applied only
+   at export time because it would make the implementation less efficient
+3. **cache serialization**: :func:`torch.export.export` needs to know how to
+   serialize custom classes such as :class:`transformers.cache_utils.DynamicCache`
+4. **control flow rewriting**: control flow (if, for) cannot be exported as is;
+   there is still some work to be done to automatically process it.
+   This package offers some automated rewriting, but it is far from being perfect.
+
+All of them are triggered by :func:`onnx_diagnostic.torch_export_patches.torch_export_patches`.
+
+.. code-block:: bash
+
+    python -m onnx_diagnostic validate \
+        -m hf-tiny-model-private/tiny-random-PLBartForConditionalGeneration \
+        --run -v 1 --export onnx-dynamo -o dump_test --dtype float16 --device cuda
+
+
+All patches can be disabled with ``with torch_export_patches(patch=False)``.
+
+torch fixes
+===========
+
+Implemented in :mod:`onnx_diagnostic.torch_export_patches.patches.patch_torch` and triggered with
+``with torch_export_patches(patch_sympy=True, patch_torch=True, catch_constraints=True, stop_if_static=1...)``.
+
+It fixes some issues found while exporting a model. Some of them might not be needed anymore.
+It improves shape broadcasting or inserts an exception every time a dynamic dimension
+becomes static (``stop_if_static=1``).
+
+transformers rewriting
+======================
+
+Implemented in :mod:`onnx_diagnostic.torch_export_patches.patches.patch_transformers` and triggered with
+``with torch_export_patches(patch_transformers=True)``.
+
+Every patched class is prefixed with ``patched_``. It contains two class attributes.
+``_PATCHES_`` contains the list of methods to replace.
+``_PATCHED_CLASS_`` is the class patched by this one.
+
+.. code-block:: python
+
+    class patched_AttentionMaskConverter:
+        """
+        Patches
+        ``transformers.modeling_attn_mask_utils.AttentionMaskConverter._make_causal_mask``.
+        """
+
+        # This method was fixed in 4.51 at least.
+        _PATCHES_ = ["_make_causal_mask"] if not has_transformers("4.48.3") else []
+        _PATCHED_CLASS_ = AttentionMaskConverter
+
+The package automatically parses this file to extract the patched methods.
+More can be added by populating the argument ``custom_patches``:
+``with torch_export_patches(custom_patches=[...])``.
+
+Cache serialization
+===================
+
+Implemented in :mod:`onnx_diagnostic.torch_export_patches.onnx_export_serialization`.
+Any custom class manipulated by a model needs to be registered through
+``torch.utils._pytree.register_pytree_node`` or with
+:func:`onnx_diagnostic.torch_export_patches.onnx_export_serialization.register_class_serialization`
+and triggered by ``with torch_export_patches(patch_transformers=True)``.
+That function registers one class,
+:func:`onnx_diagnostic.torch_export_patches.onnx_export_serialization.register_cache_serialization`
+registers all known classes.
+It can be undone with :func:`onnx_diagnostic.torch_export_patches.onnx_export_serialization.unregister`
+or :func:`onnx_diagnostic.torch_export_patches.onnx_export_serialization.unregister_cache_serialization`.
+
+.. _l-control-flow-rewriting:
+
+Control flow rewriting
+======================
+
+This is an attempt to automatically rewrite control flow using :mod:`ast`.
+It is implemented in :mod:`onnx_diagnostic.torch_export_patches.patch_module` and
+triggered with ``with torch_export_patches(rewrite=<instance of torch.nn.Module>)``.
+Option ``dump_rewriting=<folder>`` tells the function to dump all applied
+rewritings.
+
+The following example contains the rewriting of method
+:meth:`transformers.models.bart.modeling_bart.BartEncoderLayer.forward`.
+The list of known rewritings to apply is returned by function
+:func:`onnx_diagnostic.torch_export_patches.patch_module_helper.code_needing_rewriting`
+and applied by function :func:`onnx_diagnostic.torch_export_patches.patch_module.transform_method`.
+
+The parser does not have type information while processing the code, but
+:func:`torch.export.export` does. Due to that, the automation usually needs manual tuning
+to filter out some tests (argument ``filter_node``) or pre/post processing
+(arguments ``pre_rewriter``, ``post_rewriter``) of function
+:func:`onnx_diagnostic.torch_export_patches.patch_module.transform_method`.
+
+The main entry point is the context
+:func:`onnx_diagnostic.torch_export_patches.torch_export_rewrite`
+which rewrites and undoes the rewriting.
+For example, the model :class:`transformers.BartForConditionalGeneration`
+requires the following value for parameter ``rewrite``:
+
+.. runpython::
+    :showcode:
+
+    from onnx_diagnostic.torch_export_patches.patch_module_helper import (
+        code_needing_rewriting,
+    )
+
+    print(code_needing_rewriting("BartForConditionalGeneration"))    
+
+And that produces:
+
+.. code-block:: diff
+
+    --- original
+    +++ rewritten
+    @@ -26,7 +26,6 @@
+        hidden_states = nn.functional.dropout(hidden_states, p=self.dropout, training=self.training)
+        hidden_states = residual + hidden_states
+        hidden_states = self.self_attn_layer_norm(hidden_states)
+    -
+        residual = hidden_states
+        hidden_states = self.activation_fn(self.fc1(hidden_states))
+        hidden_states = nn.functional.dropout(
+    @@ -37,15 +36,22 @@
+        hidden_states = residual + hidden_states
+        hidden_states = self.final_layer_norm(hidden_states)
+    
+    -    if hidden_states.dtype == torch.float16 and (
+    -        torch.isinf(hidden_states).any() or torch.isnan(hidden_states).any()
+    -    ):
+    +    def branch_cond_then_1(hidden_states):
+            clamp_value = torch.finfo(hidden_states.dtype).max - 1000
+            hidden_states = torch.clamp(hidden_states, min=-clamp_value, max=clamp_value)
+    +        return hidden_states.clone()
+    
+    +    def branch_cond_else_1(hidden_states):
+    +        return hidden_states.clone()
+    +
+    +    hidden_states = torch.cond(
+    +        hidden_states.dtype == torch.float16
+    +        and torch.isinf(hidden_states).any() | torch.isnan(hidden_states).any(),
+    +        branch_cond_then_1,
+    +        branch_cond_else_1,
+    +        [hidden_states],
+    +    )
+        outputs = (hidden_states,)
+    -
+        if output_attentions:
+    -        outputs += (attn_weights,)
+    -
+    +        outputs = outputs + (attn_weights,)
+        return outputs
diff --git a/onnx_diagnostic/torch_export_patches/__init__.py b/onnx_diagnostic/torch_export_patches/__init__.py
@@ -16,6 +16,6 @@ def register_flattening_functions(verbose: int = 0):
     This is needed whenever a model must be exported through
     :func:`torch.export.export`.
     """
-    from .onnx_export_serialization import _register_cache_serialization
+    from .onnx_export_serialization import register_cache_serialization
 
-    return _register_cache_serialization(verbose=verbose)
+    return register_cache_serialization(verbose=verbose)
diff --git a/onnx_diagnostic/torch_export_patches/onnx_export_errors.py b/onnx_diagnostic/torch_export_patches/onnx_export_errors.py
@@ -1,8 +1,8 @@
 import contextlib
 from typing import Any, Callable, Dict, List, Optional
 from .onnx_export_serialization import (
-    _register_cache_serialization,
-    _unregister_cache_serialization,
+    register_cache_serialization,
+    unregister_cache_serialization,
 )
 from .patches import patch_transformers as patch_transformers_list
 
@@ -85,11 +85,11 @@ def register_additional_serialization_functions(
 ) -> Callable:
     """The necessary modifications to run the fx Graph."""
     fct_callable = replacement_before_exporting if patch_transformers else (lambda x: x)
-    done = _register_cache_serialization(verbose=verbose)
+    done = register_cache_serialization(verbose=verbose)
     try:
         yield fct_callable
     finally:
-        _unregister_cache_serialization(done, verbose=verbose)
+        unregister_cache_serialization(done, verbose=verbose)
 
 
 @contextlib.contextmanager
@@ -107,6 +107,7 @@ def torch_export_patches(
 ) -> Callable:
     """
     Tries to bypass some situations :func:`torch.export.export` does not support.
+    See also :ref:`l-patches-explained`.
 
     :param patch_sympy: fix missing method ``name`` for IntegerConstant
     :param patch_torch: patches :epkg:`torch` with supported implementation
@@ -206,11 +207,11 @@ def torch_export_patches(
                 pass
     elif not patch:
         fct_callable = lambda x: x  # noqa: E731
-        done = _register_cache_serialization(verbose=verbose)
+        done = register_cache_serialization(verbose=verbose)
         try:
             yield fct_callable
         finally:
-            _unregister_cache_serialization(done, verbose=verbose)
+            unregister_cache_serialization(done, verbose=verbose)
     else:
         import torch
         import torch._export.non_strict_utils  # produce_guards_and_solve_constraints
@@ -226,7 +227,7 @@ def torch_export_patches(
         # caches
         ########
 
-        cache_done = _register_cache_serialization(verbose=verbose)
+        cache_done = register_cache_serialization(verbose=verbose)
 
         #############
         # patch sympy
@@ -439,7 +440,7 @@ def torch_export_patches(
             # caches
             ########
 
-            _unregister_cache_serialization(cache_done, verbose=verbose)
+            unregister_cache_serialization(cache_done, verbose=verbose)
 
 
 def replacement_before_exporting(args: Any) -> Any:
diff --git a/onnx_diagnostic/torch_export_patches/onnx_export_serialization.py b/onnx_diagnostic/torch_export_patches/onnx_export_serialization.py
diff --git a/onnx_diagnostic/torch_export_patches/patch_module.py b/onnx_diagnostic/torch_export_patches/patch_module.py
diff --git a/onnx_diagnostic/torch_models/test_helper.py b/onnx_diagnostic/torch_models/test_helper.py