.. _l-patches-explained:

=================
Patches Explained
=================

Function :func:`onnx_diagnostic.torch_export_patches.torch_export_patches`
implements four kinds of patches to make it easier to export a model, usually
coming from :epkg:`transformers`.
All patches take place in :mod:`onnx_diagnostic.torch_export_patches`.

.. code-block:: python

    with torch_export_patches(...) as f:
        ep = torch.export.export(model, args, kwargs=kwargs, dynamic_shapes=dynamic_shapes)

1. **torch fixes**:
   it disables some exceptions or improves some functions related to dynamic shapes
   until :epkg:`torch` addresses the issues
   (see `mostly exporter issues
   <https://github.com/pytorch/pytorch/issues?q=is%3Aissue%20state%3Aopen%20author%3Axadupre>`_)
2. **transformers rewriting**:
   some methods are replaced with a version :func:`torch.export.export` can understand;
   some rewritings may migrate to :epkg:`transformers`, others are applied only
   at export time because they would make the implementation less efficient
3. **cache serialization**: :func:`torch.export.export` needs to know how to
   serialize custom classes such as :class:`transformers.cache_utils.DynamicCache`
4. **control flow rewriting**: control flow (if, for) cannot be exported as is;
   there is still some work to be done to process it automatically, and the
   automated rewriting this package offers is far from perfect.

All of them are triggered by :func:`onnx_diagnostic.torch_export_patches.torch_export_patches`.

.. code-block:: bash

    python -m onnx_diagnostic validate \
        -m hf-tiny-model-private/tiny-random-PLBartForConditionalGeneration \
        --run -v 1 --export onnx-dynamo -o dump_test --dtype float16 --device cuda

All patches can be disabled with ``with torch_export_patches(patch=False)``.

torch fixes
===========

Implemented in :mod:`onnx_diagnostic.torch_export_patches.patches.patch_torch` and triggered with
``with torch_export_patches(patch_sympy=True, patch_torch=True, catch_constraints=True, stop_if_static=1...)``.

It fixes some issues found while exporting models; some of them might not be needed anymore.
It improves shape broadcasting or inserts an exception every time a dynamic dimension
becomes static (``stop_if_static=1``).
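
For instance, the following sketch (``model``, ``args``, ``kwargs`` and
``dynamic_shapes`` are assumed to be defined as in the first snippet) turns a
dynamic dimension silently becoming static into an explicit error:

.. code-block:: python

    import torch
    from onnx_diagnostic.torch_export_patches import torch_export_patches

    # stop_if_static=1 raises as soon as a dimension declared dynamic
    # becomes static during export, pointing at the responsible guard.
    with torch_export_patches(patch_sympy=True, patch_torch=True, stop_if_static=1):
        ep = torch.export.export(model, args, kwargs=kwargs, dynamic_shapes=dynamic_shapes)
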

transformers rewriting
======================

Implemented in :mod:`onnx_diagnostic.torch_export_patches.patches.patch_transformers` and triggered with
``with torch_export_patches(patch_transformers=True)``.

Every patched class is prefixed with ``patched_`` and contains two class attributes:
``_PATCHES_`` contains the list of methods to replace,
``_PATCHED_CLASS_`` is the class patched by this one.

.. code-block:: python

    class patched_AttentionMaskConverter:
        """
        Patches
        ``transformers.modeling_attn_mask_utils.AttentionMaskConverter._make_causal_mask``.
        """

        # This method was fixed in 4.51 at least.
        _PATCHES_ = ["_make_causal_mask"] if not has_transformers("4.48.3") else []
        _PATCHED_CLASS_ = AttentionMaskConverter

The package automatically parses this file to extract the patched methods.
More can be added by populating the argument ``custom_patches``:
``with torch_export_patches(custom_patches=[...])``, as shown in the sketch below.
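
A minimal sketch of such a custom patch; ``MyModule``, its export-friendly
``forward``, ``model`` and ``x`` are hypothetical and only illustrate the
expected structure:

.. code-block:: python

    import torch
    from onnx_diagnostic.torch_export_patches import torch_export_patches
    from my_package import MyModule  # hypothetical class whose method needs patching


    class patched_MyModule:
        # methods of _PATCHED_CLASS_ replaced while the context is active
        _PATCHES_ = ["forward"]
        _PATCHED_CLASS_ = MyModule

        def forward(self, x):
            # hypothetical export-friendly rewriting of MyModule.forward
            return torch.relu(x)


    with torch_export_patches(patch_transformers=True, custom_patches=[patched_MyModule]):
        ep = torch.export.export(model, (x,))
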

Cache serialization
===================

Implemented in :mod:`onnx_diagnostic.torch_export_patches.onnx_export_serialization`.
Any custom class manipulated by a model needs to be registered through
``torch.utils._pytree.register_pytree_node`` or with
:func:`onnx_diagnostic.torch_export_patches.onnx_export_serialization.register_class_serialization`,
triggered by ``with torch_export_patches(patch_transformers=True)``.
That function registers one class;
:func:`onnx_diagnostic.torch_export_patches.onnx_export_serialization.register_cache_serialization`
registers all known classes.
It can be undone with :func:`onnx_diagnostic.torch_export_patches.onnx_export_serialization.unregister`
or :func:`onnx_diagnostic.torch_export_patches.onnx_export_serialization.unregister_cache_serialization`.
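
A sketch of manual registration; it assumes the value returned by
``register_cache_serialization`` is the state expected back by
``unregister_cache_serialization`` (``model``, ``args`` and ``kwargs`` are
placeholders):

.. code-block:: python

    import torch
    from onnx_diagnostic.torch_export_patches.onnx_export_serialization import (
        register_cache_serialization,
        unregister_cache_serialization,
    )

    # Register serialization functions for all known cache classes.
    registered = register_cache_serialization()
    try:
        # torch.export.export can now flatten/unflatten cache inputs.
        ep = torch.export.export(model, args, kwargs=kwargs)
    finally:
        # Undo the registration once the export is done.
        unregister_cache_serialization(registered)
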

.. _l-control-flow-rewriting:

Control flow rewriting
======================

This is an attempt to automatically rewrite control flow using :mod:`ast`.
It is implemented in :mod:`onnx_diagnostic.torch_export_patches.patch_module` and
triggered with ``torch_export_patches(rewrite=<instance of torch.nn.Module>)``.
Option ``dump_rewriting=<folder>`` tells the function to dump all applied
rewritings.
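
A usage sketch (same placeholder names as above):

.. code-block:: python

    import torch
    from onnx_diagnostic.torch_export_patches import torch_export_patches

    # Rewrite the control flow found in the model and dump every applied
    # rewriting into the folder "dump_rewrite" for inspection.
    with torch_export_patches(rewrite=model, dump_rewriting="dump_rewrite"):
        ep = torch.export.export(model, args, kwargs=kwargs, dynamic_shapes=dynamic_shapes)
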

The following example contains the rewriting of method
:meth:`transformers.models.bart.modeling_bart.BartEncoderLayer.forward`.
The list of known rewritings to apply is returned by function
:func:`onnx_diagnostic.torch_export_patches.patch_module_helper.code_needing_rewriting`
and applied by function :func:`onnx_diagnostic.torch_export_patches.patch_module.transform_method`.

While parsing the code, type information is not available, even though
:func:`torch.export.export` knows it. Because of that, the automation usually
needs manual tuning to filter out some tests (argument ``filter_node``) or to
pre- or post-process the rewriting (arguments ``pre_rewriter``, ``post_rewriter``
of function :func:`onnx_diagnostic.torch_export_patches.patch_module.transform_method`).
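
A hedged sketch of a direct call; the positional argument and the fact that
the result can be printed are assumptions based on the parameters listed above:

.. code-block:: python

    from transformers.models.bart.modeling_bart import BartEncoderLayer
    from onnx_diagnostic.torch_export_patches.patch_module import transform_method

    # Rewrite the method; the filter keeps every candidate test here, a real
    # use case would reject the tests that must stay untouched.
    rewritten = transform_method(
        BartEncoderLayer.forward,
        filter_node=lambda node: True,  # assumption: per-node predicate
    )
    print(rewritten)
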

The main entry point is the context manager
:func:`onnx_diagnostic.torch_export_patches.torch_export_rewrite`,
which applies the rewriting and undoes it on exit.
For example, the model :class:`transformers.BartForConditionalGeneration`
requires the following value for parameter ``rewrite``:

.. runpython::
    :showcode:

    from onnx_diagnostic.torch_export_patches.patch_module_helper import (
        code_needing_rewriting,
    )

    print(code_needing_rewriting("BartForConditionalGeneration"))

Applying that rewriting produces the following diff:

.. code-block:: diff

    --- original
    +++ rewritten
    @@ -26,7 +26,6 @@
             hidden_states = nn.functional.dropout(hidden_states, p=self.dropout, training=self.training)
             hidden_states = residual + hidden_states
             hidden_states = self.self_attn_layer_norm(hidden_states)
    -
             residual = hidden_states
             hidden_states = self.activation_fn(self.fc1(hidden_states))
             hidden_states = nn.functional.dropout(
    @@ -37,15 +36,22 @@
             hidden_states = residual + hidden_states
             hidden_states = self.final_layer_norm(hidden_states)

    -        if hidden_states.dtype == torch.float16 and (
    -            torch.isinf(hidden_states).any() or torch.isnan(hidden_states).any()
    -        ):
    +        def branch_cond_then_1(hidden_states):
                 clamp_value = torch.finfo(hidden_states.dtype).max - 1000
                 hidden_states = torch.clamp(hidden_states, min=-clamp_value, max=clamp_value)
    +            return hidden_states.clone()

    +        def branch_cond_else_1(hidden_states):
    +            return hidden_states.clone()
    +
    +        hidden_states = torch.cond(
    +            hidden_states.dtype == torch.float16
    +            and torch.isinf(hidden_states).any() | torch.isnan(hidden_states).any(),
    +            branch_cond_then_1,
    +            branch_cond_else_1,
    +            [hidden_states],
    +        )
             outputs = (hidden_states,)
    -
             if output_attentions:
    -            outputs += (attn_weights,)
    -
    +            outputs = outputs + (attn_weights,)
             return outputs
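
Putting it together, a hedged end-to-end sketch reusing the value computed
above (``model``, ``args``, ``kwargs`` and ``dynamic_shapes`` remain
placeholders):

.. code-block:: python

    import torch
    from onnx_diagnostic.torch_export_patches import torch_export_rewrite
    from onnx_diagnostic.torch_export_patches.patch_module_helper import (
        code_needing_rewriting,
    )

    # Apply the known rewritings for this model, export, then undo them.
    with torch_export_rewrite(rewrite=code_needing_rewriting("BartForConditionalGeneration")):
        ep = torch.export.export(model, args, kwargs=kwargs, dynamic_shapes=dynamic_shapes)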