Adds a helper to convert an onnx model into dot

xadupre · xadupre · commit a6044a2f8dfa · 2025-12-01T09:25:16.000+01:00
diff --git a/_doc/api/helpers/dot_helper.rst b/_doc/api/helpers/dot_helper.rst
@@ -0,0 +1,7 @@
+
+onnx_diagnostic.helpers.dot_helper
+==================================
+
+.. automodule:: onnx_diagnostic.helpers.dot_helper
+    :members:
+    :no-undoc-members:
diff --git a/_doc/api/helpers/index.rst b/_doc/api/helpers/index.rst
@@ -11,6 +11,7 @@ onnx_diagnostic.helpers
     cache_helper
     config_helper
     doc_helper
+    dot_helper
     fake_tensor_helper
     graph_helper
     helper
diff --git a/_doc/recipes/plot_dynamic_shapes_json.py b/_doc/recipes/plot_dynamic_shapes_json.py
@@ -74,7 +74,7 @@ def flatten_unflatten_like_dynamic_shapes(obj):
     start = 0
     end = 0
     subtrees = []
-    for subspec in spec.children_specs:
+    for subspec in spec.children():
         end += subspec.num_leaves
         value = subspec.unflatten(flat[start:end])
         value = flatten_unflatten_like_dynamic_shapes(value)
diff --git a/_unittests/ut_helpers/test_dot_helper.py b/_unittests/ut_helpers/test_dot_helper.py
@@ -0,0 +1,79 @@
+import textwrap
+import unittest
+import onnx
+import onnx.helper as oh
+from onnx_diagnostic.ext_test_case import ExtTestCase
+from onnx_diagnostic.helpers.dot_helper import to_dot
+from onnx_diagnostic.export.api import to_onnx
+from onnx_diagnostic.torch_export_patches import torch_export_patches
+from onnx_diagnostic.torch_models.hghub import get_untrained_model_with_inputs
+
+
+class TestDotHelper(ExtTestCase):  # unit tests for to_dot
+    def test_custom_doc_kernels_layer_normalization(self):  # exact dot text of a two-node graph
+        TFLOAT16 = onnx.TensorProto.FLOAT16
+        model = oh.make_model(
+            oh.make_graph(
+                [
+                    oh.make_node(
+                        "LayerNormalization",
+                        ["X", "W", "B"],
+                        ["ln"],
+                        axis=-1,
+                        epsilon=9.999999974752427e-7,
+                    ),
+                    oh.make_node(  # axis and epsilon are both set, the expected label shows axis only
+                        "Add", ["ln", "W"], ["Z"], axis=-1, epsilon=9.999999974752427e-7
+                    ),
+                ],
+                "dummy",
+                [
+                    oh.make_tensor_value_info("X", TFLOAT16, ["b", "c", "d"]),
+                    oh.make_tensor_value_info("W", TFLOAT16, ["d"]),
+                    oh.make_tensor_value_info("B", TFLOAT16, ["d"]),
+                ],
+                [oh.make_tensor_value_info("Z", TFLOAT16, ["b", "c", "d"])],
+            ),
+            ir_version=9,
+            opset_imports=[oh.make_opsetid("", 18)],
+        )
+        dot = to_dot(model)
+        expected = textwrap.dedent(
+            """
+            digraph {
+              graph [rankdir=TB, splines=true, overlap=false, nodesep=0.2, ranksep=0.2, fontsize=8];
+              node [style="rounded,filled", color="#888888", fontcolor="#222222", shape=box];
+              edge [arrowhead=vee, fontsize=6];
+              I_0 [label="X", fillcolor="#aaeeaa"];
+              I_1 [label="W", fillcolor="#aaeeaa"];
+              I_2 [label="B", fillcolor="#aaeeaa"];
+              LayerNormalization_3 [label="LayerNormalization(., ., ., axis=-1)", fillcolor="#cccccc"];
+              Add_4 [label="Add(., ., axis=-1)", fillcolor="#cccccc"];
+              I_0 -> LayerNormalization_3;
+              I_1 -> LayerNormalization_3;
+              I_2 -> LayerNormalization_3;
+              LayerNormalization_3 -> Add_4 [label="FLOAT16(b,c,d)"];
+              I_1 -> Add_4;
+              O_5 [label="Z", fillcolor="#aaaaee"];
+              Add_4 -> O_5;
+            }
+            """
+        )
+        self.maxDiff = None  # no truncation of the diff when the comparison fails
+        self.assertEqual(expected.strip("\n "), dot.strip("\n "))  # surrounding blanks are ignored
+
+    def test_dot_plot_tiny(self):  # exports arnir0/Tiny-LLM, converts it and dumps the dot text
+        data = get_untrained_model_with_inputs("arnir0/Tiny-LLM")
+        model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
+        with torch_export_patches(patch_transformers=True):
+            em = to_onnx(model, inputs, dynamic_shapes=ds, exporter="custom")
+        dot = to_dot(em.model_proto)
+        name = self.get_dump_file("test_dot_plot_tiny.dot")
+        with open(name, "w") as f:
+            f.write(dot)
+        # to render it: dot -Tpng dump_test/test_dot_plot_tiny.dot -o dump_test/test_dot_plot_tiny.png
+        self.assertIn("-> Add", dot)  # at least one edge must end on a node whose id starts with Add
+
+
+if __name__ == "__main__":
+    unittest.main(verbosity=2)
diff --git a/onnx_diagnostic/helpers/cache_helper.py b/onnx_diagnostic/helpers/cache_helper.py
@@ -80,7 +80,7 @@ def flatten_unflatten_for_dynamic_shapes(
     start = 0
     end = 0
     subtrees = []
-    for subspec in spec.children_specs:
+    for subspec in spec.children():
         end += subspec.num_leaves
         value = subspec.unflatten(flat[start:end])
         value = flatten_unflatten_for_dynamic_shapes(
diff --git a/onnx_diagnostic/helpers/dot_helper.py b/onnx_diagnostic/helpers/dot_helper.py
@@ -0,0 +1,187 @@
+from typing import Set
+import onnx
+from .onnx_helper import onnx_dtype_name, pretty_onnx
+
+
+def _get_hidden_inputs(graph: onnx.GraphProto) -> Set[str]:
+    """
+    Returns the names used by the nodes of a graph (nested subgraphs included)
+    which the graph does not define itself: they come from an enclosing graph.
+    Empty names, which denote omitted optional inputs, are ignored.
+    """
+    hidden = set()
+    known = {i.name for i in graph.initializer} | {i.name for i in graph.input}
+    known |= {i.values.name for i in graph.sparse_initializer}
+    for node in graph.node:
+        # a name counts as known only once a previous node produced it
+        hidden.update(i for i in node.input if i and i not in known)
+        for att in node.attribute:
+            if att.type == onnx.AttributeProto.GRAPH and att.g:
+                # whatever the subgraph misses and this graph has not defined yet
+                hidden |= _get_hidden_inputs(att.g) - known
+        known.update(node.output)
+    return hidden
+
+
+def _make_node_label(node: onnx.NodeProto) -> str:
+    """
+    Builds a node label: operator, a dot per named input, some attributes, constant output.
+    """
+    prefix = f"{node.domain}.\\n{node.op_type}" if node.domain else node.op_type
+    args = ["." if name else "" for name in node.input]
+    for att in node.attribute:
+        if att.name == "to":
+            args.append(f"{att.name}={onnx_dtype_name(att.i)}")
+        elif att.name in {"axis", "value_int", "stash_type"}:
+            args.append(f"{att.name}={att.i}")
+        elif att.name == "value_float":
+            args.append(f"{att.name}={att.f}")
+        elif att.name == "value_floats":
+            args.append(f"{att.name}={att.floats}")
+        elif att.name in {"value_ints", "perm"}:
+            args.append(f"{att.name}={att.ints}")
+    suffix = f" -> {node.output[0]}" if node.op_type == "Constant" else ""
+    return f"{prefix}({', '.join(args)}){suffix}"
+
+
+def to_dot(model: onnx.ModelProto) -> str:
+    """
+    Converts a model into a dot graph.
+
+    :param model: model to draw, shape inference runs first to label edges with types and shapes
+    :return: the graph described with the dot language
+    :raises ValueError: if a node or a subgraph consumes a name the main graph does not define
+
+    Here is an example:
+
+    .. gdot::
+        :script: DOT-SECTION
+        :process:
+
+        from onnx_diagnostic.helpers.dot_helper import to_dot
+        from onnx_diagnostic.export.api import to_onnx
+        from onnx_diagnostic.torch_export_patches import torch_export_patches
+        from onnx_diagnostic.torch_models.hghub import get_untrained_model_with_inputs
+
+        data = get_untrained_model_with_inputs("arnir0/Tiny-LLM")
+        model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
+        with torch_export_patches(patch_transformers=True):
+            em = to_onnx(model, inputs, dynamic_shapes=ds, exporter="custom")
+        dot = to_dot(em.model_proto)
+        print("DOT-SECTION", dot)
+
+    Or this one obtained with :func:`torch.onnx.export`.
+
+    .. gdot::
+        :script: DOT-SECTION
+        :process:
+
+        from onnx_diagnostic.helpers.dot_helper import to_dot
+        from onnx_diagnostic.export.api import to_onnx
+        from onnx_diagnostic.torch_export_patches import torch_export_patches
+        from onnx_diagnostic.torch_models.hghub import get_untrained_model_with_inputs
+
+        data = get_untrained_model_with_inputs("arnir0/Tiny-LLM")
+        model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
+        with torch_export_patches(patch_transformers=True):
+            em = to_onnx(model, kwargs=inputs, dynamic_shapes=ds, exporter="onnx-dynamo")
+        dot = to_dot(em.model_proto)
+        print("DOT-SECTION", dot)
+    """
+    _unique = {}
+
+    def _mkn(obj: object) -> int:
+        # rank of first use, it makes every identifier unique within the graph
+        return _unique.setdefault(id(obj), len(_unique))
+
+    model = onnx.shape_inference.infer_shapes(model)
+
+    op_type_colors = {
+        "Shape": "#eeeeee",
+        "MatMul": "#ee9999",
+        "Transpose": "#ee99ee",
+    }
+
+    edge_label = {}
+    for val in model.graph.value_info:
+        itype = val.type.tensor_type.elem_type
+        if itype == onnx.TensorProto.UNDEFINED:
+            continue
+        dims = [d.dim_param or d.dim_value for d in val.type.tensor_type.shape.dim]
+        # a symbolic name starting with unk is displayed as an unknown dimension
+        sshape = ",".join(
+            "?" if isinstance(d, str) and d.startswith("unk") else str(d) for d in dims
+        )
+        edge_label[val.name] = f"{onnx_dtype_name(itype)}({sshape})"
+
+    rows = [
+        "digraph {",
+        (
+            "  graph [rankdir=TB, splines=true, overlap=false, nodesep=0.2, "
+            "ranksep=0.2, fontsize=8];"
+        ),
+        '  node [style="rounded,filled", color="#888888", fontcolor="#222222", shape=box];',
+        "  edge [arrowhead=vee, fontsize=6];",
+    ]
+    inputs = list(model.graph.input)
+    outputs = list(model.graph.output)
+    nodes = list(model.graph.node)
+    inits = list(model.graph.initializer)
+    name_to_ids = {}
+    for inp in inputs:
+        if not inp.name:
+            continue
+        rows.append(f'  I_{_mkn(inp)} [label="{inp.name}", fillcolor="#aaeeaa"];')
+        name_to_ids[inp.name] = f"I_{_mkn(inp)}"
+    for init in inits:
+        rows.append(f'  i_{_mkn(init)} [label="{init.name}", fillcolor="#cccc00"];')
+        name_to_ids[init.name] = f"i_{_mkn(init)}"
+    for node in nodes:
+        color = op_type_colors.get(node.op_type, "#cccccc")
+        label = _make_node_label(node)
+        rows.append(f'  {node.op_type}_{_mkn(node)} [label="{label}", fillcolor="{color}"];')
+        name_to_ids.update({o: f"{node.op_type}_{_mkn(node)}" for o in node.output if o})
+
+    # edges between nodes, a pair (producer, consumer) is drawn only once
+    done = set()
+    for node in nodes:
+        node_id = f"{node.op_type}_{_mkn(node)}"
+        for i in node.input:
+            if not i:
+                continue
+            if i not in name_to_ids:
+                raise ValueError(f"Unable to find {i!r}\n{pretty_onnx(model)}")
+            edge = name_to_ids[i], node_id
+            if edge in done:
+                continue
+            done.add(edge)
+            lab = edge_label.get(i, "")
+            if lab:
+                lab = f' [label="{lab}"]'
+            rows.append(f"  {edge[0]} -> {edge[1]}{lab};")
+        if node.op_type in {"Scan", "Loop", "If"}:
+            # names the subgraphs borrow from the main graph, drawn as dotted edges
+            unique = set()
+            for att in node.attribute:
+                if att.type == onnx.AttributeProto.GRAPH:
+                    unique |= _get_hidden_inputs(att.g)
+            # sorted for a reproducible output, an empty name is an omitted optional input
+            for i in sorted(unique - {""}):
+                if i not in name_to_ids:
+                    raise ValueError(f"Unable to find {i!r}\n{pretty_onnx(model)}")
+                edge = name_to_ids[i], node_id
+                if edge in done:
+                    continue
+                done.add(edge)
+                rows.append(f"  {edge[0]} -> {edge[1]} [style=dotted];")
+
+    # outputs
+    for out in outputs:
+        if not out.name:
+            continue
+        rows.append(f'  O_{_mkn(out)} [label="{out.name}", fillcolor="#aaaaee"];')
+        edge = name_to_ids[out.name], f"O_{_mkn(out)}"
+        rows.append(f"  {edge[0]} -> {edge[1]};")
+
+    rows.append("}")
+    return "\n".join(rows)
diff --git a/pyproject.toml b/pyproject.toml
@@ -172,6 +172,7 @@ select = [
 "_scripts/compare_model_execution.py" = ["E402", "F401"]
 "_doc/technical/plot_*.py" = ["E402", "B018", "PIE808", "RUF015", "SIM105", "SIM117"]
 "_unittests/*/test*.py" = ["B008", "B904", "PIE808", "SIM117", "SIM105", "UP008"]
+"_unittests/ut_helpers/test_dot_helper.py" = ["E501"]
 "_unittests/ut_tasks/try_export.py" = ["B008", "B904", "E501", "PIE808", "SIM117", "SIM105", "UP008"]
 "onnx_diagnostic/export/__init__.py" = ["F401"]
 "onnx_diagnostic/helpers/__init__.py" = ["F401"]