
Commit 0c37bc3

doc
1 parent cc0c5f2 commit 0c37bc3

File tree

4 files changed: +91 -40 lines changed


_doc/cmds/validate.rst

Lines changed: 32 additions & 2 deletions
@@ -18,6 +18,9 @@ exports the model, measures the discrepancies...
 Get the list of supported tasks
 +++++++++++++++++++++++++++++++
 
+The tasks are the same as those defined by :epkg:`HuggingFace`.
+The tool only supports a subset of them.
+
 .. code-block::
 
     python -m onnx_diagnostic validate
@@ -32,6 +35,10 @@ Get the list of supported tasks
 Get the default inputs for a specific task
 ++++++++++++++++++++++++++++++++++++++++++
 
+This returns the dummy inputs for a specific task.
+There may be too many inputs; only those defined by
+the forward method are kept.
+
 .. code-block::
 
     python -m onnx_diagnostic validate -t text-generation
@@ -42,8 +49,12 @@ Get the default inputs for a specific task
 
     main("validate -t text-generation".split())
 
-Validate a model
-++++++++++++++++
+Validate dummy inputs for a model
++++++++++++++++++++++++++++++++++
+
+The dummy inputs may not work for this model and this task.
+The following command line checks that. There is no point in
+exporting if this step fails.
 
 .. code-block::
@@ -54,3 +65,22 @@ Validate a model
     from onnx_diagnostic._command_lines_parser import main
 
     main("validate -m arnir0/Tiny-LLM --run -v 1".split())
+
+Validate and export a model
++++++++++++++++++++++++++++
+
+Exports a model for the given task and checks for discrepancies as well.
+The reported latency comes from a single run. It indicates how long the
+benchmark takes but is far from the latency obtained by running the same
+model multiple times.
+
+.. code-block::
+
+    python -m onnx_diagnostic validate -m arnir0/Tiny-LLM --run -v 1 --export exporter-nostrict -o dump_models --patch
+
+.. runpython::
+
+    from onnx_diagnostic._command_lines_parser import main
+
+    main("validate -m arnir0/Tiny-LLM --run -v 1 --export exporter-nostrict -o dump_models --patch".split())

_unittests/ut_torch_models/test_test_helpers.py

Lines changed: 2 additions & 4 deletions
@@ -39,14 +39,12 @@ def test_validate_model_export(self):
         summary, data = validate_model(
             mid,
             do_run=True,
-            verbose=2,
-            dtype="float32",
-            device="cpu",
+            verbose=10,
             exporter="export-nostrict",
+            dump_folder="dump_test_validate_model_export",
         )
         self.assertIsInstance(summary, dict)
         self.assertIsInstance(data, dict)
-        validate_model(mid, do_run=True, verbose=2, quiet=False)
 
 
 if __name__ == "__main__":
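To run only this updated test locally, something like the following should work, assuming pytest is installed (the file can also be executed directly thanks to its __main__ block):

    python -m pytest _unittests/ut_torch_models/test_test_helpers.py -k test_validate_model_export -v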

onnx_diagnostic/_command_lines_parser.py

Lines changed: 11 additions & 22 deletions
@@ -239,28 +239,10 @@ def get_parser_validate() -> ArgumentParser:
         ),
         epilog="If the model id is specified, one untrained version of it is instantiated.",
     )
-    parser.add_argument(
-        "-m",
-        "--mid",
-        type=str,
-        help="model id, usually <author>/<name>",
-    )
-    parser.add_argument(
-        "-t",
-        "--task",
-        default=None,
-        help="force the task to use",
-    )
-    parser.add_argument(
-        "-e",
-        "--export",
-        help="export the model with this exporter",
-    )
-    parser.add_argument(
-        "-o",
-        "--opt",
-        help="optimization to apply after the export",
-    )
+    parser.add_argument("-m", "--mid", type=str, help="model id, usually <author>/<name>")
+    parser.add_argument("-t", "--task", default=None, help="force the task to use")
+    parser.add_argument("-e", "--export", help="export the model with this exporter")
+    parser.add_argument("--opt", help="optimization to apply after the export")
     parser.add_argument(
         "-r",
         "--run",
@@ -288,6 +270,12 @@ def get_parser_validate() -> ArgumentParser:
         action=BooleanOptionalAction,
         help="validate the trained model (requires downloading)",
     )
+    parser.add_argument(
+        "-o",
+        "--dump-folder",
+        help="if not empty, a folder is created to dump statistics, "
+        "exported program, onnx...",
+    )
     parser.add_argument("-v", "--verbose", default=0, type=int, help="verbosity")
     parser.add_argument("--dtype", help="changes dtype if necessary")
     parser.add_argument("--device", help="changes the device if necessary")
@@ -328,6 +316,7 @@ def _cmd_validate(argv: List[Any]):
         patch=args.patch,
         optimization=args.opt,
         exporter=args.export,
+        dump_folder=args.dump_folder,
     )
     print("")
     print("-- summary --")

onnx_diagnostic/torch_models/test_helper.py

Lines changed: 46 additions & 12 deletions
@@ -1,3 +1,4 @@
+import os
 from typing import Any, Dict, Optional, Tuple, Union
 import time
 import torch
@@ -11,7 +12,7 @@
 def empty(value: Any) -> bool:
     """Tells if the value is empty."""
     if isinstance(value, (str, list, dict, tuple, set)):
-        return value
+        return bool(value)
     if value is None:
         return True
     return False
@@ -22,8 +23,8 @@ def _ds_clean(v):
         str(v)
         .replace("<class 'onnx_diagnostic.torch_models.hghub.model_inputs.", "")
         .replace("'>", "")
-        .replace("_DimHint(type=<_DimHintType.DYNAMIC: 3>", "DYNAMIC")
-        .replace("_DimHint(type=<_DimHintType.AUTO: 3>", "AUTO")
+        .replace("_DimHint(type=<_DimHintType.DYNAMIC: 3>)", "DYNAMIC")
+        .replace("_DimHint(type=<_DimHintType.AUTO: 3>)", "AUTO")
     )
 
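A quick check of the corrected replacement patterns; the input string below is only an example of how a _DimHint repr may appear inside str(dynamic_shapes), it is not taken from a real run.

    s = "{'batch': _DimHint(type=<_DimHintType.DYNAMIC: 3>)}"
    cleaned = (
        s.replace("_DimHint(type=<_DimHintType.DYNAMIC: 3>)", "DYNAMIC")
        .replace("_DimHint(type=<_DimHintType.AUTO: 3>)", "AUTO")
    )
    print(cleaned)  # {'batch': DYNAMIC}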

@@ -52,6 +53,7 @@ def validate_model(
     optimization: Optional[str] = None,
     quiet: bool = False,
     patch: bool = False,
+    dump_folder: Optional[str] = None,
 ) -> Tuple[Dict[str, Union[int, float, str]], Dict[str, Any]]:
     """
     Validates a model.
@@ -72,11 +74,23 @@
         depend on the the exporter
     :param quiet: if quiet, catches exception if any issue
     :param patch: applies patches before exporting
+    :param dump_folder: dumps everything in a subfolder of this one
     :return: two dictionaries, one with some metrics,
         another one with whatever the function produces
     """
     assert not trained, f"trained={trained} not supported yet"
     summary: Dict[str, Union[int, float, str]] = {}
+    if dump_folder:
+        folder_name = f"{model_id.replace('/','-')}-{exporter}-{optimization or ''}"
+        dump_folder = os.path.join(dump_folder, folder_name)
+        if not os.path.exists(dump_folder):
+            os.makedirs(dump_folder)
+        summary["dump_folder"] = dump_folder
+        summary["dump_folder_name"] = folder_name
+        if verbose:
+            print(f"[validate_model] dump into {folder_name!r}")
+    else:
+        folder_name = None
     if verbose:
         print(f"[validate_model] validate model id {model_id!r}")
         print("[validate_model] get dummy inputs...")
@@ -98,15 +112,15 @@
             dtype = getattr(torch, dtype)
         if verbose:
             print(f"[validate_model] dtype conversion to {dtype}")
-        data["model"] = to_any(data["model"], dtype)
-        data["inputs"] = to_any(data["inputs"], dtype)
+        data["model"] = to_any(data["model"], dtype)  # type: ignore
+        data["inputs"] = to_any(data["inputs"], dtype)  # type: ignore
         summary["model_dtype"] = str(dtype)
 
     if not empty(device):
         if verbose:
             print(f"[validate_model] device conversion to {device}")
-        data["model"] = to_any(data["model"], device)
-        data["inputs"] = to_any(data["inputs"], device)
+        data["model"] = to_any(data["model"], device)  # type: ignore
+        data["inputs"] = to_any(data["inputs"], device)  # type: ignore
         summary["model_device"] = str(device)
 
     summary["time_create"] = time.perf_counter() - begin
@@ -156,6 +170,7 @@ def validate_model(
                 f"before: {hash_inputs}\n"
                 f" after: {string_type(data["inputs"], with_shape=True)}"
             )
+
     if exporter:
         print(
             f"[validate_model] export the model with {exporter!r}, "
@@ -164,10 +179,10 @@
     if patch:
         if verbose:
             print("[validate_model] applies patches before exporting")
-        with bypass_export_some_errors(
+        with bypass_export_some_errors(  # type: ignore
             patch_transformers=True, verbose=max(0, verbose - 1)
         ) as modificator:
-            data["inputs_export"] = modificator(data["inputs"])
+            data["inputs_export"] = modificator(data["inputs"])  # type: ignore
 
     if do_run:
         # We run a second time the model to check the patch did not
@@ -230,6 +245,25 @@ def validate_model(
         )
         summary.update(summary_export)
 
+    if dump_folder:
+        if "exported_program" in data:
+            ep = data["exported_program"]
+            if verbose:
+                print(f"[validate_model] dumps exported program in {dump_folder!r}...")
+            with open(os.path.join(dump_folder, f"{folder_name}.ep"), "w") as f:
+                f.write(str(ep))
+            with open(os.path.join(dump_folder, f"{folder_name}.graph"), "w") as f:
+                f.write(str(ep.graph))
+            if verbose:
+                print("[validate_model] done (dump ep)")
+        if verbose:
+            print(f"[validate_model] dumps statistics in {dump_folder!r}...")
+        with open(os.path.join(dump_folder, f"{folder_name}.stats"), "w") as f:
+            for k, v in sorted(summary.items()):
+                f.write(f":{k}:{v};\n")
+        if verbose:
+            print("[validate_model] done (dump)")
+
     if verbose:
         print("[validate_model] done (final)")
     return summary, data
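A hedged sketch of reading back the .stats file written above with the ":{k}:{v};" line format; the path is a made-up example following the dump_folder/folder_name layout.

    stats = {}
    path = "dump_models/arnir0-Tiny-LLM-export-nostrict-/arnir0-Tiny-LLM-export-nostrict-.stats"
    with open(path) as f:
        for line in f:
            line = line.strip().rstrip(";")
            if line.startswith(":"):
                key, _, value = line[1:].partition(":")
                stats[key] = value
    print(stats.get("export_exporter"))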
@@ -281,7 +315,7 @@ def split_args_kwargs(inputs: Any) -> Tuple[Tuple[Any, ...], Dict[str, Any]]:
         return (), inputs
     if isinstance(inputs, tuple) and len(inputs) == 2 and isinstance(inputs[1], dict):
         return inputs
-    assert isinstance(inputs, tuple), f"Unexpectd inputs {string_type(inputs)}"
+    assert isinstance(inputs, tuple), f"Unexpected inputs {string_type(inputs)}"
     return inputs, {}
 
 
@@ -309,7 +343,7 @@ def call_torch_export_export(
     """
     assert "model" in data, f"model is missing from data: {sorted(data)}"
     assert "inputs_export" in data, f"inputs_export is missing from data: {sorted(data)}"
-    summary = {}
+    summary: Dict[str, Union[str, int, float]] = {}
     strict = "nostrict" not in exporter
     args, kwargs = split_args_kwargs(data["inputs_export"])
     ds = data.get("dynamic_shapes", None)
@@ -323,7 +357,7 @@
         print(f"[call_torch_export_export] dynamic_shapes={_ds_clean(ds)}")
         print("[call_torch_export_export] export...")
     summary["export_exporter"] = exporter
-    summary["export_optimization"] = optimization
+    summary["export_optimization"] = optimization or ""
     summary["export_strict"] = strict
     summary["export_args"] = string_type(args, with_shape=True)
     summary["export_kwargs"] = string_type(kwargs, with_shape=True)

0 commit comments