Skip to content

Commit fdced7a

Browse files
committed
val
1 parent 1512c22 commit fdced7a

File tree

6 files changed

+164
-29
lines changed

6 files changed

+164
-29
lines changed

_unittests/ut_helpers/test_memory_peak.py

Lines changed: 16 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -31,21 +31,21 @@ def test_spy_cpu(self):
3131
time.sleep(0.005)
3232
n_elements = max(value.shape[0], n_elements)
3333
time.sleep(0.02)
34-
pres = p.stop()
34+
measures = p.stop()
3535
self.assertGreater(n_elements, 0)
36-
self.assertIsInstance(pres, dict)
37-
self.assertLessEqual(pres["cpu"].end, pres["cpu"].max_peak)
38-
self.assertLessEqual(pres["cpu"].begin, pres["cpu"].max_peak)
39-
self.assertGreater(pres["cpu"].begin, 0)
36+
self.assertIsInstance(measures, dict)
37+
self.assertLessEqual(measures["cpu"].end, measures["cpu"].max_peak)
38+
self.assertLessEqual(measures["cpu"].begin, measures["cpu"].max_peak)
39+
self.assertGreater(measures["cpu"].begin, 0)
4040
# Zero should not happen...
41-
self.assertGreaterOrEqual(pres["cpu"].delta_peak, 0)
42-
self.assertGreaterOrEqual(pres["cpu"].delta_peak, pres["cpu"].delta_end)
43-
self.assertGreaterOrEqual(pres["cpu"].delta_peak, pres["cpu"].delta_avg)
44-
self.assertGreaterOrEqual(pres["cpu"].delta_end, 0)
45-
self.assertGreaterOrEqual(pres["cpu"].delta_avg, 0)
41+
self.assertGreaterOrEqual(measures["cpu"].delta_peak, 0)
42+
self.assertGreaterOrEqual(measures["cpu"].delta_peak, measures["cpu"].delta_end)
43+
self.assertGreaterOrEqual(measures["cpu"].delta_peak, measures["cpu"].delta_avg)
44+
self.assertGreaterOrEqual(measures["cpu"].delta_end, 0)
45+
self.assertGreaterOrEqual(measures["cpu"].delta_avg, 0)
4646
# Too unstable.
47-
# self.assertGreater(pres["cpu"].delta_peak, n_elements * 8 * 0.5)
48-
self.assertIsInstance(pres["cpu"].to_dict(), dict)
47+
# self.assertGreater(measures["cpu"].delta_peak, n_elements * 8 * 0.5)
48+
self.assertIsInstance(measures["cpu"].to_dict(), dict)
4949

5050
@skipif_ci_apple("stuck")
5151
@requires_cuda()
@@ -58,10 +58,10 @@ def test_spy_cuda(self):
5858
value += 1
5959
n_elements = max(value.shape[0], n_elements)
6060
time.sleep(0.02)
61-
pres = p.stop()
62-
self.assertIsInstance(pres, dict)
63-
self.assertIn("gpus", pres)
64-
gpu = pres["gpus"][0]
61+
measures = p.stop()
62+
self.assertIsInstance(measures, dict)
63+
self.assertIn("gpus", measures)
64+
gpu = measures["gpus"][0]
6565
self.assertLessEqual(gpu.end, gpu.max_peak)
6666
self.assertLessEqual(gpu.begin, gpu.max_peak)
6767
self.assertGreater(gpu.delta_peak, 0)

_unittests/ut_torch_models/test_test_helpers.py

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
import copy
22
import unittest
33
from onnx_diagnostic.ext_test_case import ExtTestCase
4-
from onnx_diagnostic.torch_models.test_helper import get_inputs_for_task
4+
from onnx_diagnostic.torch_models.test_helper import get_inputs_for_task, validate_model
55
from onnx_diagnostic.torch_models.hghub.model_inputs import get_get_inputs_function_for_tasks
66

77

@@ -15,6 +15,13 @@ def test_get_inputs_for_task(self):
1515
self.assertIn("dynamic_shapes", data)
1616
copy.deepcopy(data["inputs"])
1717

18+
def test_validate_model(self):
19+
mid = "arnir0/Tiny-LLM"
20+
summary, data = validate_model(mid, do_run=True, verbose=2)
21+
self.assertIsInstance(summary, dict)
22+
self.assertIsInstance(data, dict)
23+
validate_model(mid, do_run=True, verbose=2, quiet=True)
24+
1825

1926
if __name__ == "__main__":
2027
unittest.main(verbosity=2)

_unittests/ut_xrun_doc/test_command_lines_exe.py

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -37,9 +37,16 @@ def test_parser_config(self):
3737
def test_parser_validate(self):
3838
st = StringIO()
3939
with redirect_stdout(st):
40+
main(["validate"])
4041
main(["validate", "-t", "text-generation"])
4142
text = st.getvalue()
4243
self.assertIn("dynamic_shapes", text)
44+
st = StringIO()
45+
with redirect_stdout(st):
46+
main(["validate"])
47+
main(["validate", "-m", "arnir0/Tiny-LLM", "--run", "-v", "1"])
48+
text = st.getvalue()
49+
self.assertIn("model_clas", text)
4350

4451

4552
if __name__ == "__main__":

onnx_diagnostic/_command_lines_parser.py

Lines changed: 35 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -233,6 +233,8 @@ def get_parser_validate() -> ArgumentParser:
233233
description=dedent(
234234
"""
235235
Prints out dummy inputs for a particular task or a model id.
236+
If both mid and task are empty, the command line displays the list
237+
of supported tasks.
236238
"""
237239
),
238240
epilog="If the model id is specified, one untrained version of it is instantiated.",
@@ -263,6 +265,19 @@ def get_parser_validate() -> ArgumentParser:
263265
action=BooleanOptionalAction,
264266
help="runs the model to check it runs",
265267
)
268+
parser.add_argument(
269+
"-q",
270+
"--quiet",
271+
default=False,
272+
action=BooleanOptionalAction,
273+
help="catches exceptions, reports them in the summary",
274+
)
275+
parser.add_argument(
276+
"--trained",
277+
default=False,
278+
action=BooleanOptionalAction,
279+
help="validate the trained model (requires downloading)",
280+
)
266281
parser.add_argument(
267282
"-v",
268283
"--verbose",
@@ -274,12 +289,15 @@ def get_parser_validate() -> ArgumentParser:
274289

275290
def _cmd_validate(argv: List[Any]):
276291
from .helpers import string_type
277-
from .torch_models.test_helper import get_inputs_for_task
292+
from .torch_models.test_helper import get_inputs_for_task, validate_model, _ds_clean
293+
from .torch_models.hghub.model_inputs import get_get_inputs_function_for_tasks
278294

279295
parser = get_parser_validate()
280296
args = parser.parse_args(argv[1:])
281-
assert args.task or args.mid, "A model id or a task needs to be specified."
282-
if not args.mid:
297+
if not args.task and not args.mid:
298+
print("-- list of supported tasks:")
299+
print("\n".join(sorted(get_get_inputs_function_for_tasks())))
300+
elif not args.mid:
283301
data = get_inputs_for_task(args.task)
284302
if args.verbose:
285303
print(f"task: {args.task}")
@@ -289,10 +307,20 @@ def _cmd_validate(argv: List[Any]):
289307
print(f" + {k.ljust(max_length)}: {string_type(v, with_shape=True)}")
290308
print("-- dynamic_shapes")
291309
for k, v in data["dynamic_shapes"].items():
292-
vs = str(v).replace("<class 'onnx_diagnostic.torch_models.hghub.model_inputs.", "").replace("'>", "").replace("_DimHint(type=<_DimHintType.DYNAMIC: 3>", "DYNAMIC").replace("_DimHint(type=<_DimHintType.AUTO: 3>", "AUTO")
293-
print(f" + {k.ljust(max_length)}: {vs}")
294-
295-
# validate_model(args.input, verbose=args.verbose, watch=set(args.names.split(",")))
310+
print(f" + {k.ljust(max_length)}: {_ds_clean(v)}")
311+
else:
312+
summary, _data = validate_model(
313+
model_id=args.mid,
314+
task=args.task,
315+
do_run=args.run,
316+
verbose=args.verbose,
317+
quiet=args.quiet,
318+
trained=args.trained,
319+
)
320+
print("")
321+
print("-- summary")
322+
for k, v in sorted(summary.items()):
323+
print(f":{k},{v};")
296324

297325

298326
def get_main_parser() -> ArgumentParser:

onnx_diagnostic/torch_models/hghub/model_inputs.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -147,7 +147,7 @@ def random_input_kwargs(config: Any, task: str) -> Tuple[Dict[str, Any], Callabl
147147
If the configuration is None, the function selects typical dimensions.
148148
"""
149149
fcts = get_get_inputs_function_for_tasks()
150-
assert task in fcts, f"Unsupported task {task!r}, supprted are {sorted(fcts)}"
150+
assert task in fcts, f"Unsupported task {task!r}, supported are {sorted(fcts)}"
151151
if task == "text-generation":
152152
if config is not None:
153153
check_hasattr(
@@ -376,6 +376,7 @@ def get_untrained_model_with_inputs(
376376
res["configuration"] = config
377377
res["size"] = sizes[0]
378378
res["n_weights"] = sizes[1]
379+
res["task"] = task
379380

380381
update = {}
381382
for k, v in res.items():

onnx_diagnostic/torch_models/test_helper.py

Lines changed: 96 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,21 @@
1-
from typing import Any, Dict, Optional, Union
1+
import torch
2+
from typing import Any, Dict, Optional, Tuple, Union
3+
import time
4+
from ..helpers import string_type
5+
from .hghub import get_untrained_model_with_inputs
26
from .hghub.model_inputs import random_input_kwargs
37

48

9+
def _ds_clean(v):
10+
return (
11+
str(v)
12+
.replace("<class 'onnx_diagnostic.torch_models.hghub.model_inputs.", "")
13+
.replace("'>", "")
14+
.replace("_DimHint(type=<_DimHintType.DYNAMIC: 3>", "DYNAMIC")
15+
.replace("_DimHint(type=<_DimHintType.AUTO: 3>", "AUTO")
16+
)
17+
18+
519
def get_inputs_for_task(task: str, config: Optional[Any] = None) -> Dict[str, Any]:
620
"""
721
Returns dummy inputs for a specific task.
@@ -18,12 +32,90 @@ def validate_model(
1832
model_id: str,
1933
task: Optional[str] = None,
2034
do_run: bool = False,
21-
do_export: bool = False,
35+
exporter: Optional[str] = None,
2236
do_same: bool = False,
2337
verbose: int = 0,
24-
) -> Dict[str, Union[int, float, str]]:
38+
dtype: Optional[Union[str, torch.dtype]] = None,
39+
device: Optional[Union[str, torch.device]] = None,
40+
trained: bool = False,
41+
optimization: Optional[str] = None,
42+
quiet: bool = False,
43+
) -> Tuple[Dict[str, Union[int, float, str]], Dict[str, Any]]:
2544
"""
2645
Validates a model.
2746
28-
47+
:param model_id: model id to validate
48+
:param task: task used to generate the necessary inputs,
49+
can be left empty to use the default task for this model
50+
if it can be determined
51+
:param do_run: checks the model works with the defined inputs
52+
:param exporter: exports the model using this exporter,
53+
available list: ``export-strict``, ``export-nostrict``, ``onnx``
54+
:param do_same: checks the discrepancies of the exported model
55+
:param verbose: verbosity level
56+
:param dtype: uses this dtype to check the model
57+
:param device: do the verification on this device
58+
:param trained: use the trained model, not the untrained one
59+
:param optimization: optimization to apply to the exported model,
60+
depends on the exporter
61+
:param quiet: if quiet, catches exception if any issue
62+
:return: two dictionaries, one with some metrics,
63+
another one with whatever the function produces
2964
"""
65+
assert not trained, f"trained={trained} not supported yet"
66+
assert not dtype, f"dtype={dtype} not supported yet"
67+
assert not device, f"device={device} not supported yet"
68+
summary = {}
69+
if verbose:
70+
print(f"[validate_model] validate model id {model_id!r}")
71+
print("[validate_model] get dummy inputs...")
72+
summary["model_id"] = model_id
73+
begin = time.perf_counter()
74+
if quiet:
75+
try:
76+
data = get_untrained_model_with_inputs(model_id, verbose=verbose, task=task)
77+
except Exception as e:
78+
summary["ERR_create"] = e
79+
summary["time_create"] = time.perf_counter() - begin
80+
return summary, {}
81+
else:
82+
data = get_untrained_model_with_inputs(model_id, verbose=verbose, task=task)
83+
summary["time_create"] = time.perf_counter() - begin
84+
for k in ["task", "size", "n_weights"]:
85+
summary[f"model_{k.replace('_','')}"] = data[k]
86+
summary["model_inputs"] = string_type(data["inputs"], with_shape=True)
87+
summary["model_shapes"] = _ds_clean(str(data["dynamic_shapes"]))
88+
summary["model_class"] = data["model"].__class__.__name__
89+
summary["model_config_class"] = data["configuration"].__class__.__name__
90+
summary["model_config"] = str(data["configuration"].to_dict()).replace(" ", "")
91+
summary["model_id"] = model_id
92+
if verbose:
93+
print(f"[validate_model] task={data['task']}")
94+
print(f"[validate_model] size={data['size']}")
95+
print(f"[validate_model] n_weights={data['n_weights']}")
96+
print(f"[validate_model] n_weights={data['n_weights']}")
97+
for k, v in data["inputs"].items():
98+
print(f"[validate_model] +INPUT {k}={string_type(v, with_shape=True)}")
99+
for k, v in data["dynamic_shapes"].items():
100+
print(f"[validate_model] +SHAPE {k}={_ds_clean(v)}")
101+
if do_run:
102+
if verbose:
103+
print("[validate_model] run the model...")
104+
begin = time.perf_counter()
105+
if quiet:
106+
try:
107+
expected = data["model"](**data["inputs"])
108+
except Exception as e:
109+
summary["ERR_run"] = e
110+
summary["time_run"] = time.perf_counter() - begin
111+
return summary, data
112+
else:
113+
expected = data["model"](**data["inputs"])
114+
summary["time_run"] = time.perf_counter() - begin
115+
summary["model_expected"] = string_type(expected, with_shape=True)
116+
if verbose:
117+
print("[validate_model] run the model")
118+
data["expected"] = expected
119+
if verbose:
120+
print("[validate_model] done.")
121+
return summary, data

0 commit comments

Comments
 (0)