Commit d347d7c: Add test_device support for torch
Parent: 918cc50

File tree: 3 files changed, +415 −2 lines

graph_net/torch/test_compiler.py
Lines changed: 3 additions & 2 deletions

@@ -120,6 +120,7 @@ def get_input_dict(args):
 
 def measure_performance(model_call, args, compiler):
     stats = {}
+    outs = model_call()
 
     # Warmup runs
     for _ in range(args.warmup):
@@ -180,9 +181,9 @@ def measure_performance(model_call, args, compiler):
             flush=True,
         )
         e2e_times.append(duration_box.value)
-    stats["e2e"] = test_compiler_utilget_timing_stats(e2e_times)
+    stats["e2e"] = test_compiler_util.get_timing_stats(e2e_times)
 
-    return stats
+    return outs, stats
 
 
 def test_single_model(args):
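This hunk is the enabler for the new script: measure_performance now invokes the model once before the warmup loop and returns those eager outputs together with the timing stats (it also fixes a missing dot in the test_compiler_util call). A minimal sketch of the new call contract, assuming a zero-argument model_call closure; run_and_dump is a hypothetical wrapper, not part of this commit:

    import torch
    from graph_net.torch import test_compiler

    def run_and_dump(model_call, args, compiler, dump_path):
        # measure_performance now returns (outs, stats): the eager outputs
        # captured once up front, plus the timing-stats dict (e.g. stats["e2e"]).
        outs, stats = test_compiler.measure_performance(model_call, args, compiler)
        torch.save(outs, dump_path)  # persist outputs as a device/compiler reference
        return stats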
Lines changed: 200 additions & 0 deletions

@@ -0,0 +1,200 @@
+import argparse
+import importlib.util
+import torch
+import time
+import numpy as np
+import random
+import os
+from pathlib import Path
+from contextlib import redirect_stdout, redirect_stderr
+import json
+import re
+import sys
+import traceback
+
+from graph_net import path_utils
+from graph_net import test_compiler_util
+from graph_net.torch import test_compiler
+
+
+def get_reference_log_path(reference_dir, model_path):
+    model_name = model_path.split("torch_samples/")[-1].replace(os.sep, "_")
+    return os.path.join(reference_dir, f"{model_name}.log")
+
+
+def get_reference_output_path(reference_dir, model_path):
+    model_name = model_path.split("torch_samples/")[-1].replace(os.sep, "_")
+    return os.path.join(reference_dir, f"{model_name}.pth")
+
+
+def test_single_model(args):
+    ref_log = get_reference_log_path(args.reference_dir, args.model_path)
+    ref_dump = get_reference_output_path(args.reference_dir, args.model_path)
+    print(f"Reference log path: {ref_log}", file=sys.stderr, flush=True)
+    print(f"Reference outputs path: {ref_dump}", file=sys.stderr, flush=True)
+
+    with open(ref_log, "w", encoding="utf-8") as log_f:
+        with redirect_stdout(log_f), redirect_stderr(log_f):
+            compiler = test_compiler.get_compiler_backend(args)
+
+            input_dict = test_compiler.get_input_dict(args)
+            model = test_compiler.get_model(args)
+            model.eval()
+
+            test_compiler_util.print_with_log_prompt(
+                "[Config] seed:", args.seed, args.log_prompt
+            )
+
+            test_compiler_util.print_basic_config(
+                args,
+                test_compiler.get_hardward_name(args),
+                test_compiler.get_compile_framework_version(args),
+            )
+
+            success = False
+            time_stats = {}
+            try:
+                compiled_model = compiler(model)
+                model_call = lambda: compiled_model(**input_dict)
+                outputs, time_stats = test_compiler.measure_performance(
+                    model_call, args, compiler
+                )
+                success = True
+            except Exception as e:
+                print(
+                    f"Run model failed: {str(e)}\n{traceback.format_exc()}",
+                    file=sys.stderr,
+                    flush=True,
+                )
+
+            test_compiler_util.print_running_status(args, success)
+            if success:
+                torch.save(outputs, str(ref_dump))
+                test_compiler_util.print_with_log_prompt(
+                    "[Performance][eager]:", json.dumps(time_stats), args.log_prompt
+                )
+
+    with open(ref_log, "r", encoding="utf-8") as f:
+        content = f.read()
+        print(content, file=sys.stderr, flush=True)
+
+
+def test_multi_models(args):
+    test_samples = test_compiler_util.get_allow_samples(args.allow_list)
+
+    sample_idx = 0
+    failed_samples = []
+    module_name = os.path.splitext(os.path.basename(__file__))[0]
+    for model_path in path_utils.get_recursively_model_path(args.model_path):
+        if test_samples is None or os.path.abspath(model_path) in test_samples:
+            print(
+                f"[{sample_idx}] {module_name}, model_path: {model_path}",
+                file=sys.stderr,
+                flush=True,
+            )
+            cmd = " ".join(
+                [
+                    sys.executable,
+                    f"-m graph_net.torch.{module_name}",
+                    f"--model-path {model_path}",
+                    f"--compiler {args.compiler}",
+                    f"--device {args.device}",
+                    f"--warmup {args.warmup}",
+                    f"--trials {args.trials}",
+                    f"--log-prompt {args.log_prompt}",
+                    f"--seed {args.seed}",
+                    f"--reference-dir {args.reference_dir}",
+                ]
+            )
+            cmd_ret = os.system(cmd)
+            # assert cmd_ret == 0, f"{cmd_ret=}, {cmd=}"
+            if cmd_ret != 0:
+                failed_samples.append(model_path)
+            sample_idx += 1
+
+    print(
+        f"Totally {sample_idx} verified samples, failed {len(failed_samples)} samples.",
+        file=sys.stderr,
+        flush=True,
+    )
+    for model_path in failed_samples:
+        print(f"- {model_path}", file=sys.stderr, flush=True)
+
+
+def main(args):
+    assert os.path.isdir(args.model_path)
+    # Support all torch compilers
+    valid_compilers = list(test_compiler.registry_backend.keys())
+    assert (
+        args.compiler in valid_compilers
+    ), f"Compiler must be one of {valid_compilers}"
+    assert args.device in ["cuda", "cpu", "xpu"]
+
+    test_compiler.set_seed(random_seed=args.seed)
+
+    ref_dump_dir = Path(args.reference_dir)
+    ref_dump_dir.mkdir(parents=True, exist_ok=True)
+
+    if path_utils.is_single_model_dir(args.model_path):
+        test_single_model(args)
+    else:
+        test_multi_models(args)
+
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(description="Test compiler performance.")
+    parser.add_argument(
+        "--model-path",
+        type=str,
+        required=True,
+        help="Path to model file(s), each subdirectory containing graph_net.json will be regarded as a model",
+    )
+    parser.add_argument(
+        "--compiler",
+        type=str,
+        required=False,
+        default="inductor",
+        help="Compiler backend to use",
+    )
+    parser.add_argument(
+        "--device",
+        type=str,
+        required=False,
+        default="cuda",
+        help="Device for testing the compiler (e.g., 'cpu' or 'cuda')",
+    )
+    parser.add_argument(
+        "--warmup", type=int, required=False, default=5, help="Number of warmup steps"
+    )
+    parser.add_argument(
+        "--trials", type=int, required=False, default=10, help="Number of timing trials"
+    )
+    parser.add_argument(
+        "--log-prompt",
+        type=str,
+        required=False,
+        default="graph-net-test-device-log",
+        help="Log prompt for performance log filtering.",
+    )
+    parser.add_argument(
+        "--allow-list",
+        type=str,
+        required=False,
+        default=None,
+        help="Path to samples list, each line contains a sample path",
+    )
+    parser.add_argument(
+        "--seed",
+        type=int,
+        required=False,
+        default=123,
+        help="Random seed (default: 123)",
+    )
+    parser.add_argument(
+        "--reference-dir",
+        type=str,
+        required=True,
+        help="Directory to save reference stats log and outputs",
+    )
+    args = parser.parse_args()
+    main(args=args)
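The commit title and the default log prompt suggest this new script is graph_net.torch.test_device (the file path itself is not shown in this diff). Invoked as, e.g., python -m graph_net.torch.test_device --model-path <samples_dir> --compiler inductor --device cuda --reference-dir refs, it writes one <model>.log and <model>.pth pair per sample. Those .pth dumps are what make device verification possible: a later run on another device or compiler can be checked tensor-by-tensor against the reference. A minimal comparison sketch, assuming outputs are a tensor or a tuple/list of tensors; paths and tolerances are illustrative:

    import torch

    # Load reference outputs saved by test_single_model via torch.save
    # (file layout from get_reference_output_path); paths are illustrative.
    ref = torch.load("refs_cuda/some_model.pth", map_location="cpu")
    new = torch.load("refs_xpu/some_model.pth", map_location="cpu")

    # Normalize to lists so single-tensor and tuple outputs compare uniformly.
    ref_list = list(ref) if isinstance(ref, (list, tuple)) else [ref]
    new_list = list(new) if isinstance(new, (list, tuple)) else [new]

    for i, (r, n) in enumerate(zip(ref_list, new_list)):
        # Tolerances are illustrative; tighten or loosen per dtype/hardware.
        ok = torch.allclose(r.float(), n.float(), rtol=1e-3, atol=1e-4)
        print(f"output[{i}]: allclose={ok}")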
