 import argparse
 import os
 import json
-import re
-
-
-def read_speedups_from_log(log_file):
-    speedups = []
-    try:
-        with open(log_file, "r") as f:
-            for line in f:
-                match = re.search(
-                    r"duration.*eager:\s*(\d+\.?\d*).*compiled:\s*(\d+\.?\d*)", line
-                )
-                if match:
-                    eager_time = float(match.group(1))
-                    compiled_time = float(match.group(2))
-                    if compiled_time > 0:
-                        speedups.append(eager_time / compiled_time)
-    except FileNotFoundError:
-        print(f"Error: Log file not found -> {log_file}")
-        return []
-    return speedups
-
-
-def read_speedups_from_json(benchmark_path):
-    speedups = []
+from collections import defaultdict
+
+
+def parse_filename(filename):
+    """
+    Parses the model name and compiler name from a JSON filename.
+    Assumes filename format: <model_name>_<compiler_name>.json
+    """
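+    # Illustrative example (hypothetical filename): "resnet50_fp16_inductor.json"
+    # yields model "resnet50_fp16" and compiler "inductor"; everything before
+    # the last underscore is treated as the model name.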
+    parts = os.path.splitext(filename)[0].split("_")
+    if len(parts) < 2:
+        return None, None
+    compiler = parts[-1]
+    model = "_".join(parts[:-1])
+    return model, compiler
+
+
+def read_all_speedups(benchmark_path):
+    """
+    Recursively finds all .json files in a given path, extracts the speedup values,
+    and organizes them by compiler and category (subdirectory).
+    """
+    data_by_compiler_category = defaultdict(lambda: defaultdict(list))
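+    # Nested mapping: compiler -> category -> list of raw speedups, e.g.
+    # {"inductor": {"torchbench": [1.8, 2.1]}} (names and values illustrative).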
+    all_compilers = set()
+
     if not os.path.exists(benchmark_path):
         print(f"Error: Path does not exist -> {benchmark_path}")
-        return []
-
-    try:
-        for root, _, files in os.walk(benchmark_path):
-            for file in files:
-                if file.endswith(".json"):
-                    json_file = os.path.join(root, file)
-                    try:
-                        with open(json_file, "r") as f:
-                            data = json.load(f)
-                            if (
-                                "performance" in data
-                                and "speedup" in data["performance"]
-                            ):
-                                speedups.append(data["performance"]["speedup"])
-                            else:
-                                print(
-                                    f"Warning: Invalid JSON format (missing 'performance.speedup') -> {json_file}"
-                                )
-                    except json.JSONDecodeError:
-                        print(f"Error: Invalid JSON file -> {json_file}")
-                        continue
-    except Exception as e:
-        print(f"Unexpected error: {str(e)}")
-        return []
+        return {}, []
 
-    return speedups
+    for root, _, files in os.walk(benchmark_path):
+        for file in files:
+            if file.endswith(".json"):
+                _, compiler = parse_filename(file)
+                if not compiler:
+                    continue
 
+                all_compilers.add(compiler)
 
-def analysis(args):
-    compilers = ["CINN", "torch.inductor", "tvm", "XLA", "TensorRT", "BladeDISC"]
-    num_samples_per_compiler = 200
-    data = {"Compiler": [], "log2(speedup)": []}
-
-    # A: CINN (Simulate)
-    # data["log2(speedup)"].extend(
-    #     np.random.normal(loc=0.35, scale=0.2, size=num_samples_per_compiler)
-    # )
-    # data["Compiler"].extend(["CINN"] * num_samples_per_compiler)
-
-    # B: torch.inductor
-    # inductor_log = os.path.join(args.test_compiler_log_file)
-    # inductor_speedup = read_speedups_from_log(inductor_log)
-    inductor_speedup = read_speedups_from_json(args.benchmark_path)
-    print(f"Find {len(inductor_speedup)} samples.")
-    log2_speedups = np.log2(inductor_speedup)
-
-    mask = log2_speedups <= 2
-    filtered_log2_speedups = log2_speedups[mask]
-    filtered_count = len(filtered_log2_speedups)
-    print(
-        f"After filtering, {filtered_count} samples remain (removed {len(log2_speedups) - filtered_count} outliers)."
-    )
+                category = os.path.relpath(root, benchmark_path)
+                if category == ".":
+                    category = os.path.basename(benchmark_path)
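+                # e.g. <benchmark-path>/torchbench/model_x.json gives category
+                # "torchbench" (illustrative); files directly under the root
+                # fall back to the root directory's own name.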
 
-    data["log2(speedup)"].extend(filtered_log2_speedups)
-    data["Compiler"].extend(["torch.inductor"] * len(filtered_log2_speedups))
-    # data["log2(speedup)"].extend(log2_speedups)
-    # data["Compiler"].extend(["torch.inductor"] * len(log2_speedups))
-
-    # C: tvm (Simulate)
-    # data["log2(speedup)"].extend(
-    #     np.random.normal(loc=0.3, scale=0.15, size=num_samples_per_compiler)
-    # )
-    # data["Compiler"].extend(["tvm"] * num_samples_per_compiler)
-
-    # D: XLA (Simulate)
-    # data["log2(speedup)"].extend(
-    #     np.concatenate(
-    #         [
-    #             np.random.normal(
-    #                 loc=-0.5, scale=0.1, size=int(num_samples_per_compiler * 0.6)
-    #             ),
-    #             np.random.normal(
-    #                 loc=0.2, scale=0.2, size=int(num_samples_per_compiler * 0.4)
-    #             ),
-    #         ]
-    #     )
-    # )
-    # data["Compiler"].extend(["XLA"] * num_samples_per_compiler)
-
-    # E: TensorRT (Simulate)
-    # data["log2(speedup)"].extend(
-    #     np.random.normal(loc=0.5, scale=0.1, size=num_samples_per_compiler)
-    # )
-    # data["Compiler"].extend(["TensorRT"] * num_samples_per_compiler)
-
-    # F: BladeDISC (Simulate)
-    # data["log2(speedup)"].extend(
-    #     np.random.normal(loc=0.05, scale=0.3, size=num_samples_per_compiler)
-    # )
-    # data["Compiler"].extend(["BladeDISC"] * num_samples_per_compiler)
-
-    df = pd.DataFrame(data)
-    df["Compiler"] = pd.Categorical(df["Compiler"], categories=compilers, ordered=True)
+                json_file = os.path.join(root, file)
+                try:
+                    with open(json_file, "r") as f:
+                        data = json.load(f)
+                        speedup_data = data.get("performance", {}).get("speedup")
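+                        # Expected layouts (values illustrative):
+                        #   {"performance": {"speedup": {"e2e": 1.8, "gpu": 2.1}}}
+                        #   {"performance": {"speedup": 1.8}}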
 
+                        if isinstance(speedup_data, dict):
+                            # Newer format: speedup is a dict with "e2e"/"gpu" keys
+                            if "e2e" in speedup_data:
+                                data_by_compiler_category[compiler][category].append(
+                                    speedup_data["e2e"]
+                                )
+                            elif "gpu" in speedup_data:
+                                data_by_compiler_category[compiler][category].append(
+                                    speedup_data["gpu"]
+                                )
+                        elif isinstance(speedup_data, (int, float)):
+                            # Older format: speedup is a bare number
+                            data_by_compiler_category[compiler][category].append(
+                                speedup_data
+                            )
+
+                except (json.JSONDecodeError, KeyError) as e:
+                    print(
+                        f"Warning: Failed to read or parse file -> {json_file}, Error: {e}"
+                    )
+                    continue
+
+    return data_by_compiler_category, sorted(all_compilers)
+
+
+def plot_summary_comparison(df, all_compilers, output_dir):
+    """
+    Generates a summary plot comparing the overall performance of all compilers.
+    """
+    plt.figure(figsize=(12, 7))
     sns.set_theme(style="whitegrid")
-    plt.figure(figsize=(10, 6))
 
     ax = sns.violinplot(
         x="Compiler",
         y="log2(speedup)",
         data=df,
-        order=compilers,
+        order=all_compilers,
         color="white",
         linewidth=0.8,
         inner=None,
@@ -143,7 +98,7 @@ def analysis(args):
         x="Compiler",
         y="log2(speedup)",
         data=df,
-        order=compilers,
+        order=all_compilers,
         showcaps=False,
         boxprops={"facecolor": "royalblue", "edgecolor": "black"},
         medianprops={"color": "white", "linewidth": 2},
@@ -153,15 +108,128 @@ def analysis(args):
         ax=ax,
     )
 
+    sample_counts = df["Compiler"].value_counts().to_dict()
+    x_labels = [
+        f"{compiler}\n({sample_counts.get(compiler, 0)} samples)"
+        for compiler in all_compilers
+    ]
+
     ax.set_ylabel("log2(speedup)", fontsize=14)
     ax.set_xlabel("")
-    x_labels = [f"{chr(65 + i)}\n{compiler}" for i, compiler in enumerate(compilers)]
-    ax.set_xticks(ticks=range(len(x_labels)), labels=x_labels, fontsize=12)
-    ax.tick_params(axis="y", colors="black")
+    ax.set_xticks(ticks=range(len(x_labels)))
+    ax.set_xticklabels(x_labels, rotation=45, ha="right", fontsize=11)
+    ax.set_title("Overall Compiler Performance Comparison", fontsize=16)
+
     sns.despine(trim=True, left=True)
 
-    plt.savefig(args.output_file, dpi=300, bbox_inches="tight")
-    print(f"Figure saved to {args.output_file}")
+    output_file = os.path.join(output_dir, "summary_speedup_comparison.png")
+    plt.savefig(output_file, dpi=300, bbox_inches="tight")
+    print(f"\nSummary comparison plot saved to: {output_file}")
+    plt.close()
+
+
+def plot_per_compiler_detail(df_all, compiler_name, output_dir):
+    """
+    Generates a detailed plot for a single compiler, showing its performance across different categories.
+    """
+    df_compiler = df_all[df_all["Compiler"] == compiler_name]
+    if df_compiler.empty:
+        print(
+            f"Warning: No valid data found for compiler '{compiler_name}'. Skipping detailed plot."
+        )
+        return
+
+    categories = sorted(df_compiler["Category"].unique())
+
+    plt.figure(figsize=(10, 6))
+    sns.set_theme(style="whitegrid")
+
+    ax = sns.violinplot(
+        x="Category",
+        y="log2(speedup)",
+        data=df_compiler,
+        order=categories,
+        color="white",
+        linewidth=0.8,
+        inner=None,
+    )
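+    # The white violin shows the full log2(speedup) distribution; the narrow
+    # boxplot drawn on top marks the median (white line) and interquartile range.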
+
+    sns.boxplot(
+        x="Category",
+        y="log2(speedup)",
+        data=df_compiler,
+        order=categories,
+        showcaps=False,
+        boxprops={"facecolor": "royalblue", "edgecolor": "black"},
+        medianprops={"color": "white", "linewidth": 2},
+        whiskerprops={"color": "black", "linewidth": 1.5},
+        flierprops={"marker": ".", "markerfacecolor": "black"},
+        width=0.1,
+        ax=ax,
+    )
+
+    sample_counts = df_compiler["Category"].value_counts().to_dict()
+    # Use os.path.basename so only the leaf directory name appears in the label
+    x_labels = [
+        f"{os.path.basename(cat)}\n(n={sample_counts.get(cat, 0)})"
+        for cat in categories
+    ]
+
+    ax.set_ylabel("log2(speedup)", fontsize=14)
+    ax.set_xlabel("")
+    ax.set_xticks(ticks=range(len(x_labels)))
+    ax.set_xticklabels(x_labels, rotation=45, ha="right", fontsize=11)
+    ax.set_title(f"Speedup for {compiler_name} by Category", fontsize=16)
+
+    sns.despine(trim=True, left=True)
+
+    output_file = os.path.join(output_dir, f"{compiler_name}_speedup_by_category.png")
+    plt.savefig(output_file, dpi=300, bbox_inches="tight")
+    print(f"Detailed plot for '{compiler_name}' saved to: {output_file}")
+    plt.close()
+
+
+
+def analysis(args):
+    data_by_compiler_category, all_compilers = read_all_speedups(args.benchmark_path)
+
+    if not data_by_compiler_category:
+        print("Error: No valid benchmark data found.")
+        return
+
+    print(f"\nDiscovered compilers: {all_compilers}")
+
+    # Prepare data for the DataFrame
+    plot_data = {"Compiler": [], "Category": [], "log2(speedup)": []}
+
+    for compiler, categories_data in data_by_compiler_category.items():
+        for category, speedups in categories_data.items():
+            if not speedups:
+                continue
+
+            speedups_array = np.array(speedups)
+            # Filter out non-positive values before taking the logarithm
+            log2_speedups = np.log2(speedups_array[speedups_array > 0])
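+            # On the log2 scale, +1 means a 2x speedup over the baseline,
+            # 0 means parity, and -1 means a 2x slowdown.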
+
+            plot_data["log2(speedup)"].extend(log2_speedups)
+            plot_data["Compiler"].extend([compiler] * len(log2_speedups))
+            plot_data["Category"].extend([category] * len(log2_speedups))
+
+    df_all = pd.DataFrame(plot_data)
+
+    if df_all.empty:
+        print("Error: No valid data available for plotting after processing.")
+        return
+
+    # Create the output directory
+    os.makedirs(args.output_dir, exist_ok=True)
+
+    # 1. Generate the summary comparison plot
+    plot_summary_comparison(df_all, all_compilers, args.output_dir)
+
+    # 2. Generate a detailed plot for each compiler
+    for compiler in all_compilers:
+        plot_per_compiler_detail(df_all, compiler, args.output_dir)
 
 
 def main(args):
@@ -170,25 +238,19 @@ def main(args):
 
 if __name__ == "__main__":
     parser = argparse.ArgumentParser(
-        description="Analyse speedup from different compile frameworks/hardware types"
+        description="Analyze speedup from different compile frameworks/hardware types and generate plots."
     )
     parser.add_argument(
         "--benchmark-path",
         type=str,
         required=True,
-        help="Path include multiple benchmark results from test_compiler",
-    )
-    parser.add_argument(
-        "--test-compiler-log-file",
-        type=str,
-        required=False,
-        help="Log from test_compiler (Outdated)",
+        help="Path to the root directory containing benchmark result subdirectories and JSON files.",
     )
     parser.add_argument(
-        "--output-file",
+        "--output-dir",
         type=str,
-        default="compiler_speedup.png",
-        help="Output figure file name",
+        default="analysis_results",
+        help="Directory to save the output figures.",
     )
     args = parser.parse_args()
-    main(args=args)
+    main(args)
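+
+# Illustrative usage (paths and script name hypothetical):
+#   python analysis.py --benchmark-path benchmarks --output-dir analysis_results
+# produces summary_speedup_comparison.png plus one per-compiler figure.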