Skip to content

Productionize the dataset we are using for BackendBench #93

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Open
wants to merge 37 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
37 commits
Select commit Hold shift + click to select a range
8803f09
Add tests for serialization and deserialization
PaliC Jul 29, 2025
7495107
fix
PaliC Jul 30, 2025
e23bd3a
fix
PaliC Jul 30, 2025
0d54c1c
[ez] get workflows to run on prs (#39)
PaliC Jul 23, 2025
0eb0753
Grab txt file from huggingface as the default (#38)
PaliC Jul 23, 2025
037f7c5
Installable backends (#27)
msaroufim Jul 23, 2025
455b443
Fix flag gems tests and imports (#35)
bertmaher Jul 28, 2025
dd1aa1c
Fixes to kernel agent backend tests (#46)
bertmaher Jul 29, 2025
5a5702a
Filter out solutions that have cuda streams (#56)
PaliC Jul 30, 2025
e6bb19a
Add tests for serialization and deserialization
PaliC Jul 29, 2025
4b1722b
fix
PaliC Jul 30, 2025
3a670c6
fix
PaliC Jul 30, 2025
e4ccfb8
rebase
PaliC Jul 31, 2025
7618519
rebase fix
PaliC Jul 31, 2025
32d52d1
rebase fix
PaliC Jul 31, 2025
d8c186c
Merge branch 'main' into serial
PaliC Jul 31, 2025
1c18247
Adding parquet file
PaliC Jul 31, 2025
1ecb1f7
filtering logic
PaliC Aug 1, 2025
55bcfd6
Merge branch 'main' into parquet
PaliC Aug 1, 2025
a1bdf7a
cleanup
PaliC Aug 1, 2025
32d3c7b
Merge branch 'main' into parquet
PaliC Aug 1, 2025
8940b44
Merge branch 'parquet' of github.com:PaliC/BackendBench into parquet
PaliC Aug 1, 2025
7408e7a
parquet
PaliC Aug 1, 2025
f535d8a
update deps
PaliC Aug 1, 2025
a68fbda
undo lint
PaliC Aug 1, 2025
a58f0d8
update hf upload
PaliC Aug 1, 2025
e8c5d1a
Mark's comments
PaliC Aug 13, 2025
a4c8171
Merge branch 'main' into parquet
PaliC Aug 13, 2025
d25c2d3
lint
PaliC Aug 13, 2025
9ae0cac
stream from urls
PaliC Aug 13, 2025
f23690a
simplify
PaliC Aug 14, 2025
dbe3a8d
lint
PaliC Aug 14, 2025
0705fa6
marks comments
PaliC Aug 15, 2025
9094e1a
Mark's comments
PaliC Aug 15, 2025
5cc096c
Mark's comments
PaliC Aug 15, 2025
37d5b27
remove big inputs from dataset
PaliC Aug 18, 2025
30661de
final fix
PaliC Aug 19, 2025
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -7,4 +7,5 @@ backendbench.egg-info/
CLAUDE.md
venv/
ops/
datasets/
uv.lock
229 changes: 229 additions & 0 deletions BackendBench/data_loaders.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,229 @@
"""
Shared data loading utilities for reading trace and parquet files.
"""

import hashlib
import logging
import re
from pathlib import Path
from typing import Dict, List, Optional, Union

import pyarrow.parquet as pq

import requests
import torch
from BackendBench.utils import cleanup_memory_and_gpu, deserialize_args
from tqdm import tqdm


def _args_size(args):
"""Calculate the size of arguments in bytes."""

size = 0
for arg in args:
if isinstance(arg, torch.Tensor):
size += arg.numel() * arg.element_size()
elif isinstance(arg, (tuple, list)):
size += _args_size(arg)
return size


def _parse_trace_file(filename: str, filter: Optional[List[str]] = None) -> List[Dict]:
    """
    Parse a single trace file and return a list of operation dictionaries.

    Args:
        filename: Path to trace file
        filter: Optional list of operation name filters; an op is kept when
            any filter string occurs as a substring of its name (all ops are
            kept when filter is None)

    Returns:
        One dict per matching "cnt:" line with keys: uuid, op_name, args,
        arg_size (MB), count, is_synthetic.
    """
    op_inputs = []
    op = None

    with open(filename, "r") as f:
        # Materialize the file so tqdm knows the total line count.
        lines = list(f)
        iterator = tqdm(lines, desc=f"Parsing {Path(filename).name}")
        for line in iterator:
            if m := re.match("Operator: (.*)", line):
                op = m.group(1)
                # this is due to a version skew error of the pytorch version we're
                # using for developing BackendBench and what was used in tritonbench where
                # SymInt didn't exist.
                # @todo: see if we can remove this before releasing
                if op == "aten.sum.SymInt":
                    op = "aten.sum.dim_IntList"
            if m := re.match("cnt: \\d+, (.*)", line):
                assert op is not None
                args_str = m.group(1)
                cnt = int(m.group(0).split(",")[0].split(":")[1])

                if filter is None or any(f in op for f in filter):
                    args, kwargs = deserialize_args(args_str)
                    size = _args_size(args) + _args_size(list(kwargs.values()))
                    # Free the deserialized tensors immediately (consistent
                    # with _parse_trace_stream); otherwise every traced input
                    # stays alive in (GPU) memory until the whole file is
                    # parsed.
                    del args, kwargs
                    cleanup_memory_and_gpu()
                    size = size / (1024 * 1024)  # Convert to MB
                    is_synthetic = cnt == 0

                    op_inputs.append(
                        {
                            "uuid": hashlib.sha256(args_str.encode() + op.encode()).hexdigest(),
                            "op_name": op,
                            "args": args_str,
                            "arg_size": size,
                            "count": cnt,
                            "is_synthetic": is_synthetic,
                        }
                    )
    return op_inputs


def _parse_trace_stream(
    stream, filter: Optional[List[str]] = None, desc: str = "Parsing stream"
) -> List[Dict]:
    """
    Parse trace data from a text stream (e.g., from requests.Response.iter_lines()).

    Args:
        stream: Iterable of lines (strings or bytes)
        filter: Optional list of operation name filters
        desc: Description for progress bar

    Returns:
        One dict per matching "cnt:" line with keys: uuid, op_name, args,
        arg_size (MB), count, is_synthetic.
    """
    results: List[Dict] = []
    current_op = None

    for raw_line in tqdm(stream, desc=desc):
        # Response streams yield bytes; normalize to str before matching.
        line = raw_line.decode("utf-8") if isinstance(raw_line, bytes) else raw_line

        if op_match := re.match("Operator: (.*)", line):
            current_op = op_match.group(1)
            # Version-skew workaround: map the SymInt overload name emitted
            # by older traces onto its current equivalent.
            if current_op == "aten.sum.SymInt":
                current_op = "aten.sum.dim_IntList"

        cnt_match = re.match("cnt: \\d+, (.*)", line)
        if cnt_match is None:
            continue
        assert current_op is not None

        serialized = cnt_match.group(1)
        call_count = int(cnt_match.group(0).split(",")[0].split(":")[1])

        if filter is not None and not any(f in current_op for f in filter):
            continue

        parsed_args, parsed_kwargs = deserialize_args(serialized)
        size_bytes = _args_size(parsed_args) + _args_size(list(parsed_kwargs.values()))
        # Release the deserialized tensors right away so they don't pile up
        # while the rest of the stream is parsed.
        del parsed_args, parsed_kwargs
        cleanup_memory_and_gpu()

        results.append(
            {
                "uuid": hashlib.sha256(serialized.encode() + current_op.encode()).hexdigest(),
                "op_name": current_op,
                "args": serialized,
                "arg_size": size_bytes / (1024 * 1024),  # Convert to MB
                "count": call_count,
                "is_synthetic": call_count == 0,
            }
        )
    return results


def load_ops_from_source(
    source: Union[str, Path],
    format: str = "auto",
    filter: Optional[List[str]] = None,
) -> List[Dict]:
    """
    Load operation data from various sources and formats.

    Args:
        source: File path (str or pathlib.Path) or URL
        format: "trace", "parquet", or "auto" (detect from file extension)
        filter: Optional list of operation name filters

    Returns:
        List of dictionaries with detailed operation info

    Raises:
        ValueError: if the format cannot be auto-detected from the source,
            or an unknown format is given explicitly.

    Auto-detection behavior:
        - https://domain.com/data.parquet → parquet format
        - https://domain.com/data.txt → trace format
        - https://domain.com/data → trace format (fallback)
        - local_file.parquet → parquet format
        - local_file.txt → trace format
    """

    # Auto-detect format if not specified
    if format == "auto":
        # Normalize Path objects so the extension checks below work for both
        # str and pathlib.Path sources (previously Path inputs always raised).
        source_str = str(source) if isinstance(source, Path) else source
        if isinstance(source_str, str):
            # Check file extension first (works for both local files and URLs)
            if source_str.endswith(".parquet"):
                format = "parquet"
            elif source_str.endswith(".txt"):
                format = "trace"
            elif source_str.startswith(("http://", "https://")):
                # Remote URL without recognizable extension - default to trace
                format = "trace"
            else:
                raise ValueError(f"Unsupported source: {source}")
        else:
            raise ValueError(f"Unsupported source: {source}")

    if format == "parquet":
        return _load_from_parquet(source, filter)
    elif format == "trace":
        # Always load full data - consumers can extract what they need
        return _load_from_trace(source, filter)
    else:
        raise ValueError(f"Unsupported format: {format}")


def _load_from_parquet(source: Union[str, Path], filter: Optional[List[str]]):
    """Load operations from a parquet file as a list of record dicts.

    When *filter* is non-empty, keep only rows whose op_name contains at
    least one of the filter strings as a substring.
    """
    records = pq.read_table(source).to_pandas().to_dict("records")

    if filter:
        records = [row for row in records if any(f in row["op_name"] for f in filter)]

    return records


def op_list_to_benchmark_dict(ops_list: List[Dict]) -> Dict[str, List[str]]:
    """
    Convert a list of operation dictionaries to a dictionary format which can be used for benchmarking.

    Args:
        ops_list: List of dicts with 'op_name', 'args', and
            'included_in_benchmark' keys

    Returns:
        Dictionary mapping op_name to list of args strings, covering only the
        ops marked as included in the benchmark, in input order
    """
    benchmark_dict: Dict[str, List[str]] = {}
    for entry in ops_list:
        if entry["included_in_benchmark"]:
            benchmark_dict.setdefault(entry["op_name"], []).append(entry["args"])
    return benchmark_dict


def _load_from_trace(source: Union[str, Path], filter: Optional[List[str]]) -> List[Dict]:
    """Load operations from a local trace file or a remote trace URL."""
    is_url = isinstance(source, str) and source.startswith(("http://", "https://"))

    # Local path: parse the file directly.
    if not is_url:
        return _parse_trace_file(source, filter)

    # Remote URL: stream line-by-line without saving to disk.
    logging.info(f"Downloading trace from {source}")
    with requests.get(source, stream=True) as response:
        response.raise_for_status()
        return _parse_trace_stream(response.iter_lines(), filter, "Parsing")
4 changes: 1 addition & 3 deletions BackendBench/eval.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,9 +4,7 @@

import triton.testing


from BackendBench.utils import uses_cuda_stream
from BackendBench.utils import serialize_args
from BackendBench.utils import serialize_args, uses_cuda_stream

logger = logging.getLogger(__name__)

Expand Down
30 changes: 30 additions & 0 deletions BackendBench/scripts/dataset_filters.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,30 @@
# Operators to skip for indexing ops that need valid indices
SKIP_OPERATORS = [
    "embedding",
    "scatter",
    "gather",
    "index",
    "nll_loss",
    "im2col_backward",
    "col2im_backward",
    "native_layer_norm_backward",
    "upsample_nearest2d_backward.vec",
    "upsample_bilinear2d_backward.vec",
    "_cudnn_rnn_backward.default",  # RuntimeError: cuDNN error: CUDNN_STATUS_BAD_PARAM
    "_fft_c2c.default",  # cuFFT only supports dimensions whose sizes are powers of two when computing in half precision
]


def apply_skip_ops_filter(ops):
    """Exclude unrunnable and synthetic ops from the benchmark.

    Mutates each op dict in place (included_in_benchmark, runnable,
    why_excluded) and returns the same list.
    """
    for entry in ops:
        name = entry["op_name"]

        # Ops we cannot execute yet: drop from the benchmark entirely.
        if any(skip in name for skip in SKIP_OPERATORS):
            entry["included_in_benchmark"] = False
            entry["why_excluded"].append("We cannot run this op on backendbench yet")
            entry["runnable"] = False

        # Synthetic (count == 0) inputs are excluded but may still be runnable.
        if entry["is_synthetic"]:
            entry["included_in_benchmark"] = False
            entry["why_excluded"].append(
                "Synthetic ops are not supported in the official benchmark yet"
            )
    return ops
12 changes: 1 addition & 11 deletions BackendBench/scripts/get_big_inputs.py
Original file line number Diff line number Diff line change
@@ -1,5 +1,4 @@
import argparse
import gc
import logging
import os
import tempfile
Expand All @@ -20,6 +19,7 @@
)
from main import setup_logging
from tqdm import tqdm
from BackendBench.utils import cleanup_memory_and_gpu

# Magic numbers and constants
MAX_ITERATIONS = 100 # Maximum binary search iterations to prevent infinite loops
Expand All @@ -44,16 +44,6 @@
log = logging.getLogger(__name__)


def cleanup_memory_and_gpu(*variables):
"""Helper function to delete variables and clean up GPU memory"""
for var in variables:
if var is not None:
del var
torch.cuda.synchronize()
torch.cuda.empty_cache()
gc.collect()


def scale_shape(shape: List[int], scale_factor: float) -> List[int]:
"""Scale tensor shape by a factor"""
return [max(MIN_TENSOR_DIM, int(dim * scale_factor)) for dim in shape]
Expand Down
1 change: 1 addition & 0 deletions BackendBench/scripts/main.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,7 @@
import BackendBench.eval as eval
import click
import torch

from BackendBench.facto_suite import FactoTestSuite
from BackendBench.llm_client import ClaudeKernelGenerator, LLMKernelGenerator
from BackendBench.opinfo_suite import OpInfoTestSuite
Expand Down
Loading
Loading