benchmark: Add FP8 benchmarks for attention and matmul testing (#1390)
<!-- .github/pull_request_template.md -->
## 📌 Description
<!-- What does this PR do? Briefly describe the changes and why they’re
needed. -->
This PR extends the benchmarking script `flashinfer_benchmark.py` with:
* MLA backend testing
* FP8 attention benchmarking for prefill, decode, and MLA (see the sketch after this list)
* `bmm_fp8` and `mm_fp4` testing
* Additional backends where applicable (e.g., trtllm-gen for paged prefill)
* A fix for cuDNN prefill & decode benchmarking, which broke during the migration from cubins to the full cuDNN integration
* Minor benchmark code refactoring to reduce redundancy
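
For context, below is a minimal timing sketch in the spirit of the new `bmm_fp8` benchmark. It is illustrative only: the tensor layout and the exact `flashinfer.bmm_fp8` signature (argument order, scale shapes, the `dtype` keyword) are assumptions here, so treat `flashinfer_benchmark.py` itself as the authoritative usage.

```python
# Minimal FP8 batched-matmul timing sketch (illustrative, not the PR's code).
# Assumes flashinfer.bmm_fp8(A, B, A_scale, B_scale, dtype) with fp8-e4m3
# inputs and per-tensor float scales; verify against the installed API.
import torch
import flashinfer

B, M, K, N = 16, 1024, 1024, 1024
a = torch.randn(B, M, K, device="cuda").to(torch.float8_e4m3fn)
# Many FP8 GEMM kernels expect the second operand column-major (assumption);
# the transpose of a (B, N, K) tensor yields a column-major (B, K, N) view.
b = torch.randn(B, N, K, device="cuda").to(torch.float8_e4m3fn).transpose(-2, -1)
a_scale = torch.tensor(1.0, device="cuda")
b_scale = torch.tensor(1.0, device="cuda")

def run():
    return flashinfer.bmm_fp8(a, b, a_scale, b_scale, dtype=torch.bfloat16)

# Warm up, then time with CUDA events so GPU time is measured, not launch overhead.
for _ in range(5):
    run()
torch.cuda.synchronize()
start = torch.cuda.Event(enable_timing=True)
stop = torch.cuda.Event(enable_timing=True)
iters = 100
start.record()
for _ in range(iters):
    run()
stop.record()
torch.cuda.synchronize()
print(f"bmm_fp8 avg latency: {start.elapsed_time(stop) / iters:.3f} ms")
```

The same warmup-plus-CUDA-events pattern carries over to the prefill, decode, and MLA attention benchmarks, which differ mainly in the kernels and wrappers being timed.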
## 🔍 Related Issues
<!-- Link any related issues here -->
## 🚀 Pull Request Checklist
Thank you for contributing to FlashInfer! Before we review your pull
request, please make sure the following items are complete.
### ✅ Pre-commit Checks
- [x] I have installed `pre-commit` by running `pip install pre-commit`
(or used your preferred method).
- [x] I have installed the hooks with `pre-commit install`.
- [x] I have run the hooks manually with `pre-commit run --all-files`
and fixed any reported issues.
> If you are unsure about how to set up `pre-commit`, see [the
pre-commit documentation](https://pre-commit.com/).
## 🧪 Tests
- [x] Tests have been added or updated as needed.
- [x] All tests are passing (`unittest`, etc.).
## Reviewer Notes
<!-- Optional: anything you'd like reviewers to focus on, concerns, etc.
-->