Skip to content

Commit f380945

Browse files
committed
Update
1 parent ee9cb27 commit f380945

File tree

2 files changed

+6
-4
lines changed

2 files changed

+6
-4
lines changed

graph_net/analysis.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@
1111
def parse_filename(filename):
1212
"""
1313
Parses the model name and compiler name from a JSON filename.
14-
Assumes filename format: <model_name>_<compiler_name>.json
14+
Follows the filename format used by graph_net.torch.test_compiler: <model_name>_<compiler_name>.json
1515
"""
1616
parts = os.path.splitext(filename)[0].split("_")
1717
if len(parts) < 2:
@@ -24,7 +24,7 @@ def parse_filename(filename):
2424
def read_all_speedups(benchmark_path):
2525
"""
2626
Recursively finds all .json files in a given path, extracts the speedup values,
27-
and organizes them by compiler and category (subdirectory).
27+
and organizes them by compiler and category (library).
2828
"""
2929
data_by_compiler_category = defaultdict(lambda: defaultdict(list))
3030
all_compilers = set()

graph_net/torch/test_compiler.py

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -105,8 +105,10 @@ def measure_performance(model_call, args, compiler):
105105
compiler.synchronize()
106106

107107
if "cuda" in args.device:
108-
# Acknowledgement: We evaluate the performance on both end-to-end and GPU-only timings, with reference to
109-
# methods only based on CUDA events from KernelBench in https://github.com/ScalingIntelligence/KernelBench.
108+
"""
109+
Acknowledgement: We evaluate the performance on both end-to-end and GPU-only timings,
110+
with reference to the methods based only on CUDA events from KernelBench: https://github.com/ScalingIntelligence/KernelBench
111+
"""
110112

111113
device = torch.device(args.device)
112114
hardware_name = torch.cuda.get_device_name(device)

0 commit comments

Comments
 (0)