Skip to content

Commit 421c498

Browse files
committed
Merge leftover
1 parent 7bf92f9 commit 421c498

File tree

2 files changed

+2
-4
lines changed

2 files changed

+2
-4
lines changed

benchmarks/kernels/benchmark_paged_attention.py

Lines changed: 2 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -169,7 +169,6 @@ def run_cuda_benchmark(num_iters: int, profile: bool = False) -> float:
169169
kv_cache_dtype,
170170
k_scale,
171171
v_scale,
172-
None,
173172
)
174173
else:
175174
raise ValueError(f"Invalid version: {version}")
@@ -183,13 +182,13 @@ def run_cuda_benchmark(num_iters: int, profile: bool = False) -> float:
183182
# Warmup.
184183
print("Warming up...")
185184
run_benchmark = run_cuda_benchmark
186-
run_benchmark(num_iters=500, profile=False)
185+
run_benchmark(num_iters=3, profile=False)
187186

188187
# Benchmark.
189188
if do_profile:
190189
latency = run_benchmark(num_iters=1, profile=True)
191190
else:
192-
latency = run_benchmark(num_iters=10000, profile=False)
191+
latency = run_benchmark(num_iters=100, profile=False)
193192
print(f"Kernel running time: {latency * 1000000:.3f} us")
194193

195194

vllm/_custom_ops.py

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -11,7 +11,6 @@
1111
from vllm.logger import init_logger
1212
from vllm.platforms import current_platform
1313
from vllm.scalar_type import ScalarType
14-
from vllm.utils import is_navi
1514

1615
logger = init_logger(__name__)
1716

0 commit comments

Comments
 (0)