We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 9a3101b commit 1d34eb1 (Copy full SHA for 1d34eb1)
vllm/v1/worker/gpu/block_table.py
@@ -3,10 +3,9 @@
3
from collections.abc import Iterable
4
5
import torch
6
-import triton
7
-import triton.language as tl
8
9
from vllm.attention.backends.utils import PAD_SLOT_ID
+from vllm.triton_utils import tl, triton
10
from vllm.utils.math_utils import cdiv
11
from vllm.v1.utils import CpuGpuBuffer
12
vllm/v1/worker/gpu/input_batch.py
@@ -7,9 +7,8 @@
import numba.types as types
import numpy as np
13
from vllm.utils import random_uuid
14
15
0 commit comments