File tree: 2 files changed, +1 −33 lines changed.
Load Diff: This file was deleted.
Original file line number Diff line number Diff line change 9
9
from vllm .logger import init_logger
10
10
from vllm .v1 .sample .metadata import SamplingMetadata
11
11
from vllm .v1 .sample .ops .topk_topp_sampler import apply_top_k_top_p
12
- from vllm .v1 .sample .ops .utils import compiled_softmax
13
12
from vllm .v1 .spec_decode .metadata import SpecDecodeMetadata
14
13
15
14
logger = init_logger (__name__ )
@@ -275,8 +274,7 @@ def compute_probs(
275
274
# NOTE(woosuk): `apply_top_k_top_p` uses sorting to calculate the mask,
276
275
# which is slow for large vocab sizes. This may cause performance issues.
277
276
logits = apply_top_k_top_p (logits , top_k , top_p )
278
-
279
- output_prob = compiled_softmax (logits )
277
+ output_prob = logits .softmax (dim = - 1 , dtype = torch .float32 )
280
278
return output_prob
281
279
282
280
You can’t perform that action at this time.
0 commit comments