2 files changed: +1 -33 lines changed.
Diff not loaded: This file was deleted.
Original file line number Diff line number Diff line change 99from vllm .logger import init_logger
1010from vllm .v1 .sample .metadata import SamplingMetadata
1111from vllm .v1 .sample .ops .topk_topp_sampler import apply_top_k_top_p
12- from vllm .v1 .sample .ops .utils import compiled_softmax
1312from vllm .v1 .spec_decode .metadata import SpecDecodeMetadata
1413
1514logger = init_logger (__name__ )
@@ -275,8 +274,7 @@ def compute_probs(
275274 # NOTE(woosuk): `apply_top_k_top_p` uses sorting to calculate the mask,
276275 # which is slow for large vocab sizes. This may cause performance issues.
277276 logits = apply_top_k_top_p (logits , top_k , top_p )
278-
279- output_prob = compiled_softmax (logits )
277+ output_prob = logits .softmax (dim = - 1 , dtype = torch .float32 )
280278 return output_prob
281279
282280
You can’t perform that action at this time.
0 commit comments