@@ -767,7 +767,7 @@ def add_request(
767767 Details:
768768 - Set arrival_time to the current time if it is None.
769769 - Set prompt_token_ids to the encoded prompt if it is None.
770- - Create `best_of ` number of :class:`~vllm.Sequence` objects.
770+ - Create `n` number of :class:`~vllm.Sequence` objects.
771771 - Create a :class:`~vllm.SequenceGroup` object
772772 from the list of :class:`~vllm.Sequence`.
773773 - Add the :class:`~vllm.SequenceGroup` object to the scheduler.
@@ -1242,8 +1242,7 @@ def _advance_to_next_step(
12421242 if seq_group_metadata .do_sample :
12431243 assert len (sequence_group_outputs .samples ) == 1 , (
12441244 "Async output processor expects a single sample"
1245- " (i.e sampling_params.n == 1 and no "
1246- "sampling_params.best_of > 1)" )
1245+ " (i.e sampling_params.n == 1)" )
12471246 sample = sequence_group_outputs .samples [0 ]
12481247
12491248 assert len (seq_group .seqs ) == 1
@@ -1612,7 +1611,6 @@ def _get_stats(self,
16121611 # Metadata
16131612 num_prompt_tokens_requests : List [int ] = []
16141613 num_generation_tokens_requests : List [int ] = []
1615- best_of_requests : List [int ] = []
16161614 n_requests : List [int ] = []
16171615 finished_reason_requests : List [str ] = []
16181616
@@ -1683,8 +1681,6 @@ def _get_stats(self,
16831681 for seq in seq_group .get_finished_seqs ()
16841682 ])
16851683 if seq_group .sampling_params is not None :
1686- best_of_requests .append (
1687- seq_group .sampling_params .best_of )
16881684 n_requests .append (seq_group .sampling_params .n )
16891685 finished_reason_requests .extend ([
16901686 SequenceStatus .get_finished_reason (seq .status )
@@ -1737,7 +1733,6 @@ def _get_stats(self,
17371733 # Metadata
17381734 num_prompt_tokens_requests = num_prompt_tokens_requests ,
17391735 num_generation_tokens_requests = num_generation_tokens_requests ,
1740- best_of_requests = best_of_requests ,
17411736 n_requests = n_requests ,
17421737 finished_reason_requests = finished_reason_requests ,
17431738 )
@@ -1824,8 +1819,6 @@ def create_trace_span(self, seq_group: SequenceGroup) -> None:
18241819 seq_group .sampling_params .top_p )
18251820 seq_span .set_attribute (SpanAttributes .LLM_REQUEST_MAX_TOKENS ,
18261821 seq_group .sampling_params .max_tokens )
1827- seq_span .set_attribute (SpanAttributes .LLM_REQUEST_BEST_OF ,
1828- seq_group .sampling_params .best_of )
18291822 seq_span .set_attribute (SpanAttributes .LLM_REQUEST_N ,
18301823 seq_group .sampling_params .n )
18311824 seq_span .set_attribute (SpanAttributes .LLM_USAGE_NUM_SEQUENCES ,
0 commit comments