@@ -810,7 +810,7 @@ def add_request(
810810 Details:
811811 - Set arrival_time to the current time if it is None.
812812 - Set prompt_token_ids to the encoded prompt if it is None.
813- - Create `best_of ` number of :class:`~vllm.Sequence` objects.
813+ - Create `n` number of :class:`~vllm.Sequence` objects.
814814 - Create a :class:`~vllm.SequenceGroup` object
815815 from the list of :class:`~vllm.Sequence`.
816816 - Add the :class:`~vllm.SequenceGroup` object to the scheduler.
@@ -1289,8 +1289,7 @@ def _advance_to_next_step(
12891289 if seq_group_metadata .do_sample :
12901290 assert len (sequence_group_outputs .samples ) == 1 , (
12911291 "Async output processor expects a single sample"
1292- " (i.e sampling_params.n == 1 and no "
1293- "sampling_params.best_of > 1)" )
1292+ " (i.e sampling_params.n == 1)" )
12941293 sample = sequence_group_outputs .samples [0 ]
12951294
12961295 assert len (seq_group .seqs ) == 1
@@ -1659,7 +1658,6 @@ def _get_stats(self,
16591658 # Metadata
16601659 num_prompt_tokens_requests : List [int ] = []
16611660 num_generation_tokens_requests : List [int ] = []
1662- best_of_requests : List [int ] = []
16631661 n_requests : List [int ] = []
16641662 finished_reason_requests : List [str ] = []
16651663
@@ -1730,8 +1728,6 @@ def _get_stats(self,
17301728 for seq in seq_group .get_finished_seqs ()
17311729 ])
17321730 if seq_group .sampling_params is not None :
1733- best_of_requests .append (
1734- seq_group .sampling_params .best_of )
17351731 n_requests .append (seq_group .sampling_params .n )
17361732 finished_reason_requests .extend ([
17371733 SequenceStatus .get_finished_reason (seq .status )
@@ -1784,7 +1780,6 @@ def _get_stats(self,
17841780 # Metadata
17851781 num_prompt_tokens_requests = num_prompt_tokens_requests ,
17861782 num_generation_tokens_requests = num_generation_tokens_requests ,
1787- best_of_requests = best_of_requests ,
17881783 n_requests = n_requests ,
17891784 finished_reason_requests = finished_reason_requests ,
17901785 )
@@ -1871,8 +1866,6 @@ def create_trace_span(self, seq_group: SequenceGroup) -> None:
18711866 seq_group .sampling_params .top_p )
18721867 seq_span .set_attribute (SpanAttributes .LLM_REQUEST_MAX_TOKENS ,
18731868 seq_group .sampling_params .max_tokens )
1874- seq_span .set_attribute (SpanAttributes .LLM_REQUEST_BEST_OF ,
1875- seq_group .sampling_params .best_of )
18761869 seq_span .set_attribute (SpanAttributes .LLM_REQUEST_N ,
18771870 seq_group .sampling_params .n )
18781871 seq_span .set_attribute (SpanAttributes .LLM_USAGE_NUM_SEQUENCES ,
0 commit comments