@@ -540,7 +540,7 @@ def test_decode_schedule_preempted():
540
540
curr_loras = None
541
541
for i in range (3 ):
542
542
_ , seq_group = create_dummy_prompt (str (i ), prompt_length = 60 )
543
- scheduler ._allocate_and_set_running (seq_group , 60 )
543
+ scheduler ._allocate_and_set_running (seq_group )
544
544
append_new_token_seq_group (60 , seq_group , 1 )
545
545
running .append (seq_group )
546
546
scheduler .block_manager .can_append_slots = MagicMock ()
@@ -581,7 +581,7 @@ def test_decode_swap_beam_search():
581
581
budget = create_token_budget ()
582
582
for i in range (3 ):
583
583
_ , seq_group = create_dummy_prompt (str (i ), prompt_length = 60 , best_of = 2 )
584
- scheduler ._allocate_and_set_running (seq_group , 60 )
584
+ scheduler ._allocate_and_set_running (seq_group )
585
585
running .append (seq_group )
586
586
append_new_token_seq_group (60 , seq_group , 1 )
587
587
budget .add_num_seqs (seq_group .request_id ,
@@ -629,7 +629,7 @@ def test_schedule_decode_blocks_to_copy_update():
629
629
running = deque ()
630
630
policy = PolicyFactory .get_policy (policy_name = "fcfs" )
631
631
curr_loras = None
632
- scheduler ._allocate_and_set_running (seq_group , 60 )
632
+ scheduler ._allocate_and_set_running (seq_group )
633
633
append_new_token_seq_group (60 , seq_group , 1 )
634
634
running .append (seq_group )
635
635
@@ -659,7 +659,7 @@ def test_schedule_swapped_simple():
659
659
curr_loras = None
660
660
blocks_to_swap_out = {}
661
661
_ , seq_group = create_dummy_prompt ("1" , prompt_length = 60 , best_of = 2 )
662
- scheduler ._allocate_and_set_running (seq_group , 60 )
662
+ scheduler ._allocate_and_set_running (seq_group )
663
663
append_new_token_seq_group (60 , seq_group , 1 )
664
664
scheduler ._swap_out (seq_group , blocks_to_swap_out )
665
665
swapped .append (seq_group )
@@ -687,7 +687,7 @@ def test_schedule_swapped_max_token_budget():
687
687
blocks_to_swap_out = {}
688
688
for _ in range (2 ):
689
689
_ , seq_group = create_dummy_prompt ("1" , prompt_length = 60 , best_of = 2 )
690
- scheduler ._allocate_and_set_running (seq_group , 60 )
690
+ scheduler ._allocate_and_set_running (seq_group )
691
691
append_new_token_seq_group (60 , seq_group , 1 )
692
692
scheduler ._swap_out (seq_group , blocks_to_swap_out )
693
693
swapped .append (seq_group )
@@ -721,7 +721,7 @@ def test_schedule_swapped_max_seqs():
721
721
blocks_to_swap_out = {}
722
722
for i in range (4 ):
723
723
_ , seq_group = create_dummy_prompt (str (i ), prompt_length = 60 )
724
- scheduler ._allocate_and_set_running (seq_group , 60 )
724
+ scheduler ._allocate_and_set_running (seq_group )
725
725
append_new_token_seq_group (60 , seq_group , 1 )
726
726
scheduler ._swap_out (seq_group , blocks_to_swap_out )
727
727
swapped .append (seq_group )
@@ -759,7 +759,7 @@ def test_schedule_swapped_max_loras():
759
759
lora_name = str (i ),
760
760
lora_int_id = i + 1 ,
761
761
lora_local_path = "abc" ))
762
- scheduler ._allocate_and_set_running (seq_group , 60 )
762
+ scheduler ._allocate_and_set_running (seq_group )
763
763
append_new_token_seq_group (60 , seq_group , 1 )
764
764
scheduler ._swap_out (seq_group , blocks_to_swap_out )
765
765
swapped .append (seq_group )
@@ -783,7 +783,7 @@ def test_schedule_swapped_cannot_swap_in():
783
783
blocks_to_swap_out = {}
784
784
for _ in range (2 ):
785
785
_ , seq_group = create_dummy_prompt ("1" , prompt_length = 60 , best_of = 2 )
786
- scheduler ._allocate_and_set_running (seq_group , 60 )
786
+ scheduler ._allocate_and_set_running (seq_group )
787
787
append_new_token_seq_group (60 , seq_group , 1 )
788
788
scheduler ._swap_out (seq_group , blocks_to_swap_out )
789
789
swapped .append (seq_group )
@@ -808,7 +808,7 @@ def test_schedule_swapped_blocks_to_copy():
808
808
policy = PolicyFactory .get_policy (policy_name = "fcfs" )
809
809
curr_loras = None
810
810
_ , seq_group = create_dummy_prompt ("1" , prompt_length = 60 , best_of = 2 )
811
- scheduler ._allocate_and_set_running (seq_group , 60 )
811
+ scheduler ._allocate_and_set_running (seq_group )
812
812
append_new_token_seq_group (60 , seq_group , 1 )
813
813
blocks_to_swap_out = {}
814
814
scheduler ._swap_out (seq_group , blocks_to_swap_out )
0 commit comments