3 files changed: +4 additions, -13 deletions
Original file line number | Diff line number | Diff line change
@@ -33,6 +33,8 @@ def __init__(
3333 self .sequence_parallel = config .sequence_parallel
3434 if self .sequence_parallel :
3535 self .weight .sequence_parallel = True
36+ if bias :
37+ self .bias .sequence_parallel = True
3638
3739 self .weight .data .normal_ (mean = 0.0 , std = 0.02 )
3840 if bias :
Original file line number Diff line number Diff line change @@ -25,18 +25,6 @@ def add_sglang_router_arguments(parser):
2525 default = 14400 ,
2626 help = "Timeout for requests to the SGLang router in seconds" ,
2727 )
28- parser .add_argument (
29- "--sglang-router-balance-abs-threshold" ,
30- type = int ,
31- default = 10 ,
32- help = "Absolute threshold for balance in the SGLang router" ,
33- )
34- parser .add_argument (
35- "--sglang-router-balance-rel-threshold" ,
36- type = float ,
37- default = 1.2 ,
38- help = "Relative threshold for balance in the SGLang router" ,
39- )
4028 return parser
4129
4230
@@ -45,6 +33,7 @@ def add_sglang_arguments(parser):
4533 Add arguments to the parser for the SGLang server.
4634 """
4735 parser = add_sglang_router_arguments (parser )
36+ parser .set_defaults (router_balance_abs_threshold = 10 , router_balance_rel_threshold = 1.2 )
4837 parser .add_argument ("--sglang-server-concurrency" , type = int , default = 512 )
4938
5039 old_add_argument = parser .add_argument
Original file line number Diff line number Diff line change @@ -659,7 +659,7 @@ def _start_router(args):
659659 router_args .pd_disaggregation = True
660660
661661 logger .info (f"Launch router with args: { router_args } " )
662-
662+ print ( "!!!" , router_args . balance_abs_threshold )
663663 process = multiprocessing .Process (
664664 target = run_router ,
665665 args = (router_args ,),
You can’t perform that action at this time.
0 commit comments