Skip to content

Commit af70d71

Browse files
committed
add lb default
1 parent 1008eed commit af70d71

File tree

3 files changed: 4 additions and 13 deletions.

slime/backends/megatron_utils/model_provider.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -33,6 +33,8 @@ def __init__(
3333
self.sequence_parallel = config.sequence_parallel
3434
if self.sequence_parallel:
3535
self.weight.sequence_parallel = True
36+
if bias:
37+
self.bias.sequence_parallel = True
3638

3739
self.weight.data.normal_(mean=0.0, std=0.02)
3840
if bias:

slime/backends/sglang_utils/arguments.py

Lines changed: 1 addition & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -25,18 +25,6 @@ def add_sglang_router_arguments(parser):
2525
default=14400,
2626
help="Timeout for requests to the SGLang router in seconds",
2727
)
28-
parser.add_argument(
29-
"--sglang-router-balance-abs-threshold",
30-
type=int,
31-
default=10,
32-
help="Absolute threshold for balance in the SGLang router",
33-
)
34-
parser.add_argument(
35-
"--sglang-router-balance-rel-threshold",
36-
type=float,
37-
default=1.2,
38-
help="Relative threshold for balance in the SGLang router",
39-
)
4028
return parser
4129

4230

@@ -45,6 +33,7 @@ def add_sglang_arguments(parser):
4533
Add arguments to the parser for the SGLang server.
4634
"""
4735
parser = add_sglang_router_arguments(parser)
36+
parser.set_defaults(router_balance_abs_threshold=10, router_balance_rel_threshold=1.2)
4837
parser.add_argument("--sglang-server-concurrency", type=int, default=512)
4938

5039
old_add_argument = parser.add_argument

slime/ray/rollout.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -659,7 +659,7 @@ def _start_router(args):
659659
router_args.pd_disaggregation = True
660660

661661
logger.info(f"Launch router with args: {router_args}")
662-
662+
print("!!!", router_args.balance_abs_threshold)
663663
process = multiprocessing.Process(
664664
target=run_router,
665665
args=(router_args,),

0 commit comments

Comments
 (0)