Skip to content

Commit d2ab369

Browse files
authored
[MTP] Support RL reshard (#4074)
* support rl reshard
* modify model name
1 parent 2883746 commit d2ab369

File tree

3 files changed

+4
-0
lines changed

3 files changed

+4
-0
lines changed

fastdeploy/config.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -132,6 +132,7 @@ def __init__(
132132
self.eos_tokens_lens: int = 2
133133
self.lm_head_fp32: bool = False
134134
self.model_format = "auto"
135+
self.num_nextn_predict_layers = 0
135136
for key, value in args.items():
136137
if hasattr(self, key):
137138
setattr(self, key, value)

fastdeploy/multimodal/registry.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,6 +24,7 @@ class MultimodalRegistry:
2424
"Ernie4_5_VLMoeForConditionalGeneration",
2525
"Ernie5MoeForCausalLM",
2626
"Qwen2_5_VLForConditionalGeneration",
27+
"Ernie5ForCausalLM",
2728
}
2829

2930
@classmethod

fastdeploy/rl/rollout_config.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -61,6 +61,7 @@ def __init__(
6161
local_rank: int = 0,
6262
moba_attention_config: str = None,
6363
data_parallel_size: int = 1,
64+
num_nextn_predict_layers: int = 0,
6465
):
6566
# Required parameters
6667
self.model = model_name_or_path
@@ -107,6 +108,7 @@ def __init__(
107108
self.early_stop_config = early_stop_config
108109
self.ips = None
109110
self.moba_attention_config = moba_attention_config
111+
self.num_nextn_predict_layers = num_nextn_predict_layers
110112

111113
def __str__(self):
112114
return "\n".join(f"{k}: {v}" for k, v in self.__dict__.items())

0 commit comments

Comments
 (0)