Skip to content

Commit 276b433

Browse files
committed
Update ray_trainer.py
1 parent 97dccaf commit 276b433

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

verl/trainer/ppo/ray_trainer.py

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -40,7 +40,7 @@
4040
from verl.utils.seqlen_balancing import get_seqlen_balanced_partitions, log_seqlen_unbalance
4141

4242
import re
43-
from search_r1.llm_agent.generation import LLMGenerationManager, GenerationConfig
43+
from openmanus_rl.llm_agent.openmanus import OpenManusAgent, AgentConfig
4444

4545
WorkerType = Type[Worker]
4646

@@ -444,7 +444,7 @@ def _validate(self):
444444
reward_tensor_lst = []
445445
data_source_lst = []
446446

447-
gen_config = GenerationConfig(
447+
gen_config = AgentConfig(
448448
max_turns=self.config.max_turns,
449449
max_start_length=self.config.data.max_start_length,
450450
max_prompt_length=self.config.data.max_prompt_length,
@@ -457,7 +457,7 @@ def _validate(self):
457457
)
458458

459459
# Agent config preparation
460-
generation_manager = LLMGenerationManager(
460+
generation_manager = OpenManusAgent(
461461
tokenizer=self.tokenizer,
462462
actor_rollout_wg=self.actor_rollout_wg,
463463
config=gen_config,
@@ -675,7 +675,7 @@ def fit(self):
675675
self.global_steps += 1
676676

677677
# Agent config preparation
678-
gen_config = GenerationConfig(
678+
gen_config = AgentConfig(
679679
max_turns=self.config.max_turns,
680680
max_start_length=self.config.data.max_start_length,
681681
max_prompt_length=self.config.data.max_prompt_length,
@@ -687,7 +687,7 @@ def fit(self):
687687
topk = self.config.retriever.topk,
688688
)
689689

690-
generation_manager = LLMGenerationManager(
690+
generation_manager = OpenManusAgent(
691691
tokenizer=self.tokenizer,
692692
actor_rollout_wg=self.actor_rollout_wg,
693693
config=gen_config,

0 commit comments

Comments
 (0)