diff --git a/agentlightning/verl/trainer.py b/agentlightning/verl/trainer.py index 413a0a1cf..efb870f46 100644 --- a/agentlightning/verl/trainer.py +++ b/agentlightning/verl/trainer.py @@ -424,6 +424,7 @@ def _train_step(self, batch_dict: dict) -> dict: scores=scores, reward_extra_infos_dict=reward_extra_infos_dict, dump_path=rollout_data_dir, + gts=None, ) # compute training metrics diff --git a/contrib/agentlightning/contrib/algorithm/env_verl/trainer.py b/contrib/agentlightning/contrib/algorithm/env_verl/trainer.py index 3dd2458f4..ae606ef87 100644 --- a/contrib/agentlightning/contrib/algorithm/env_verl/trainer.py +++ b/contrib/agentlightning/contrib/algorithm/env_verl/trainer.py @@ -421,6 +421,7 @@ def _train_step(self, batch_dict: dict) -> dict: scores=scores, reward_extra_infos_dict=reward_extra_infos_dict, dump_path=rollout_data_dir, + gts=None, ) # compute training metrics