We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 78bf77a, commit a7b54f9 (Copy full SHA for a7b54f9)
tests/slow/test_grpo_slow.py
@@ -79,6 +79,7 @@ def test_training_with_liger_grpo_loss(self, model_name):
79
max_completion_length=self.max_length,
80
report_to="none",
81
logging_strategy="no",
82
+ loss_type="bnpo", # liger-kernel does not support "dapo" default; see https://github.com/linkedin/Liger-Kernel/issues/620
83
)
84
85
model = AutoModelForCausalLM.from_pretrained(model_name)
0 commit comments