We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 41602bc commit 3fd447aCopy full SHA for 3fd447a
trl/experimental/minillm/minillm_config.py
@@ -47,6 +47,8 @@ class MiniLLMConfig(GRPOConfig):
47
Whether to apply length normalization to the rewards.
48
"""
49
50
+ _VALID_DICT_FIELDS = TrainingArguments._VALID_DICT_FIELDS + ["teacher_model_init_kwargs"]
51
+
52
teacher_model_init_kwargs: dict[str, Any] | None = field(
53
default=None,
54
metadata={
0 commit comments