Remove duplicate force_on_policy_ratio field from ClippedPGLossConfig

yfw · yfw · commit 5af40ce42af2 · 2025-12-02T03:24:43.000-08:00
Signed-off-by: Yi-Fu Wu <yifu.wu@gmail.com>
diff --git a/nemo_rl/algorithms/loss_functions.py b/nemo_rl/algorithms/loss_functions.py
@@ -46,7 +46,6 @@ class ClippedPGLossConfig(TypedDict):
     use_importance_sampling_correction: bool
     truncated_importance_sampling_ratio: float | None
     token_level_loss: bool
-    force_on_policy_ratio: bool
     # If True, apply the off-policy importance-sampling correction at the
     # sequence level (one weight per generated sample), as in GSPO.
     # If False (default), correction is applied at the token level as in the