 from forge.api.types import (
     ForwardBackwardResult,
     ForwardResult,
+    LossFn,
     OptimStepResult,
     TextTrainBatch,
     TrainerInfo,
 class Trainer(Protocol):
     """Protocol defining the standard interface for all Forge trainers."""
 
-    async def forward_backward(self, batch: TextTrainBatch) -> ForwardBackwardResult:
+    async def forward_backward(
+        self, batch: TextTrainBatch, loss_fn: LossFn | None = None
+    ) -> ForwardBackwardResult:
         """Execute forward pass and backward pass for one batch of data.
 
         Basic usage - single batch per optimizer step:
@@ -45,16 +48,26 @@ async def forward_backward(self, batch: TextTrainBatch) -> ForwardBackwardResult:
         >>> await trainer.forward_backward(batch2)  # Accumulates another batch
         >>> await trainer.optim_step()  # Apply all accumulated gradients
 
+        Custom loss function for specific batches:
+        >>> def custom_loss(logits: torch.Tensor, batch: TextTrainBatch) -> torch.Tensor:
+        >>>     # Custom loss computation (e.g., PPO clip, DPO, etc.)
+        >>>     return loss
+        >>>
+        >>> result = await trainer.forward_backward(batch, loss_fn=custom_loss)
+
         Args:
             batch: TextTrainBatch containing input_ids, target_ids, and optional
                 target_mask/target_weights. See forge.api.types.TextTrainBatch for details.
+            loss_fn: Optional custom loss function. If None, uses the loss function
+                configured at trainer creation. Signature: (logits, batch) -> loss.
+                Useful for mixed training objectives or experimentation.
 
         Returns:
             ForwardBackwardResult containing loss and metrics
 
         Note:
-            The loss function is configured at trainer creation time via the
-            `loss` parameter, not passed to this method.
+            The default loss function is configured at trainer creation time via the
+            `loss` parameter. The `loss_fn` parameter here allows a per-batch override.
         """
         ...
 
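For concreteness, here is a minimal sketch of a callable compatible with the documented (logits, batch) -> loss signature. It is an illustration under stated assumptions, not part of the Forge API: masked_ce_loss is a hypothetical name, the logits shape [batch, seq_len, vocab_size] is assumed, and only the TextTrainBatch fields named in the Args section (target_ids, target_mask) are used.

import torch
import torch.nn.functional as F

from forge.api.types import TextTrainBatch


def masked_ce_loss(logits: torch.Tensor, batch: TextTrainBatch) -> torch.Tensor:
    # Hypothetical loss_fn sketch; assumes logits is [batch, seq_len, vocab_size]
    # and is already aligned position-for-position with batch.target_ids.
    vocab_size = logits.size(-1)
    # Per-token cross-entropy over the flattened sequence.
    per_token = F.cross_entropy(
        logits.reshape(-1, vocab_size),
        batch.target_ids.reshape(-1),
        reduction="none",
    )
    if batch.target_mask is not None:
        # Average only over positions the optional mask marks as real targets.
        mask = batch.target_mask.reshape(-1).to(per_token.dtype)
        return (per_token * mask).sum() / mask.sum().clamp(min=1.0)
    return per_token.mean()


# Usage (inside an async context):
# result = await trainer.forward_backward(batch, loss_fn=masked_ce_loss)

Because loss_fn is resolved per call, one trainer can mix objectives across batches (e.g., alternating a supervised loss with PPO-clip or DPO style losses) and falls back to the loss configured at creation whenever loss_fn is None.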