Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
16 changes: 16 additions & 0 deletions src/forge/data/rewards/math.py → src/forge/data/rewards.py
Original file line number Diff line number Diff line change
Expand Up @@ -54,3 +54,19 @@ def __call__(self, prompt: str, response: str, target: str) -> float:
if abs(expected_answer - model_answer) < self.tolerance:
return 1.0 # Correct answer
return 0.0 # Incorrect answer


class ThinkingReward(Reward):
    """Reward that pays out when a response carries both <think> tags."""

    def __init__(self, reward_value: float = 0.5):
        # Score handed back by __call__ when both tags are found.
        self.reward_value = reward_value

    def __call__(
        self, prompt: str, response: str, target: Optional[str] = None
    ) -> float:
        """Score ``response`` on the presence of <think> and </think>.

        The lookup is case-insensitive and only tests that each tag occurs
        somewhere in the text; relative order and enclosed content are not
        inspected. ``prompt`` and ``target`` are accepted but not used.

        Returns:
            ``self.reward_value`` when both tags occur, otherwise ``0.0``.
        """
        lowered = response.lower()
        has_both_tags = all(tag in lowered for tag in ("<think>", "</think>"))
        return self.reward_value if has_both_tags else 0.0
19 changes: 0 additions & 19 deletions src/forge/data/rewards/thinking.py

This file was deleted.

2 changes: 1 addition & 1 deletion tests/unit_tests/rl/test_math_reward.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@
import unittest
from unittest import mock

from forge.data.rewards.math import MathReward
from forge.data.rewards import MathReward


class TestMathReward(unittest.TestCase):
Expand Down
2 changes: 1 addition & 1 deletion tests/unit_tests/rl/test_thinking_reward.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,7 +6,7 @@

import unittest

from forge.data.rewards.thinking import ThinkingReward
from forge.data.rewards import ThinkingReward


class TestThinkingReward(unittest.TestCase):
Expand Down
Loading