0731_3

2025-07-31 16:53:06 +08:00 · 2025-07-31 16:53:06 +08:00 · 2e0af5dd87
parent 78d0367ff2
commit 2e0af5dd87
1 changed files with 5 additions and 21 deletions
--- a/examples/arealite/reward/geometry3k.py
+++ b/examples/arealite/reward/geometry3k.py
@ -19,25 +19,9 @@ def geometry3k_reward_fn(
        return 0
    if ans is None:
        return 0
-
-    is_numeric = sol.replace('.', '', 1).isdigit() or ans.replace('.', '', 1).isdigit() # Allows for decimal check
-    is_latex = sol.startswith("\\frac") or '\\sqrt' in sol or ans.startswith("\\frac") or '\\sqrt' in ans
    print(f"sol: {sol}, ans: {ans}")
-    # Exact answer matching
-    if sol == ans :
-        reward = 1
-    elif is_numeric and not is_latex and abs(float(sol) - float(ans)) < 1e-4:
-        reward = 0.8  # Reward for correct numerical approximation
-    elif is_latex:
-        # Check if numbers in LaTeX are correct
-        expected_numbers = re.findall(r'-?\d+\.?\d*', ans)  # Find all numbers in expected answer
-        predicted_numbers = re.findall(r'-?\d+\.?\d*', sol)  # Find all numbers in predicted answer
-
-        if len(expected_numbers) == len(predicted_numbers) and all(
-            abs(float(pred) - float(exp)) < 1e-4 for pred, exp in zip(predicted_numbers, expected_numbers)
-        ):
-           reward = 0.6
-    else:
-        reward = 0
-
-    return reward
+    from realhf.impl.dataset.math_parser import math_equal
+    if math_equal(sol, ans):
+        print(f"completions: {completions}, answer: {answer}")
+        return 1
+    return 0