Spaces:

Timusgeorge
/

SynthAudit-Env

Sleeping

Timusgeorge committed 17 days ago

Commit

c204411

verified ·

1 Parent(s): f095b05

Deploy inference.py with all fixes

Files changed (1) hide show

inference.py CHANGED Viewed

@@ -219,7 +219,9 @@ def run_heuristic_task(task_id: str, task_name: str, seed: int) -> float:
         score = obs.score_so_far
         print(f"[STEP] step={step} reward={obs.reward:.3f}", flush=True)
-    print(f"[END] task={task_id} score={score:.2f} steps={step}", flush=True)
     return score
@@ -374,7 +376,9 @@ def run_react_task(llm, task_id: str, task_name: str, seed: int) -> float:
         score = obs.score_so_far
         print(f"[STEP] step={step} reward={obs.reward:.3f}", flush=True)
-    print(f"[END] task={task_id} score={score:.2f} steps={step}", flush=True)
     return score

         score = obs.score_so_far
         print(f"[STEP] step={step} reward={obs.reward:.3f}", flush=True)
+    # CRITICAL: Clamp score strictly between 0 and 1 (exclusive)
+    score = min(0.99, max(0.01, score))
+    print(f"[END] task={task_id} score={score:.4f} steps={step}", flush=True)
     return score
         score = obs.score_so_far
         print(f"[STEP] step={step} reward={obs.reward:.3f}", flush=True)
+    # CRITICAL: Clamp score strictly between 0 and 1 (exclusive)
+    score = min(0.99, max(0.01, score))
+    print(f"[END] task={task_id} score={score:.4f} steps={step}", flush=True)
     return score