Elliot89 committed on
Commit
4591acd
·
verified ·
1 Parent(s): b89411e

Update inference.py

Browse files
Files changed (1) hide show
  1. inference.py +5 -2
inference.py CHANGED
@@ -554,8 +554,10 @@ def _run_episode_structured(task_id: str, scenario_index: int) -> tuple[float, i
554
  flush=True,
555
  )
556
 
557
- # ── [END] ── (always emitted, even on exception)
558
- success_str = "true" if score > 0 else "false"
 
 
559
  rewards_str = ",".join(f"{rw:.2f}" for rw in rewards_list)
560
  print(
561
  f"[END] success={success_str} steps={steps_used} "
@@ -563,6 +565,7 @@ def _run_episode_structured(task_id: str, scenario_index: int) -> tuple[float, i
563
  flush=True,
564
  )
565
 
 
566
  return score, steps_used, rewards_list
567
 
568
 
 
554
  flush=True,
555
  )
556
 
557
+ # ── [END] ── (always emitted, even on exception)
558
+ # Clamp score to open interval (0, 1) for validator compliance
559
+ score = max(0.01, min(0.99, score))
560
+ success_str = "true" if score > 0.01 else "false"
561
  rewards_str = ",".join(f"{rw:.2f}" for rw in rewards_list)
562
  print(
563
  f"[END] success={success_str} steps={steps_used} "
 
565
  flush=True,
566
  )
567
 
568
+
569
  return score, steps_used, rewards_list
570
 
571