Spaces: Sleeping
Update inference.py
Browse files
- inference.py +5 -2
inference.py
CHANGED
|
@@ -554,8 +554,10 @@ def _run_episode_structured(task_id: str, scenario_index: int) -> tuple[float, i
|
|
| 554 |
flush=True,
|
| 555 |
)
|
| 556 |
|
| 557 |
-
|
| 558 |
-
|
|
|
|
|
|
|
| 559 |
rewards_str = ",".join(f"{rw:.2f}" for rw in rewards_list)
|
| 560 |
print(
|
| 561 |
f"[END] success={success_str} steps={steps_used} "
|
|
@@ -563,6 +565,7 @@ def _run_episode_structured(task_id: str, scenario_index: int) -> tuple[float, i
|
|
| 563 |
flush=True,
|
| 564 |
)
|
| 565 |
|
|
|
|
| 566 |
return score, steps_used, rewards_list
|
| 567 |
|
| 568 |
|
|
|
|
| 554 |
flush=True,
|
| 555 |
)
|
| 556 |
|
| 557 |
+
# ── [END] ── (always emitted, even on exception)
|
| 558 |
+
# Clamp score to open interval (0, 1) for validator compliance
|
| 559 |
+
score = max(0.01, min(0.99, score))
|
| 560 |
+
success_str = "true" if score > 0.01 else "false"
|
| 561 |
rewards_str = ",".join(f"{rw:.2f}" for rw in rewards_list)
|
| 562 |
print(
|
| 563 |
f"[END] success={success_str} steps={steps_used} "
|
|
|
|
| 565 |
flush=True,
|
| 566 |
)
|
| 567 |
|
| 568 |
+
|
| 569 |
return score, steps_used, rewards_list
|
| 570 |
|
| 571 |
|