Spaces:

MridulNegi2005
/

negotiation-openenv

Sleeping

MridulNegi2005 committed on Apr 6

Commit

332cfd0

1 Parent(s): 4ad3f24

Fix [END] format: restore score= field, add flush=True to all log prints

Files changed (1) hide show

inference.py CHANGED Viewed

@@ -49,7 +49,7 @@ def run_task(client, model_name: str, task_config):
     )
     obs = env.reset()
-    print(f"[START] task={task_config.name} env=negotiation model={model_name}")
     done = False
     step_n = 0
@@ -153,14 +153,15 @@ Respond with ONLY your chosen action, nothing else."""
             # ── Log step (stdout — parsed by judges) ──
             log_action = action_str if not action_str.startswith("OFFER") else f"OFFER {action_price}"
-            print(f"[STEP] step={step_n} action={log_action} reward={reward:.2f} done={str(done).lower()} error={error_msg}")
     finally:
         # [END] MUST always be printed, even on exceptions
         grader = get_grader(task_config)
         result = grader.grade(rewards, step_n, deal_made)
         rewards_str = ",".join([f"{r:.2f}" for r in rewards])
-        print(f"[END] success={str(result['success']).lower()} steps={step_n} rewards={rewards_str}")
     return result

     )
     obs = env.reset()
+    print(f"[START] task={task_config.name} env=negotiation model={model_name}", flush=True)
     done = False
     step_n = 0
             # ── Log step (stdout — parsed by judges) ──
             log_action = action_str if not action_str.startswith("OFFER") else f"OFFER {action_price}"
+            print(f"[STEP] step={step_n} action={log_action} reward={reward:.2f} done={str(done).lower()} error={error_msg}", flush=True)
     finally:
         # [END] MUST always be printed, even on exceptions
         grader = get_grader(task_config)
         result = grader.grade(rewards, step_n, deal_made)
         rewards_str = ",".join([f"{r:.2f}" for r in rewards])
+        score = result['score']
+        print(f"[END] success={str(result['success']).lower()} steps={step_n} score={score:.4f} rewards={rewards_str}", flush=True)
     return result