modelbuilderhq committed on
Commit
a814a07
·
verified ·
1 Parent(s): dfc0f77

Upload folder using huggingface_hub

Browse files
Files changed (1) hide show
  1. inference.py +10 -12
inference.py CHANGED
@@ -68,13 +68,13 @@ def emit_step(step_no: int, action_text: str, reward: float, done: bool, error:
68
  )
69
 
70
 
71
- def emit_end(success: bool, steps: int, score: float, rewards: List[float]) -> None:
72
- reward_text = ",".join(f"{reward:.2f}" for reward in rewards)
73
- print(
74
- f"[END] success={str(success).lower()} steps={steps} "
75
- f"score={score:.2f} rewards={reward_text}",
76
- flush=True,
77
- )
78
 
79
 
80
  def choose_tasks(selection: str) -> Iterable[str]:
@@ -142,11 +142,9 @@ def compact_action(action: PharmaAction) -> str:
142
  return label
143
 
144
 
145
- def final_score(rewards: List[float]) -> float:
146
- if not rewards:
147
- return 0.0
148
- score = sum(rewards) / len(rewards)
149
- return min(max(round(score, 4), 0.0), 1.0)
150
 
151
 
152
  def run_one_task(llm: OpenAI, task_name: str) -> None:
 
68
  )
69
 
70
 
71
+ def emit_end(success: bool, steps: int, score: float, rewards: List[float]) -> None:
72
+ reward_text = ",".join(f"{reward:.2f}" for reward in rewards)
73
+ print(
74
+ f"[END] success={str(success).lower()} steps={steps} "
75
+ f"score={score:.6f} rewards={reward_text}",
76
+ flush=True,
77
+ )
78
 
79
 
80
  def choose_tasks(selection: str) -> Iterable[str]:
 
142
  return label
143
 
144
 
145
+ def final_score(rewards: List[float]) -> float:
146
+ score = sum(rewards) / len(rewards) if rewards else 0.0
147
+ return max(1e-6, min(score, 1 - 1e-6))
 
 
148
 
149
 
150
  def run_one_task(llm: OpenAI, task_name: str) -> None: