jampuramprem committed on
Commit
e651edc
·
1 Parent(s): e7cacff

Added a fallback for missing or null score values

Browse files
Files changed (1) hide show
  1. inference.py +7 -6
inference.py CHANGED
@@ -199,15 +199,16 @@ def run_task(task_id: str, client: OpenAI) -> Dict[str, Any]:
199
  log_step(steps, action, reward, done, error)
200
 
201
  grader = http.get("/grader").json()
202
- raw_score = grader.get("score", 0.0)
203
- _EPS = 1e-6
204
- score = min(max(raw_score, _EPS), 1.0 - _EPS)
205
- log_end(success=score > _EPS, steps=steps, score=score, rewards=rewards)
 
206
 
207
  except Exception as exc:
208
  print(f"Episode error ({task_id}): {exc}", file=sys.stderr)
209
- log_end(success=False, steps=steps, score=0.0, rewards=rewards)
210
- score = 0.0
211
 
212
  return {
213
  "task_id": task_id,
 
199
  log_step(steps, action, reward, done, error)
200
 
201
  grader = http.get("/grader").json()
202
+ raw_score = grader.get("score") or 0.0
203
+ # Clamp strictly inside (0, 1): logger uses :.4f, so bounds must be
204
+ # representable without rounding to 0.0000 or 1.0000.
205
+ score = min(max(raw_score, 0.001), 0.999)
206
+ log_end(success=True, steps=steps, score=score, rewards=rewards)
207
 
208
  except Exception as exc:
209
  print(f"Episode error ({task_id}): {exc}", file=sys.stderr)
210
+ score = 0.001
211
+ log_end(success=False, steps=steps, score=score, rewards=rewards)
212
 
213
  return {
214
  "task_id": task_id,