Spaces:

anugrah55
/

data_clean_env

Sleeping

anugrah55 committed about 1 month ago

Commit

656cb14

verified ·

1 Parent(s): 81fb5f6

Fix score decimal formatting to strictly 2 places

Files changed (1) hide show

inference.py CHANGED Viewed

@@ -15,7 +15,7 @@ HF_TOKEN = os.getenv("HF_TOKEN")
 BENCHMARK = "data_clean_env"
 MAX_STEPS = 10
-TEMPERATURE = 0.7
 SYSTEM_PROMPT = textwrap.dedent(
     """
@@ -54,7 +54,7 @@ def log_step(step: int, action: str, reward: float, done: bool, error: Optional[
 def log_end(success: bool, steps: int, score: float, rewards: List[float]) -> None:
     rewards_str = ",".join(f"{r:.2f}" for r in rewards)
-    print(f"[END] success={str(success).lower()} steps={steps} score={score:.3f} rewards={rewards_str}", flush=True)
 def get_model_action(client: OpenAI, obs_dict: dict) -> dict:
     user_prompt = f"Observation:\n{json.dumps(obs_dict, indent=2)}\nWhat is your next action?"

 BENCHMARK = "data_clean_env"
 MAX_STEPS = 10
+TEMPERATURE = 0.0
 SYSTEM_PROMPT = textwrap.dedent(
     """
 def log_end(success: bool, steps: int, score: float, rewards: List[float]) -> None:
     rewards_str = ",".join(f"{r:.2f}" for r in rewards)
+    print(f"[END] success={str(success).lower()} steps={steps} score={score:.2f} rewards={rewards_str}", flush=True)
 def get_model_action(client: OpenAI, obs_dict: dict) -> dict:
     user_prompt = f"Observation:\n{json.dumps(obs_dict, indent=2)}\nWhat is your next action?"