Spaces:

rahul2124
/

sql-arena

Running

rahul2124 committed 12 days ago

Commit

ac49ad8

verified ·

1 Parent(s): 72e26c9

Upload folder using huggingface_hub

Files changed (5) hide show

.pytest_cache/v/cache/lastfailed ADDED Viewed

	@@ -0,0 +1 @@


1	+ {}

inference.py CHANGED Viewed

@@ -182,6 +182,11 @@ def run_task(client: OpenAI, env: SQLArenaEnvironment, task_config: dict) -> flo
                 break
         final_score = min(max(best_score, 0.0), 1.0)
         success = final_score >= 0.5
     except Exception as e:

                 break
         final_score = min(max(best_score, 0.0), 1.0)
+        # Clamp to strictly between 0 and 1
+        if final_score <= 0.0:
+            final_score = 0.01
+        if final_score >= 1.0:
+            final_score = 0.99
         success = final_score >= 0.5
     except Exception as e:

src/sql_arena/environment.py CHANGED Viewed

@@ -136,6 +136,12 @@ class SQLArenaEnvironment:
             reward = score * 0.5 + improvement * 0.5
         reward = round(min(max(reward, 0.0), 1.0), 4)
         state.rewards_history.append(reward)
         state.total_reward += reward

             reward = score * 0.5 + improvement * 0.5
         reward = round(min(max(reward, 0.0), 1.0), 4)
+        # Clamp to strictly between 0 and 1
+        if reward <= 0.0:
+            reward = 0.01
+        if reward >= 1.0:
+            reward = 0.99
         state.rewards_history.append(reward)
         state.total_reward += reward

src/sql_arena/graders.py CHANGED Viewed

@@ -194,6 +194,10 @@ def grade_result(
     # ---- Final score ----
     score = round(min(max(score, 0.0), 1.0), 4)
     feedback_parts.append(f"\nTotal Score: {score:.2f}/1.00")
     return score, "\n".join(feedback_parts)

     # ---- Final score ----
     score = round(min(max(score, 0.0), 1.0), 4)
+    if score <= 0.0:
+        score = 0.01
+    if score >= 1.0:
+        score = 0.99
     feedback_parts.append(f"\nTotal Score: {score:.2f}/1.00")
     return score, "\n".join(feedback_parts)

tests/test_env.py CHANGED Viewed

@@ -32,7 +32,7 @@ class TestEnvironmentBasics:
         self.env.reset(difficulty="basic_select", task_id="easy_001")
         action = SQLArenaAction(sql_query="INVALID SQL QUERY")
         result = self.env.step(action)
-        assert result.reward == 0.0
         assert result.observation.error_message is not None
     def test_state_tracking(self):

         self.env.reset(difficulty="basic_select", task_id="easy_001")
         action = SQLArenaAction(sql_query="INVALID SQL QUERY")
         result = self.env.step(action)
+        assert result.reward == 0.01  # Clamped to strictly > 0
         assert result.observation.error_message is not None
     def test_state_tracking(self):