Spaces:

Omkar1806
/

code

Running

App Files Community

Omkar1806 committed on 10 days ago

Commit

c5fdb67

verified ·

1 Parent(s): 1d620e0

Update env.py

Browse files

Files changed (1) hide show

env.py +31 -28

env.py CHANGED Viewed

@@ -1,5 +1,4 @@
 from typing import List, Dict, Any, Tuple
-import random
 URGENCY_LABELS = ["low", "medium", "high"]
 ROUTING_LABELS = ["general", "support", "security"]
@@ -13,42 +12,50 @@ class EmailTriageEnv:
         self._index = 0
         self._done = False
-    # ✅ TASK-WISE DATA (required for grader)
     def _generate_emails(self) -> List[Dict]:
-        task_data = {
-            "easy": [
                 {"description": "Password reset not working", "label": [2, 1, 2]},
                 {"description": "Billing refund request", "label": [1, 2, 2]},
-                {"description": "App is slow and buggy", "label": [0, 1, 1]},
-            ],
-            "medium": [
                 {"description": "Password reset not working", "label": [2, 1, 2]},
                 {"description": "Billing refund request", "label": [1, 2, 2]},
-                {"description": "App is slow and buggy", "label": [0, 1, 1]},
                 {"description": "Possible phishing attempt detected", "label": [2, 2, 2]},
-                {"description": "Invoice mismatch and payment issue", "label": [1, 2, 2]},
-            ],
-            "hard": [
                 {"description": "Password reset not working", "label": [2, 1, 2]},
                 {"description": "Billing refund request", "label": [1, 2, 2]},
-                {"description": "App is slow and buggy", "label": [0, 1, 1]},
                 {"description": "Possible phishing attempt detected", "label": [2, 2, 2]},
-                {"description": "Invoice mismatch and payment issue", "label": [1, 2, 2]},
-                {"description": "Ransomware attack suspected on system", "label": [2, 2, 2]},
-                {"description": "User reports data breach and performance issues", "label": [2, 2, 2]},
-            ],
-        }
-        emails = task_data.get(self.task, task_data["easy"])
-        random.shuffle(emails)
-        return emails
-    # ✅ RESET
     def reset(self) -> Dict[str, Any]:
         self._queue = self._generate_emails()
         self._index = 0
         self._done = False
-        return self.state()
     # ✅ STATE
     def state(self) -> Dict[str, Any]:
@@ -63,21 +70,17 @@ class EmailTriageEnv:
             "done": False
         }
-    # ✅ STEP (GRADER LOGIC)
     def step(self, action: List[int]) -> Tuple[Dict, float, bool, Dict, Dict]:
         if self._done:
             return self.state(), 0.0, True, {}, {}
         correct = self._queue[self._index]["label"]
-        # 🎯 PARTIAL REWARD (important)
         matches = sum(1 for a, b in zip(action, correct) if a == b)
         reward = matches / 3.0  # normalized [0,1]
-        # 🔥 BONUS for perfect prediction
-        if matches == 3:
-            reward = 1.0
         self._index += 1
         if self._index >= len(self._queue):

 from typing import List, Dict, Any, Tuple
 URGENCY_LABELS = ["low", "medium", "high"]
 ROUTING_LABELS = ["general", "support", "security"]
         self._index = 0
         self._done = False
+    # ✅ EXPLICIT TASK DATA (NO RANDOMNESS)
     def _generate_emails(self) -> List[Dict]:
+        if self.task == "easy":
+            return [
                 {"description": "Password reset not working", "label": [2, 1, 2]},
                 {"description": "Billing refund request", "label": [1, 2, 2]},
+                {"description": "App is slow", "label": [0, 1, 1]},
+            ]
+        elif self.task == "medium":
+            return [
                 {"description": "Password reset not working", "label": [2, 1, 2]},
                 {"description": "Billing refund request", "label": [1, 2, 2]},
+                {"description": "App is slow", "label": [0, 1, 1]},
                 {"description": "Possible phishing attempt detected", "label": [2, 2, 2]},
+                {"description": "Invoice mismatch issue", "label": [1, 2, 2]},
+            ]
+        elif self.task == "hard":
+            return [
                 {"description": "Password reset not working", "label": [2, 1, 2]},
                 {"description": "Billing refund request", "label": [1, 2, 2]},
+                {"description": "App is slow", "label": [0, 1, 1]},
                 {"description": "Possible phishing attempt detected", "label": [2, 2, 2]},
+                {"description": "Invoice mismatch issue", "label": [1, 2, 2]},
+                {"description": "Ransomware attack suspected", "label": [2, 2, 2]},
+                {"description": "Data breach reported", "label": [2, 2, 2]},
+            ]
+        else:
+            return []
+    # ✅ RESET (DETERMINISTIC)
     def reset(self) -> Dict[str, Any]:
         self._queue = self._generate_emails()
         self._index = 0
         self._done = False
+        return {
+            "description": self._queue[self._index]["description"],
+            "step": 0,
+            "remaining": len(self._queue),
+            "done": False
+        }
     # ✅ STATE
     def state(self) -> Dict[str, Any]:
             "done": False
         }
+    # ✅ STEP (CLEAR GRADER)
     def step(self, action: List[int]) -> Tuple[Dict, float, bool, Dict, Dict]:
         if self._done:
             return self.state(), 0.0, True, {}, {}
         correct = self._queue[self._index]["label"]
+        # 🎯 GRADER (CLEAR + NORMALIZED)
         matches = sum(1 for a, b in zip(action, correct) if a == b)
         reward = matches / 3.0  # normalized [0,1]
         self._index += 1
         if self._index >= len(self._queue):