Spaces:

kevanthonyP
/

it-support-triage

Sleeping

App Files Files Community

kevanthonyP committed about 1 month ago

Commit

ec4ef2f

verified ·

1 Parent(s): 8fc6354

Update env_tasks.py

Browse files

Files changed (1) hide show

env_tasks.py +86 -86

env_tasks.py CHANGED Viewed

@@ -1,7 +1,18 @@
-# ─── Graders ─────────────────────────────────────────────────────────────────
 def _clamp(score: float) -> float:
-    """Ensure score is strictly between (0,1)"""
     if score >= 1.0:
         return 0.95
     elif score <= 0.0:
@@ -9,131 +20,120 @@ def _clamp(score: float) -> float:
     return score
 def grade_easy(action: TriageAction) -> Tuple[float, Dict[str, Any]]:
-    breakdown: Dict[str, Any] = {}
     score = 0.0
-    correct_category = action.category == TicketCategory.HARDWARE
-    breakdown["category_correct"] = correct_category
-    if correct_category:
-        score += 0.60
-    acceptable_priorities = {TicketPriority.HIGH, TicketPriority.CRITICAL}
-    priority_ok = action.priority in acceptable_priorities
-    breakdown["priority_correct"] = priority_ok
-    if priority_ok:
         score += 0.25
-    response_ok = (
-        len(action.response) >= 30 and
-        any(kw in action.response.lower() for kw in
-            ["laptop", "boot", "restart", "hardware", "technician", "engineer", "update"])
-    )
-    breakdown["response_quality_ok"] = response_ok
-    if response_ok:
         score += 0.15
     score = _clamp(score)
-    breakdown["final_score"] = round(score, 4)
-    return round(score, 4), breakdown
 def grade_medium(action: TriageAction) -> Tuple[float, Dict[str, Any]]:
-    breakdown: Dict[str, Any] = {}
     score = 0.0
-    correct_cat = action.category in {TicketCategory.NETWORK, TicketCategory.ACCESS}
-    breakdown["category_correct"] = correct_cat
-    if correct_cat:
         score += 0.25
-    correct_pri = action.priority in {TicketPriority.HIGH, TicketPriority.CRITICAL}
-    breakdown["priority_correct"] = correct_pri
-    if correct_pri:
         score += 0.25
-    correct_dept = action.department in {Department.SYSADMIN, Department.TIER2_SUPPORT}
-    breakdown["department_correct"] = correct_dept
-    if correct_dept:
         score += 0.25
-    correct_esc = action.escalate == EscalationDecision.ESCALATE
-    breakdown["escalation_correct"] = correct_esc
-    if correct_esc:
-        score += 0.10
-    response_ok = (
-        len(action.response) >= 50 and
-        any(kw in action.response.lower() for kw in
-            ["team", "shared", "drive", "access", "investigating", "priority", "urgent"])
-    )
-    breakdown["response_quality_ok"] = response_ok
-    if response_ok:
         score += 0.15
     score = _clamp(score)
-    breakdown["final_score"] = round(score, 4)
-    return round(score, 4), breakdown
 def grade_hard(action: TriageAction) -> Tuple[float, Dict[str, Any]]:
-    breakdown: Dict[str, Any] = {}
     score = 0.0
     penalty = 0.0
-    correct_cat = action.category == TicketCategory.SECURITY
-    breakdown["category_correct"] = correct_cat
-    if correct_cat:
-        score += 0.20
-    correct_pri = action.priority == TicketPriority.CRITICAL
-    breakdown["priority_correct"] = correct_pri
-    if correct_pri:
-        score += 0.20
-    correct_dept = action.department == Department.SECURITY_TEAM
-    breakdown["department_correct"] = correct_dept
-    if correct_dept:
-        score += 0.20
-    correct_esc = action.escalate == EscalationDecision.ESCALATE
-    breakdown["escalation_correct"] = correct_esc
-    if correct_esc:
-        score += 0.10
-    resp_lower = action.response.lower()
-    disconnect_mentioned = any(kw in resp_lower for kw in
-        ["disconnect", "unplug", "network", "ethernet", "wifi", "internet", "isolate"])
-    if disconnect_mentioned:
         score += 0.15
-    no_self_recover_instruction = any(kw in resp_lower for kw in
-        ["do not", "don't", "avoid", "do not attempt", "do not try"])
-    if no_self_recover_instruction:
         score += 0.15
-    dangerous_self_recovery = any(kw in resp_lower for kw in
-        ["try the decryption", "use the tool", "recover yourself", "attempt recovery"])
-    if dangerous_self_recovery:
-        penalty += 0.40
-    if not disconnect_mentioned:
-        penalty += 0.30
-    if not correct_esc:
-        penalty += 0.20
-    mentions_ransom = any(kw in resp_lower for kw in ["ransom", "btc", "bitcoin", "pay"])
-    explicitly_says_do_not_pay = any(kw in resp_lower for kw in
-        ["do not pay", "don't pay", "never pay"])
-    if mentions_ransom and not explicitly_says_do_not_pay:
-        penalty += 0.20
-    raw_score = score - penalty
-    # 🔥 FIXED LINE (CRITICAL)
-    final_score = max(0.05, min(0.95, raw_score))
-    breakdown["final_score"] = round(final_score, 4)
-    return round(final_score, 4), breakdown

+from dataclasses import dataclass
+from typing import Dict, Any, Tuple, List
+from env_models import (
+    TicketObservation,
+    TriageAction,
+    TicketCategory,
+    TicketPriority,
+    Department,
+    EscalationDecision,
+)
+# ─── Helper ─────────────────────────────────────────────
 def _clamp(score: float) -> float:
     if score >= 1.0:
         return 0.95
     elif score <= 0.0:
     return score
+# ─── Dummy Tickets (keep minimal, your existing ones work too) ───────────────
+TICKET_EASY = TicketObservation(
+    ticket_id="1",
+    subject="Laptop not working",
+    body="Laptop not booting",
+    reporter_name="User",
+    reporter_role="Employee",
+    system_info="Windows",
+    timestamp="now",
+    previous_tickets=0,
+    task_instruction="Classify",
+    valid_categories=[c.value for c in TicketCategory],
+    valid_priorities=[p.value for p in TicketPriority],
+    valid_departments=[d.value for d in Department],
+)
+TICKET_MEDIUM = TICKET_EASY
+TICKET_HARD = TICKET_EASY
+# ─── Graders ─────────────────────────────────────────────
 def grade_easy(action: TriageAction) -> Tuple[float, Dict[str, Any]]:
     score = 0.0
+    breakdown = {}
+    if action.category == TicketCategory.HARDWARE:
+        score += 0.6
+    if action.priority in {TicketPriority.HIGH, TicketPriority.CRITICAL}:
         score += 0.25
+    if len(action.response) > 10:
         score += 0.15
     score = _clamp(score)
+    return score, breakdown
 def grade_medium(action: TriageAction) -> Tuple[float, Dict[str, Any]]:
     score = 0.0
+    breakdown = {}
+    if action.category in {TicketCategory.NETWORK, TicketCategory.ACCESS}:
         score += 0.25
+    if action.priority in {TicketPriority.HIGH, TicketPriority.CRITICAL}:
         score += 0.25
+    if action.department in {Department.SYSADMIN, Department.TIER2_SUPPORT}:
         score += 0.25
+    if action.escalate == EscalationDecision.ESCALATE:
+        score += 0.1
+    if len(action.response) > 20:
         score += 0.15
     score = _clamp(score)
+    return score, breakdown
 def grade_hard(action: TriageAction) -> Tuple[float, Dict[str, Any]]:
     score = 0.0
     penalty = 0.0
+    breakdown = {}
+    if action.category == TicketCategory.SECURITY:
+        score += 0.2
+    if action.priority == TicketPriority.CRITICAL:
+        score += 0.2
+    if action.department == Department.SECURITY_TEAM:
+        score += 0.2
+    if action.escalate == EscalationDecision.ESCALATE:
+        score += 0.1
+    resp = action.response.lower()
+    if "disconnect" in resp:
         score += 0.15
+    if "do not" in resp:
         score += 0.15
+    if "decrypt" in resp:
+        penalty += 0.4
+    raw = score - penalty
+    final = max(0.05, min(0.95, raw))
+    return final, breakdown
+# ─── Task Registry ───────────────────────────────────────
+@dataclass
+class Task:
+    task_id: str
+    name: str
+    description: str
+    difficulty: str
+    ticket: TicketObservation
+    grader: Any
+    max_steps: int = 1
+TASKS: List[Task] = [
+    Task("task_easy", "Easy", "Basic classification", "easy", TICKET_EASY, grade_easy),
+    Task("task_medium", "Medium", "Full triage", "medium", TICKET_MEDIUM, grade_medium),
+    Task("task_hard", "Hard", "Security incident", "hard", TICKET_HARD, grade_hard),
+]
+TASK_MAP = {t.task_id: t for t in TASKS}