Spaces:

Benny-Tang
/

exam-simulator

Runtime error

App Files Files Community

Benny-Tang committed on Sep 14, 2025

Commit

61f8c8e

verified ·

1 Parent(s): 09e298e

Update agents.py

Browse files

Files changed (1) hide show

agents.py +173 -68

agents.py CHANGED Viewed

@@ -1,94 +1,199 @@
-import random
 import os
-import requests
 class AnalyzerAgent:
-    def analyze(self, per_question):
-        topics = {}
         for qid, info in per_question.items():
-            if not info["topics"]:
-                continue
-            for topic in info["topics"]:
-                if topic not in topics:
-                    topics[topic] = {"correct": 0, "total": 0}
-                topics[topic]["total"] += 1
-                if info["user"] == info["correct"]:
-                    topics[topic]["correct"] += 1
         return {
-            topic: {
-                "accuracy": round(v["correct"] / v["total"] * 100, 2) if v["total"] > 0 else 0,
-                "attempted": v["total"],
-            }
-            for topic, v in topics.items()
         }
 class CoachAgent:
-    def coach(self, analysis, level, subject):
-        weak = [t for t, v in analysis.items() if v["accuracy"] < 50]
         if not weak:
-            return {"message": f"Great job! Keep revising {subject} topics at {level} level."}
         return {
-            "message": f"Focus on improving these weak topics in {subject} ({level}): {', '.join(weak)}"
         }
 class PredictiveAgent:
     def __init__(self):
-        self.api_key = os.getenv("zhipuai_api_key")
-        self.url = "https://open.bigmodel.cn/api/paas/v4/chat/completions"
-    def predict(self, subject, level, count=5):
-        """Generate placeholder predicted questions (fallback to real LLM when available)."""
-        if not self.api_key:
-            return [
-                {
-                    "id": 900000 + i,
-                    "text": f"Practice predicted question on {subject} (placeholder) #{i+1}",
-                    "choices": ["A", "B", "C", "D"],
-                    "topics": ["general"],
-                    "correct_answer": None,
-                }
-                for i in range(count)
-            ]
-        headers = {"Authorization": f"Bearer {self.api_key}", "Content-Type": "application/json"}
-        body = {
-            "model": "glm-4-5",
-            "messages": [
-                {
-                    "role": "user",
-                    "content": f"Generate {count} predicted SPM {subject} questions for {level} with multiple-choice answers.",
-                }
-            ],
-        }
-        try:
-            resp = requests.post(self.url, headers=headers, json=body, timeout=30)
-            data = resp.json()
-            text = data.get("choices", [{}])[0].get("message", {}).get("content", "")
-        except Exception as e:
-            print("⚠️ PredictiveAgent error:", e)
-            text = ""
-        # Placeholder output
-        return [
-            {
-                "id": 900000 + i,
-                "text": f"Predicted question #{i+1} for {subject} ({level})",
-                "choices": ["A", "B", "C", "D"],
-                "topics": ["general"],
-                "correct_answer": None,
             }
-            for i in range(count)
-        ]
-    def summary(self, level, subject):
         return {
-            "subject": subject,
             "level": level,
-            "trend": f"Predicted hot topics for {subject} ({level}) are vocabulary, problem solving, and essay writing.",
         }

 import os
+import random
+from collections import Counter, defaultdict
+from typing import List, Dict, Any
+# Accept both environment variable names (old/new)
+GLM_API_KEY = os.getenv("ZHIPUAI_API_KEY") or os.getenv("zhipuai_api_key")
 class AnalyzerAgent:
+    """
+    Analyze a per-question map: {qid: {"user":..., "correct":..., "topics":[...] }}
+    Return topic-level accuracy and weak topic suggestions.
+    """
+    def analyze(self, per_question: Dict[str, Dict[str, Any]]) -> Dict[str, Any]:
+        topic_stats = {}
         for qid, info in per_question.items():
+            topics = info.get("topics", []) or []
+            user = info.get("user")
+            correct = info.get("correct")
+            is_correct = (correct is not None and user is not None and str(user).strip() == str(correct).strip())
+            for t in topics:
+                if t not in topic_stats:
+                    topic_stats[t] = {"correct": 0, "total": 0}
+                topic_stats[t]["total"] += 1
+                if is_correct:
+                    topic_stats[t]["correct"] += 1
+        topic_accuracy = {}
+        weak_topics = []
+        for t, stats in topic_stats.items():
+            total = stats["total"]
+            correct = stats["correct"]
+            acc = round((correct / total) * 100, 2) if total > 0 else 0.0
+            topic_accuracy[t] = {"accuracy_percent": acc, "total": total}
+            if total >= 3 and acc < 65.0:
+                weak_topics.append(t)
+        recommendation = "Focus on: " + ", ".join(weak_topics) if weak_topics else "No major weak topics detected. Keep practicing."
         return {
+            "topic_accuracy": topic_accuracy,
+            "weak_topics": weak_topics,
+            "recommendation": recommendation
         }
 class CoachAgent:
+    """
+    Provide short coaching tips & up to 3 practice prompts (not full solutions).
+    """
+    def coach(self, analysis: Dict[str, Any], level: str, subject: str) -> Dict[str, Any]:
+        weak = analysis.get("weak_topics", [])
+        tips = []
         if not weak:
+            tips = [
+                "Revise major topics and practice mixed problem sets.",
+                "Time yourself during mock papers to improve speed.",
+                "Review wrong answers and understand reasoning."
+            ]
+        else:
+            tips = [
+                f"Spend 20–30 minutes daily on {weak[0]} (break it into small tasks).",
+                "Do targeted practice sets and review short solutions.",
+                "Explain concepts aloud or teach a peer — that cements understanding."
+            ]
+        practice_questions = []
+        # create a few simple practice questions (templates) for weakest topics
+        for i, top in enumerate(weak[:3], start=1):
+            practice_questions.append({
+                "text": f"Practice item on {top}: (short question to test {top})",
+                "choices": ["A", "B", "C", "D"],
+                "answer": None,
+                "explanation": None,
+                "topic": top
+            })
         return {
+            "tips": tips,
+            "study_plan": "20 minutes daily for weak topics + weekly full mock",
+            "practice_questions": practice_questions
         }
 class PredictiveAgent:
+    """
+    Produce predicted SPM-style MCQs (in-memory only).
+    Falls back to heuristic generation when no LLM API is available.
+    Usage:
+        generate_predictions(level, subject, n, question_bank)
+        summary(level, subject, question_bank)
+    """
     def __init__(self):
+        self.api_key = GLM_API_KEY
+    def _top_topics_from_bank(self, question_bank: List[Dict], subject_display: str, top_k=6):
+        # subject_display e.g. "BM"
+        subj_key = f"Form5_{subject_display}"
+        counter = Counter()
+        total = 0
+        for q in question_bank:
+            if q.get("subject") != subj_key:
+                continue
+            total += 1
+            for t in q.get("topics", []):
+                counter[t] += 1
+        if total == 0:
+            return []
+        return [t for t, _ in counter.most_common(top_k)]
+    def generate_predictions(self, level: str, subject: str, n: int = 5, question_bank: List[Dict] = None) -> List[Dict]:
+        """
+        Returns a list of predicted question dicts:
+        { id, text, choices, correct_answer, topics, difficulty, source, confidence }
+        Predictions are only in memory.
+        """
+        preds = []
+        base_id = 900000
+        topics = []
+        if question_bank:
+            topics = self._top_topics_from_bank(question_bank, subject, top_k=10)
+        # if no topics found, fallback to generic topic tokens
+        if not topics:
+            fallback = {
+                "BM": ["perbendaharaan_kata", "tatabahasa"],
+                "English": ["vocabulary", "grammar"],
+                "Math": ["algebra", "geometry"],
+                "History": ["events", "dates"],
+                "Science": ["physics", "chemistry"],
+                "MoralStudies": ["ethics", "values"]
             }
+            topics = fallback.get(subject, ["general"])
+        # heuristic generation tailored by subject
+        for i in range(n):
+            t = topics[i % len(topics)]
+            qobj = self._make_sample_question(subject, t, idx=i + 1)
+            qobj["id"] = base_id + i
+            qobj["source"] = "predicted"
+            qobj["confidence"] = round(random.uniform(0.35, 0.75), 2)
+            preds.append(qobj)
+        return preds
+    def _make_sample_question(self, subject: str, topic: str, idx: int) -> Dict:
+        """
+        Heuristic templates to make predicted questions look natural.
+        These are conservative templates — they are not official exam questions.
+        """
+        if subject == "BM":
+            text = f"Pilih sinonim bagi perkataan '{['gembira','besar','kecil','cepat'][idx % 4]}'."
+            choices = ["Sedih", "Gembira", "Marah", "Letih"]
+            correct = "Gembira"
+        elif subject == "English":
+            text = f"Choose the correct synonym for 'happy'."
+            choices = ["Sad", "Joyful", "Angry", "Tired"]
+            correct = "Joyful"
+        elif subject == "Math":
+            text = f"If 2x + 3 = 11, what is x?"
+            choices = ["2", "3", "4", "5"]
+            correct = "4"
+        elif subject == "Science":
+            text = f"What is the SI unit of force?"
+            choices = ["Joule", "Newton", "Pascal", "Watt"]
+            correct = "Newton"
+        elif subject == "History":
+            text = f"In which year did [event] occur? (predictive-sample)"
+            choices = ["1945", "1957", "1963", "1975"]
+            correct = "1957"
+        elif subject == "MoralStudies":
+            text = "Which value is most associated with mutual respect?"
+            choices = ["Greed", "Respect", "Laziness", "Selfishness"]
+            correct = "Respect"
+        else:
+            text = f"Sample predicted question on {topic}."
+            choices = ["A", "B", "C", "D"]
+            correct = choices[0]
         return {
+            "text": text,
+            "choices": choices,
+            "correct_answer": correct,
+            "topics": [topic],
+            "difficulty": 3
+        }
+    def summary(self, level: str, subject: str, question_bank: List[Dict] = None) -> Dict:
+        topics = self._top_topics_from_bank(question_bank, subject) if question_bank else []
+        return {
             "level": level,
+            "subject": subject,
+            "top_topics_from_bank": topics,
+            "note": "Predictions are heuristics or LLM-based forecasts; treat as practice material, not guarantees."
         }