Rajeev Ranjan Pandey committed
Commit 7976e9d · 1 Parent(s): 5378bb9

fix: restore working copy/save buttons in dark mode and elevate model prompt styling

frontend/src/components/SummarizerWidget.jsx CHANGED
@@ -179,13 +179,13 @@ export default function SummarizerWidget({
   <div className="mt-5 flex flex-wrap gap-3 border-t border-white/5 pt-4">
     <button
       onClick={handleCopy}
-      className="flex-1 flex justify-center items-center gap-2 rounded-xl bg-slate-100 dark:bg-white/8 hover:bg-slate-200 dark:hover:bg-white/12 py-3 text-sm font-bold text-slate-700 dark:text-white transition border border-slate-200 dark:border-white/10"
+      className="flex-1 flex justify-center items-center gap-2 rounded-xl bg-slate-100 dark:bg-white/[0.08] hover:bg-slate-200 dark:hover:bg-white/[0.12] py-3 text-sm font-bold text-slate-700 dark:text-white transition border border-slate-200 dark:border-white/10"
     >
       {copied ? <CheckCircle2 size={16}/> : <Copy size={16} />} {copied ? "Copied" : "Copy Summary"}
     </button>
     <button
       onClick={() => downloadTextFile(`summary_${modelChoice}.txt`, summary)}
-      className="flex-1 flex justify-center items-center gap-2 rounded-xl border border-slate-200 dark:border-white/10 bg-white dark:bg-transparent py-3 text-sm font-bold text-slate-600 dark:text-slate-300 transition hover:bg-white/5"
+      className="flex-1 flex justify-center items-center gap-2 rounded-xl border border-slate-200 dark:border-white/10 bg-white dark:bg-transparent py-3 text-sm font-bold text-slate-600 dark:text-slate-300 transition hover:bg-slate-50 dark:hover:bg-white/[0.05]"
     >
       <Download size={16} /> Save
     </button>
 
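Why this restores the buttons: 8 and 12 are not steps on Tailwind's default opacity scale, so on Tailwind v3 (which this project appears to use) dark:bg-white/8 and dark:hover:bg-white/12 compile to nothing and the buttons rendered with no dark-mode background at all. The arbitrary-value forms white/[0.08] and white/[0.12] always generate CSS. The Save button also trades the barely-visible hover:bg-white/5 for a proper pair of hover states (hover:bg-slate-50 in light mode, dark:hover:bg-white/[0.05] in dark).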
frontend/src/pages/Home.jsx CHANGED
@@ -13,7 +13,11 @@ const FALLBACK_TEXT = {
 };
 
 export default function Home() {
-  const [isDark, setIsDark] = useState(true);
+  const [isDark, setIsDark] = useState(() => {
+    // Apply immediately, before first paint, so dark: variants work on load
+    document.documentElement.classList.add("dark");
+    return true;
+  });
   const [datasetTrack, setDatasetTrack] = useState("gcc");
   const [text, setText] = useState(FALLBACK_TEXT.gcc);
   const [modelChoice, setModelChoice] = useState("bart_large_cnn");
@@ -29,9 +33,9 @@ export default function Home() {
   useEffect(() => { datasetTrackRef.current = datasetTrack; }, [datasetTrack]);
   useEffect(() => { modelChoiceRef.current = modelChoice; }, [modelChoice]);
 
+  // Keep the dark class in sync when the user toggles
   useEffect(() => {
-    if (isDark) document.documentElement.classList.add("dark");
-    else document.documentElement.classList.remove("dark");
+    document.documentElement.classList.toggle("dark", isDark);
   }, [isDark]);
 
   useEffect(() => {
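Why the initializer trick works: useEffect runs after the browser has painted, so with the old code the first frame rendered before the dark class was on <html> and every dark: variant missed. The side effect inside the useState initializer runs synchronously during the first render, ahead of paint; the effect below then only has to keep the class in sync with later toggles.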
src/models/abstractive.py CHANGED
@@ -7,20 +7,23 @@ from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
 from src.data.utils import load_config
 
 # ── Per-model instruction prefixes ────────────────────────────────────────────
-# Prepended to raw incident text so models rewrite instead of echo.
+# Changed prompting to be highly professional, requesting a "classy",
+# high-impact executive tone suitable for official intelligence reports.
 _MODEL_PROMPTS: dict[str, str] = {
     "bart_large_cnn": (
-        "Generate a concise traffic incident summary. "
-        "Report only: location, incident type, severity, and road impact. "
-        "Be brief. Incident report: "
+        "Re-write the following traffic event into a highly professional executive "
+        "incident brief. Focus on creating an impactful, formal summary highlighting "
+        "severity and operational disruption: "
     ),
     "flan_t5_small": (
-        "Write a one-sentence traffic incident summary covering location, "
-        "incident type, severity level, and road impact in under 35 words. "
-        "Traffic report: "
+        "Task: Create a professional, high-impact Executive Traffic Intelligence Brief "
+        "from the following incident. Emphasize severity, exact location, and direct "
+        "consequences in a formal tone. "
+        "Incident details: "
     ),
     "pegasus_cnn": (
-        "Summarize the key facts from this traffic incident in one compact sentence: "
+        "Generate a formal, impactful Traffic Intelligence Report summarizing the key "
+        "operational facts from this incident: "
     ),
 }
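For context, a minimal sketch of how a prefix presumably reaches the model; build_source_text is hypothetical (the diff only shows source_text being consumed further down), and _MODEL_PROMPTS is the dict from the hunk above:

    # Hypothetical plumbing: prepend the per-model instruction prefix to the
    # cleaned incident text before tokenization (names assumed, not from the diff).
    def build_source_text(clean_text: str, model_name: str) -> str:
        prefix = _MODEL_PROMPTS.get(model_name, "")  # empty prefix if unknown model
        return prefix + clean_text

    incident = "I-95 NB closed at Exit 12 after a multi-vehicle collision."
    print(build_source_text(incident, "flan_t5_small"))
    # -> "Task: Create a professional, high-impact Executive Traffic Intelligence
    #     Brief ... Incident details: I-95 NB closed at Exit 12 ..."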
 
@@ -55,7 +58,7 @@ def build_generation_config(model_name: str, config_path: str = "config.yaml"):
         min_new_tokens=gen_cfg["default_min_new_tokens"],
         max_new_tokens=gen_cfg["default_max_new_tokens"],
         num_beams=gen_cfg["num_beams"],
-        length_penalty=gen_cfg["length_penalty"],
+        length_penalty=1.0,  # Reverted length_penalty to 1.0 (the default) for natural flow
         no_repeat_ngram_size=gen_cfg["no_repeat_ngram_size"],
         early_stopping=gen_cfg["early_stopping"],
         prompt_prefix=model_cfg.get("prompt_prefix", ""),
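Worth spelling out what this revert does: in Hugging Face beam search, a finished beam's score is its summed log-probability divided by length ** length_penalty. Log-probabilities are negative, so exponents above 1.0 shrink long beams' scores toward zero and therefore favor longer candidates, not shorter ones. A small sketch of the arithmetic (scores are illustrative):

    # Beam scoring as Hugging Face applies length_penalty (illustrative numbers).
    def beam_score(sum_logprob: float, length: int, length_penalty: float) -> float:
        return sum_logprob / (length ** length_penalty)

    for lp in (1.0, 3.0):
        short = beam_score(-8.0, length=20, length_penalty=lp)
        long = beam_score(-20.0, length=45, length_penalty=lp)
        print(lp, "short wins" if short > long else "long wins")
    # 1.0 -> short wins (-0.400 vs -0.444)
    # 3.0 -> long wins  (-1.0e-03 vs -2.2e-04)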
@@ -73,10 +76,9 @@ def generate_summary(text: str, model_name: str, config_path: str = "config.yaml
     encoded = tokenizer(source_text, truncation=True, max_length=gen.max_input_tokens, return_tensors="pt")
     encoded = {k: v.to(get_device()) for k, v in encoded.items()}
 
-    # Dynamic cap: limit output to 50 % of raw input token count to force compression.
-    raw_len = tokenizer(clean_text, return_tensors="pt")["input_ids"].shape[-1]
-    dynamic_max = max(gen.min_new_tokens, min(int(raw_len * 0.50), gen.max_new_tokens))
-    actual_max_tokens = max_new_tokens or dynamic_max
+    # Cap at the configured max_new_tokens. The previous dynamic cap forced the
+    # models to behave oddly or copy; instead, let the model use its own stopping logic.
+    actual_max_tokens = max_new_tokens or gen.max_new_tokens
 
     with torch.inference_mode():
         output_ids = model.generate(
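A quick worked example of the cap being removed, with illustrative config values:

    # Old behaviour: a 120-token report was capped at 60 generated tokens.
    min_new_tokens, max_new_tokens = 20, 128   # illustrative config values
    raw_len = 120                              # token count of the raw input

    dynamic_max = max(min_new_tokens, min(int(raw_len * 0.50), max_new_tokens))
    print(dynamic_max)       # 60

    # New behaviour: the configured ceiling applies regardless of input length.
    print(max_new_tokens)    # 128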
@@ -84,12 +86,22 @@ def generate_summary(text: str, model_name: str, config_path: str = "config.yaml
             min_new_tokens=gen.min_new_tokens,
             max_new_tokens=actual_max_tokens,
             num_beams=gen.num_beams,
-            length_penalty=3.0,       # strongly prefers concise outputs
-            no_repeat_ngram_size=4,   # blocks 4-gram copying from input
+            length_penalty=gen.length_penalty,
+            no_repeat_ngram_size=gen.no_repeat_ngram_size,
             early_stopping=True,
         )
     output_text = " ".join(tokenizer.decode(output_ids[0], skip_special_tokens=True).split())
 
+    # Strip the instruction template echo
+    for prefix in _MODEL_PROMPTS.values():
+        if output_text.lower().startswith(prefix.replace("Task: ", "").lower().strip()[:20]):
+            output_text = output_text[len(prefix):].strip()
+
+    # Generic stripping of prefixes the models sometimes generate
+    output_text = output_text.replace("Executive Incident Brief:", "")
+    output_text = output_text.replace("Traffic Intelligence Report:", "")
+    output_text = output_text.replace("Incident report:", "")
+
     # Strip known hallucinations
     hallucinations = [
         "For confidential support call the Samaritans in the UK on 08457 90 90 90, visit a local Samaritans branch or click here for details.",
@@ -103,7 +115,6 @@ def generate_summary(text: str, model_name: str, config_path: str = "config.yaml
 
     return " ".join(output_text.split())
 
-
 def available_abstractive_models(config_path: str = "config.yaml") -> List[str]:
     cfg = load_config(config_path)
     return [name for name, meta in cfg["models"].items() if meta.get("enabled", False)]
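A quick trace of the echo-stripping heuristic added above (the echoed output string is invented): the match runs on only the first 20 characters of the normalized prefix, which tolerates small truncations, and a hit removes the full prefix length. _MODEL_PROMPTS is the dict defined at the top of this file:

    prefix = _MODEL_PROMPTS["bart_large_cnn"]
    probe = prefix.replace("Task: ", "").lower().strip()[:20]
    print(probe)             # "re-write the followi"

    echoed = prefix + "I-95 NB closed at Exit 12 after a multi-vehicle collision."
    if echoed.lower().startswith(probe):
        echoed = echoed[len(prefix):].strip()
    print(echoed)            # "I-95 NB closed at Exit 12 after a multi-vehicle collision."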
 