Rajeev Ranjan Pandey committed
Commit · a543f4f
1 Parent(s): d703e0b
feat: directive prompts per model, BrainCircuit icon, info tooltip light mode fix
frontend/src/components/DatasetToggle.jsx
CHANGED
@@ -1,15 +1,15 @@
-import { Check, …
+import { Check, BrainCircuit } from "lucide-react";
 
 export default function DatasetToggle({ value, onChange }) {
   const options = [
-    { value: "gcc", label: "GCC / UAE", …
-    { value: "us", label: "US Accidents", subtitle: "5,000+ Extracted Records", …
+    { value: "gcc", label: "GCC / UAE", subtitle: "250+ Narrative Samples", flag: "🇦🇪" },
+    { value: "us", label: "US Accidents", subtitle: "5,000+ Extracted Records", flag: "🇺🇸" }
   ];
 
   return (
     <div className="rounded-2xl border border-slate-300 dark:border-white/[0.07] bg-white dark:bg-[#0d1326] p-5 shadow-sm dark:shadow-xl">
       <div className="flex items-center gap-2 mb-4 text-[10px] font-bold uppercase tracking-[0.2em] text-slate-400 dark:text-slate-500">
-        <…
+        <BrainCircuit size={13} className="text-orange-500"/> Available Datasets
       </div>
       <div className="flex flex-col gap-3">
         {options.map((option) => {
frontend/src/components/SummarizerWidget.jsx
CHANGED
@@ -223,11 +223,13 @@ export default function SummarizerWidget({
                 <Icon size={18} />
               </span>
               <div className="group/tooltip relative">
-                <div className="flex h-6 w-6 items-center justify-center rounded-full …
-                <span className="font-serif italic border border-slate-…
+                <div className="flex h-6 w-6 items-center justify-center rounded-full hover:bg-orange-50 dark:hover:bg-white/10 transition cursor-help">
+                  <span className="font-serif italic border-2 border-slate-400 dark:border-slate-500 text-slate-500 dark:text-slate-400 hover:border-orange-500 hover:text-orange-600 dark:hover:text-white rounded-full w-4 h-4 flex items-center justify-center text-[10px] transition">
+                    i
+                  </span>
                 </div>
-                <div className="absolute right-0 lg:right-auto lg:left-0 top-8 z-50 w-64 opacity-0 scale-95 origin-top-right lg:origin-top-left transition-all group-hover/tooltip:opacity-100 group-hover/tooltip:scale-100 pointer-events-none group-hover/tooltip:pointer-events-auto rounded-xl bg-…
-                <p className="text-xs text-slate-300 leading-relaxed font-normal">{model.description}</p>
+                <div className="absolute right-0 lg:right-auto lg:left-0 top-8 z-50 w-64 opacity-0 scale-95 origin-top-right lg:origin-top-left transition-all group-hover/tooltip:opacity-100 group-hover/tooltip:scale-100 pointer-events-none group-hover/tooltip:pointer-events-auto rounded-xl bg-white dark:bg-slate-800 border border-slate-200 dark:border-slate-700 p-3 shadow-xl">
+                  <p className="text-xs text-slate-700 dark:text-slate-300 leading-relaxed font-normal">{model.description}</p>
                 </div>
               </div>
             </div>
src/models/abstractive.py
CHANGED
@@ -6,6 +6,24 @@ import torch
 from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
 from src.data.utils import load_config
 
+# ── Per-model instruction prefixes ───────────────────────────────────────────
+# Prepended to raw incident text so models rewrite instead of echo.
+_MODEL_PROMPTS: dict[str, str] = {
+    "bart_large_cnn": (
+        "Generate a concise traffic incident summary. "
+        "Report only: location, incident type, severity, and road impact. "
+        "Be brief. Incident report: "
+    ),
+    "flan_t5_small": (
+        "Write a one-sentence traffic incident summary covering location, "
+        "incident type, severity level, and road impact in under 35 words. "
+        "Traffic report: "
+    ),
+    "pegasus_cnn": (
+        "Summarize the key facts from this traffic incident in one compact sentence: "
+    ),
+}
+
 @dataclass
 class GenerationConfig:
     max_input_tokens: int
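Not part of the commit: a minimal sketch of how the prefix lookup above is meant to behave. The dictionary is keyed by the app's internal model names; "some_future_model" and the "Summarize: " fallback are hypothetical stand-ins for the gen.prompt_prefix value loaded from config.yaml.

# Sketch of the _MODEL_PROMPTS fallback; "some_future_model" is invented.
_MODEL_PROMPTS = {
    "pegasus_cnn": "Summarize the key facts from this traffic incident in one compact sentence: ",
}

def pick_instruction(model_name: str, config_prefix: str) -> str:
    # Known models get their tuned directive; unknown ones keep the config prefix.
    return _MODEL_PROMPTS.get(model_name, config_prefix)

print(pick_instruction("pegasus_cnn", "Summarize: "))        # tuned directive
print(pick_instruction("some_future_model", "Summarize: "))  # falls back to config prefix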
@@ -46,14 +64,18 @@ def build_generation_config(model_name: str, config_path: str = "config.yaml"):
 def generate_summary(text: str, model_name: str, config_path: str = "config.yaml", max_new_tokens: int | None = None) -> str:
     hf_name, gen = build_generation_config(model_name, config_path)
     tokenizer, model = load_tokenizer_and_model(hf_name)
-    …
+
+    # Use model-specific rewriting instruction if available, else fall back to config prefix.
+    instruction = _MODEL_PROMPTS.get(model_name, gen.prompt_prefix)
+    clean_text = " ".join(str(text).split())
+    source_text = f"{instruction}{clean_text}"
+
     encoded = tokenizer(source_text, truncation=True, max_length=gen.max_input_tokens, return_tensors="pt")
     encoded = {k: v.to(get_device()) for k, v in encoded.items()}
 
-    # …
-    …
-    …
-    dynamic_max = max(gen.min_new_tokens, min(int(input_len * 0.55), gen.max_new_tokens))
+    # Dynamic cap: limit output to 50 % of raw input token count to force compression.
+    raw_len = tokenizer(clean_text, return_tensors="pt")["input_ids"].shape[-1]
+    dynamic_max = max(gen.min_new_tokens, min(int(raw_len * 0.50), gen.max_new_tokens))
     actual_max_tokens = max_new_tokens or dynamic_max
 
     with torch.inference_mode():
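A worked sketch of the new dynamic cap, assuming min_new_tokens=20 and max_new_tokens=96 (illustrative values only; the real ones come from config.yaml). Note that raw_len is measured on clean_text rather than source_text, so the instruction prefix does not inflate the output budget.

# Illustrative config values; config.yaml supplies the real min/max.
def dynamic_cap(raw_len: int, min_new: int = 20, max_new: int = 96) -> int:
    # Target 50 % of the input token count, clamped to [min_new, max_new].
    return max(min_new, min(int(raw_len * 0.50), max_new))

assert dynamic_cap(150) == 75  # mid-length input: 50 % compression target
assert dynamic_cap(30) == 20   # short input floors at min_new_tokens
assert dynamic_cap(400) == 96  # long input ceilings at max_new_tokens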
@@ -62,19 +84,19 @@ def generate_summary(text: str, model_name: str, config_path: str = "config.yaml", max_new_tokens: int | None = None) -> str:
         min_new_tokens=gen.min_new_tokens,
         max_new_tokens=actual_max_tokens,
         num_beams=gen.num_beams,
-        length_penalty=…
-        no_repeat_ngram_size=4,
+        length_penalty=3.0,  # strongly prefers concise outputs
+        no_repeat_ngram_size=4,  # blocks 4-gram copying from input
         early_stopping=True,
     )
     output_text = " ".join(tokenizer.decode(output_ids[0], skip_special_tokens=True).split())
 
-    # …
+    # Strip known hallucinations
     hallucinations = [
         "For confidential support call the Samaritans in the UK on 08457 90 90 90, visit a local Samaritans branch or click here for details.",
         "For confidential support call the Samaritans",
         "The cause of the collision has not been determined",
         "The incident is under investigation by Dubai Police.",
-        "The incident is currently under investigation and no further details have been released."
+        "The incident is currently under investigation and no further details have been released.",
     ]
     for h in hallucinations:
         output_text = output_text.replace(h, "").strip()
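One caveat on the inline comment above: in Hugging Face transformers, beam scores are divided by length ** length_penalty, so values above 1.0 actually favor longer hypotheses, not shorter ones; the effective brevity controls here are the directive prompts and the dynamic max_new_tokens cap. The hallucination filter itself is a plain substring-removal pass; a sketch with an invented model output:

# Invented example output; the filter deletes known boilerplate verbatim.
hallucinations = ["The incident is under investigation by Dubai Police."]
output_text = ("Two-vehicle collision on Sheikh Zayed Road caused minor delays. "
               "The incident is under investigation by Dubai Police.")
for h in hallucinations:
    output_text = output_text.replace(h, "").strip()
print(output_text)  # -> Two-vehicle collision on Sheikh Zayed Road caused minor delays.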