Spaces:

lablab-ai-amd-developer-hackathon
/

medivision-ai-agent

Running

App Files Files Community

dikheng

dikheng committed 2 days ago

Commit

ea938cc

1 Parent(s): 7bcc411

feat: 3-step agentic pipeline — A/B comparison, red-flag triage, SOAP note

Browse files

Architecture upgrade from single-prompt to 3-step micro-pipeline:
- Step 1 Vision Agent: objective visual description (supports 1 or 2 images)
- Step 2 Clinical Agent: clinical reasoning → strict triage JSON
- Step 3 Format Agent: patient-friendly message + SOAP note

New features:
- A/B Image Comparison: toggle between Standard (1 image) and Compare (2 images)
mode; Vision Agent describes progression between Day 1 and Day X
- Red-Flag Triage: flashing animated banner when triage_level == High
- SOAP Note: auto-generated structured clinical export with copy button
- Output split into Patient View tab and Export for Doctor (SOAP) tab
- Possible conditions shown as chips alongside triage severity badge

Co-Authored-By: Duy Khang <dikheng@users.noreply.huggingface.co>

Files changed (5) hide show

app.py +229 -50
src/agents.py +64 -0
src/inference.py +31 -12
src/model_loader.py +20 -15
src/prompts.py +53 -0

app.py CHANGED Viewed

@@ -60,6 +60,17 @@ _I18N = {
         "map_label":              "Anatomical Map",
         "map_select":             "click to select",
         "map_selected":           "{n} region(s) selected",
     },
     "vn": {
         "img_label":              "Tải lên hình ảnh y tế",
@@ -89,6 +100,17 @@ _I18N = {
         "map_label":              "Bản đồ giải phẫu",
         "map_select":             "nhấn để chọn",
         "map_selected":           "{n} vùng đã chọn",
     },
     "zh": {
         "img_label":              "上传医学图像",
@@ -118,6 +140,17 @@ _I18N = {
         "map_label":              "解剖图",
         "map_select":             "点击选择",
         "map_selected":           "已选 {n} 个部位",
     },
     "es": {
         "img_label":              "Subir imagen médica",
@@ -147,6 +180,17 @@ _I18N = {
         "map_label":              "Mapa anatómico",
         "map_select":             "haga clic para seleccionar",
         "map_selected":           "{n} región(es) seleccionada(s)",
     },
     "fr": {
         "img_label":              "Télécharger une image médicale",
@@ -176,6 +220,17 @@ _I18N = {
         "map_label":              "Carte anatomique",
         "map_select":             "cliquer pour sélectionner",
         "map_selected":           "{n} région(s) sélectionnée(s)",
     },
     "ja": {
         "img_label":              "医療画像をアップロード",
@@ -205,6 +260,17 @@ _I18N = {
         "map_label":              "解剖マップ",
         "map_select":             "クリックして選択",
         "map_selected":           "{n} 部位選択中",
     },
 }
@@ -515,18 +581,16 @@ def _empty_output_html(lang: str) -> str:
     )
 def _build_result_html(result: dict, lang: str) -> str:
-    t          = _I18N.get(lang, _I18N["en"])
-    diag       = result.get("diagnosis", "")
-    sev_en     = result.get("severity", "Low")
-    sev        = _SEVERITY_TRANSLATE.get(lang, _SEVERITY_TRANSLATE["en"]).get(sev_en, sev_en)
-    actions    = result.get("recommended_actions", [])
-    score      = result.get("confidence_score", 0)
-    metrics    = result.get("_metrics", {})
-    actions_html = "".join(
-        f"<li style='margin:5px 0; color:#d1d5db;'>{a}</li>" for a in actions
-    ) if actions else "<li style='color:#6b7280;'>—</li>"
     backend_tag = (
         "<span style='font-size:0.7rem; background:#052e16; color:#86efac; "
@@ -534,6 +598,39 @@ def _build_result_html(result: dict, lang: str) -> str:
         "border:1px solid #16a34a;'>AMD Cloud</span>"
     )
     return f"""
 <div style='background:#111827; border:1px solid #ED1C24; border-radius:12px;
             padding:20px; font-family:Arial,sans-serif; color:#f9fafb;'>
@@ -544,34 +641,31 @@ def _build_result_html(result: dict, lang: str) -> str:
       <div style='font-size:1.1rem; font-weight:700; color:#ED1C24;'>
         MediVision {backend_tag}
       </div>
-      <div style='font-size:0.75rem; color:#6b7280;'>AMD MI300X · ROCm · Qwen2.5-VL-7B</div>
     </div>
   </div>
   {_metrics_bar(metrics, t)}
   <div style='background:#1f2937; border-radius:8px; padding:14px; margin-bottom:12px;'>
     <div style='font-size:0.75rem; text-transform:uppercase; letter-spacing:.05em;
-                color:#9ca3af; margin-bottom:6px;'>{t['diag_label']}</div>
-    <div style='font-size:1.05rem; font-weight:600; color:#f9fafb;'>{diag}</div>
   </div>
   <div style='background:#1f2937; border-radius:8px; padding:14px; margin-bottom:12px;'>
     <div style='font-size:0.75rem; text-transform:uppercase; letter-spacing:.05em;
-                color:#9ca3af; margin-bottom:8px;'>{t['severity_label']}</div>
-    {_severity_badge(sev)}
-  </div>
-  <div style='background:#1f2937; border-radius:8px; padding:14px; margin-bottom:12px;'>
-    {_confidence_bar(score, t['confidence_label'])}
   </div>
   <div style='background:#1f2937; border-radius:8px; padding:14px; margin-bottom:12px;'>
     <div style='font-size:0.75rem; text-transform:uppercase; letter-spacing:.05em;
                 color:#9ca3af; margin-bottom:8px;'>{t['actions_label']}</div>
-    <ul style='margin:0; padding-left:20px; list-style-type:disc;'>
-      {actions_html}
-    </ul>
   </div>
   <div style='background:#1a1a2e; border-left:4px solid #ED1C24; border-radius:4px;
@@ -583,6 +677,37 @@ def _build_result_html(result: dict, lang: str) -> str:
 """
 # ---------------------------------------------------------------------------
 # UI update helpers
 # ---------------------------------------------------------------------------
@@ -615,7 +740,9 @@ def _ui_updates(lang_choice: str, current_regions=None):
         f"<p style='font-size:0.75rem; color:#6b7280; margin:4px 0 10px;'>{t['input_hint']}</p>"
     )
     return (
-        gr.update(label=t["img_label"]),
         gr.update(label=t["symptoms_label"], placeholder=t["symptoms_placeholder"]),
         gr.update(value=t["analyze_btn"]),
         gr.update(label=t["region_optional_label"], choices=new_choices, value=translated),
@@ -670,50 +797,71 @@ def on_svg_click(svg_id: str, current_regions: list, lang_choice: str) -> tuple:
 def on_lang_change(lang_choice: str, image, symptoms: str, selected_regions):
     lang = _LANG_MAP.get(lang_choice, "en")
     t = _I18N[lang]
-    img_upd, sym_upd, btn_upd, region_upd, hint_upd = _ui_updates(lang_choice, current_regions=selected_regions)
     region = _regions_to_prompt(selected_regions)
     has_content = bool(image) or bool(symptoms and symptoms.strip())
     if has_content:
         try:
-            result = get_pipeline().process(image, (symptoms or "").strip(), lang=lang, region=region)
-            out_upd = _build_result_html(result, lang)
         except Exception as exc:
-            out_upd = _error_html(t, exc)
     else:
-        out_upd = _empty_output_html(lang)
-    return img_upd, sym_upd, btn_upd, region_upd, hint_upd, out_upd, get_backend_status_html(lang)
 def on_load(request: gr.Request):
     lang_display = _detect_lang_from_header(
         request.headers.get("accept-language", "")
     )
-    img_upd, sym_upd, btn_upd, region_upd, hint_upd = _ui_updates(lang_display, current_regions=[])
     lang = _LANG_MAP.get(lang_display, "en")
-    return lang_display, img_upd, sym_upd, btn_upd, region_upd, hint_upd, _body_map_svg([], lang), _empty_output_html(lang), get_backend_status_html(lang)
 # ---------------------------------------------------------------------------
 # Predict
 # ---------------------------------------------------------------------------
-def predict(image, symptoms: str, lang_choice: str, selected_regions):
     lang = _LANG_MAP.get(lang_choice, "en")
     t = _I18N[lang]
-    if not image and not symptoms.strip():
-        return _empty_output_html(lang), get_backend_status_html(lang)
     region = _regions_to_prompt(selected_regions)
     try:
-        result = get_pipeline().process(image, symptoms.strip(), lang=lang, region=region)
-        return _build_result_html(result, lang), get_backend_status_html(lang)
     except Exception as exc:
-        return _error_html(t, exc), get_backend_status_html(lang)
 # ---------------------------------------------------------------------------
@@ -771,6 +919,10 @@ label span, .gr-form > label {
     letter-spacing: 0.04em;
 }
 footer { display: none !important; }
 ::-webkit-scrollbar { width: 6px; }
 ::-webkit-scrollbar-track { background: #111827; }
 ::-webkit-scrollbar-thumb { background: #374151; border-radius: 3px; }
@@ -914,11 +1066,24 @@ with gr.Blocks(css=CSS, theme=gr.themes.Base(), title="MediVision — Dermatolog
     with gr.Row(equal_height=False):
         with gr.Column(scale=1, min_width=300):
-            input_img = gr.Image(
-                type="filepath",
-                label="Upload Medical Image",
-                height=230,
             )
             symptoms_txt = gr.Textbox(
                 label="Symptoms Description",
                 placeholder="Describe what you feel — e.g. itchy red patch for 3 days...",
@@ -960,13 +1125,21 @@ with gr.Blocks(css=CSS, theme=gr.themes.Base(), title="MediVision — Dermatolog
             )
         with gr.Column(scale=1, min_width=340):
-            output_html = gr.HTML(
-                value=_empty_output_html("en"),
-                label="Analysis Result",
-            )
     # ── Events ───────────────────────────────────────────────────────────────
     # SVG click → toggle region in dropdown + re-render SVG
     svg_click_bridge.input(
         fn=on_svg_click,
@@ -984,20 +1157,26 @@ with gr.Blocks(css=CSS, theme=gr.themes.Base(), title="MediVision — Dermatolog
     lang_radio.change(
         fn=on_lang_change,
         inputs=[lang_radio, input_img, symptoms_txt, region_selector],
-        outputs=[input_img, symptoms_txt, submit_btn, region_selector, input_hint_html, output_html, status_bar],
     )
     submit_btn.click(
         fn=predict,
-        inputs=[input_img, symptoms_txt, lang_radio, region_selector],
-        outputs=[output_html, status_bar],
         api_name="analyze",
     )
     demo.load(
         fn=on_load,
         inputs=[],
-        outputs=[lang_radio, input_img, symptoms_txt, submit_btn, region_selector, input_hint_html, body_map_html, output_html, status_bar],
     )
     gr.HTML(FOOTER_HTML)

         "map_label":              "Anatomical Map",
         "map_select":             "click to select",
         "map_selected":           "{n} region(s) selected",
+        "img_mode_label":         "Upload Mode",
+        "img_mode_standard":      "Standard (1 image)",
+        "img_mode_compare":       "Compare (2 images — before & after)",
+        "img_label_day1":         "Medical Image (Day 1)",
+        "img_label_dayx":         "Comparison Image (Day X)",
+        "tab_patient":            "Patient View",
+        "tab_doctor":             "Export for Doctor (SOAP)",
+        "critical_warning":       "⚠️ CRITICAL: Severe symptoms detected. Please visit a medical facility within 24 hours.",
+        "conditions_label":       "Possible Conditions",
+        "soap_copy_btn":          "Copy SOAP Note",
+        "soap_empty":             "Run an analysis to generate the SOAP note.",
     },
     "vn": {
         "img_label":              "Tải lên hình ảnh y tế",
         "map_label":              "Bản đồ giải phẫu",
         "map_select":             "nhấn để chọn",
         "map_selected":           "{n} vùng đã chọn",
+        "img_mode_label":         "Chế độ tải ảnh",
+        "img_mode_standard":      "Tiêu chuẩn (1 ảnh)",
+        "img_mode_compare":       "So sánh (2 ảnh — trước & sau)",
+        "img_label_day1":         "Ảnh y tế (Ngày 1)",
+        "img_label_dayx":         "Ảnh so sánh (Ngày X)",
+        "tab_patient":            "Dành cho bệnh nhân",
+        "tab_doctor":             "Xuất cho bác sĩ (SOAP)",
+        "critical_warning":       "⚠️ CẢNH BÁO: Triệu chứng nghiêm trọng được phát hiện. Vui lòng đến cơ sở y tế trong vòng 24 giờ.",
+        "conditions_label":       "Tình trạng có thể",
+        "soap_copy_btn":          "Sao chép SOAP",
+        "soap_empty":             "Thực hiện phân tích để tạo ghi chú SOAP.",
     },
     "zh": {
         "img_label":              "上传医学图像",
         "map_label":              "解剖图",
         "map_select":             "点击选择",
         "map_selected":           "已选 {n} 个部位",
+        "img_mode_label":         "上传模式",
+        "img_mode_standard":      "标准模式（1张图片）",
+        "img_mode_compare":       "对比模式（2张图片 — 前后对比）",
+        "img_label_day1":         "医疗图像（第1天）",
+        "img_label_dayx":         "对比图像（第X天）",
+        "tab_patient":            "患者视图",
+        "tab_doctor":             "导出给医生（SOAP）",
+        "critical_warning":       "⚠️ 严重警告：检测到严重症状。请在24小时内前往医疗机构就诊。",
+        "conditions_label":       "可能的病症",
+        "soap_copy_btn":          "复制SOAP记录",
+        "soap_empty":             "运行分析以生成SOAP记录。",
     },
     "es": {
         "img_label":              "Subir imagen médica",
         "map_label":              "Mapa anatómico",
         "map_select":             "haga clic para seleccionar",
         "map_selected":           "{n} región(es) seleccionada(s)",
+        "img_mode_label":         "Modo de carga",
+        "img_mode_standard":      "Estándar (1 imagen)",
+        "img_mode_compare":       "Comparar (2 imágenes — antes y después)",
+        "img_label_day1":         "Imagen médica (Día 1)",
+        "img_label_dayx":         "Imagen de comparación (Día X)",
+        "tab_patient":            "Vista del paciente",
+        "tab_doctor":             "Exportar para médico (SOAP)",
+        "critical_warning":       "⚠️ CRÍTICO: Síntomas graves detectados. Por favor, acuda a un centro médico en las próximas 24 horas.",
+        "conditions_label":       "Posibles condiciones",
+        "soap_copy_btn":          "Copiar nota SOAP",
+        "soap_empty":             "Ejecute un análisis para generar la nota SOAP.",
     },
     "fr": {
         "img_label":              "Télécharger une image médicale",
         "map_label":              "Carte anatomique",
         "map_select":             "cliquer pour sélectionner",
         "map_selected":           "{n} région(s) sélectionnée(s)",
+        "img_mode_label":         "Mode de téléchargement",
+        "img_mode_standard":      "Standard (1 image)",
+        "img_mode_compare":       "Comparer (2 images — avant et après)",
+        "img_label_day1":         "Image médicale (Jour 1)",
+        "img_label_dayx":         "Image de comparaison (Jour X)",
+        "tab_patient":            "Vue patient",
+        "tab_doctor":             "Exporter pour le médecin (SOAP)",
+        "critical_warning":       "⚠️ CRITIQUE : Symptômes graves détectés. Veuillez vous rendre dans un établissement médical dans les 24 heures.",
+        "conditions_label":       "Conditions possibles",
+        "soap_copy_btn":          "Copier la note SOAP",
+        "soap_empty":             "Lancez une analyse pour générer la note SOAP.",
     },
     "ja": {
         "img_label":              "医療画像をアップロード",
         "map_label":              "解剖マップ",
         "map_select":             "クリックして選択",
         "map_selected":           "{n} 部位選択中",
+        "img_mode_label":         "アップロードモード",
+        "img_mode_standard":      "標準（画像1枚）",
+        "img_mode_compare":       "比較（画像2枚 — 経過観察）",
+        "img_label_day1":         "医療画像（第1日）",
+        "img_label_dayx":         "比較画像（第X日）",
+        "tab_patient":            "患者向け",
+        "tab_doctor":             "医師向けエクスポート（SOAP）",
+        "critical_warning":       "⚠️ 重大：重篤な症状が検出されました。24時間以内に医療機関を受診してください。",
+        "conditions_label":       "考えられる疾患",
+        "soap_copy_btn":          "SOAPノートをコピー",
+        "soap_empty":             "分析を実行してSOAPノートを生成します。",
     },
 }
     )
def _empty_soap_html(lang: str) -> str:
    """Return the SOAP panel markup for the state where no note exists yet.

    Delegates to ``_build_soap_html`` with an empty note so the placeholder
    rendering lives in one place.
    """
    no_note = ""
    return _build_soap_html(no_note, lang)
 def _build_result_html(result: dict, lang: str) -> str:
+    t             = _I18N.get(lang, _I18N["en"])
+    triage        = result.get("triage_level", "Low")
+    patient_msg   = result.get("patient_message", "")
+    conditions    = result.get("possible_conditions", [])
+    metrics       = result.get("_metrics", {})
     backend_tag = (
         "<span style='font-size:0.7rem; background:#052e16; color:#86efac; "
         "border:1px solid #16a34a;'>AMD Cloud</span>"
     )
+    # Triage color
+    triage_colors = {
+        "High":   ("#ef4444", "#7f1d1d"),
+        "Medium": ("#f97316", "#431407"),
+        "Low":    ("#22c55e", "#052e16"),
+    }
+    t_color, t_bg = triage_colors.get(triage, ("#22c55e", "#052e16"))
+    # Red-flag flashing banner
+    critical_banner = ""
+    if triage == "High":
+        critical_banner = f"""
+  <div style='animation:redflash 1s ease-in-out infinite;
+              background:#7f1d1d; border:2px solid #ef4444; border-radius:8px;
+              padding:14px 18px; margin-bottom:16px; text-align:center;'>
+    <span style='color:#fca5a5; font-weight:900; font-size:0.95rem; line-height:1.5;'>
+      {t['critical_warning']}
+    </span>
+  </div>"""
+    # Possible conditions chips
+    cond_chips = "".join(
+        f"<span style='background:#1e3a5f; color:#93c5fd; font-size:0.72rem; "
+        f"padding:3px 10px; border-radius:999px; border:1px solid #2563eb;'>{c}</span>"
+        for c in conditions
+    ) if conditions else "<span style='color:#6b7280;'>—</span>"
+    # Patient message paragraphs
+    msg_html = "".join(
+        f"<p style='margin:0 0 8px; color:#d1d5db; line-height:1.6;'>{line}</p>"
+        for line in patient_msg.split("\n") if line.strip()
+    ) if patient_msg else "<p style='color:#6b7280;'>—</p>"
     return f"""
 <div style='background:#111827; border:1px solid #ED1C24; border-radius:12px;
             padding:20px; font-family:Arial,sans-serif; color:#f9fafb;'>
       <div style='font-size:1.1rem; font-weight:700; color:#ED1C24;'>
         MediVision {backend_tag}
       </div>
+      <div style='font-size:0.75rem; color:#6b7280;'>AMD MI300X · ROCm · Qwen2.5-VL-7B · 3-Step Pipeline</div>
     </div>
   </div>
   {_metrics_bar(metrics, t)}
+  {critical_banner}
   <div style='background:#1f2937; border-radius:8px; padding:14px; margin-bottom:12px;'>
     <div style='font-size:0.75rem; text-transform:uppercase; letter-spacing:.05em;
+                color:#9ca3af; margin-bottom:6px;'>{t['severity_label']}</div>
+    <span style='background:{t_bg}; color:{t_color}; font-weight:700;
+                 padding:4px 16px; border-radius:999px; font-size:0.9rem;
+                 border:2px solid {t_color};'>{triage}</span>
   </div>
   <div style='background:#1f2937; border-radius:8px; padding:14px; margin-bottom:12px;'>
     <div style='font-size:0.75rem; text-transform:uppercase; letter-spacing:.05em;
+                color:#9ca3af; margin-bottom:8px;'>{t['conditions_label']}</div>
+    <div style='display:flex; flex-wrap:wrap; gap:6px;'>{cond_chips}</div>
   </div>
   <div style='background:#1f2937; border-radius:8px; padding:14px; margin-bottom:12px;'>
     <div style='font-size:0.75rem; text-transform:uppercase; letter-spacing:.05em;
                 color:#9ca3af; margin-bottom:8px;'>{t['actions_label']}</div>
+    {msg_html}
   </div>
   <div style='background:#1a1a2e; border-left:4px solid #ED1C24; border-radius:4px;
 """
def _build_soap_html(soap_text: str, lang: str = "en") -> str:
    """Render a SOAP note as an HTML card with a copy-to-clipboard button.

    Args:
        soap_text: Plain-text SOAP note, one entry per line. An empty value
            yields the localized "no note yet" placeholder instead of a card.
        lang: Key into ``_I18N``; unknown keys fall back to English.

    Returns:
        An HTML fragment. Lines starting with ``"S "``, ``"O "``, ``"A "`` or
        ``"P "`` are highlighted as section headers; blank lines are dropped.
    """
    # Function-scope import: the file's import block is not visible from here.
    import html

    t = _I18N.get(lang, _I18N["en"])
    if not soap_text:
        return (
            f"<div style='color:#4b5563; text-align:center; padding:40px 0; font-size:0.9rem;'>"
            f"{t['soap_empty']}</div>"
        )

    section_prefixes = ("S ", "O ", "A ", "P ")
    rows = []
    for line in soap_text.split("\n"):
        if not line.strip():
            continue
        is_header = line.startswith(section_prefixes)
        color = "#ED1C24" if is_header else "#d1d5db"
        weight = "700" if is_header else "400"
        # The note is model output built from user-supplied text, so it must
        # be escaped before being placed into markup.
        rows.append(
            f"<div style='padding:3px 0; color:{color}; "
            f"font-weight:{weight};'>{html.escape(line)}</div>"
        )
    lines_html = "".join(rows)

    # Full attribute escaping (&, <, >, quotes) so the browser hands the
    # original text back through ``dataset.text`` unchanged.
    clipboard_text = html.escape(soap_text, quote=True)
    copy_label = t["soap_copy_btn"]

    return f"""
<div style='background:#0f172a; border:1px solid #1e3a5f; border-radius:12px;
            padding:20px; font-family:monospace; font-size:0.82rem; line-height:1.7;'>
  <div style='display:flex; justify-content:space-between; align-items:center; margin-bottom:14px;'>
    <span style='color:#ED1C24; font-weight:700; font-size:0.9rem; font-family:sans-serif;'>
      SOAP Clinical Note
    </span>
    <button onclick="navigator.clipboard.writeText(this.dataset.text).then(()=>this.textContent='{copy_label} ✓').catch(()=>null)"
            data-text="{clipboard_text}"
            style='background:#1e3a5f; color:#93c5fd; border:1px solid #2563eb; border-radius:6px;
                   padding:4px 12px; cursor:pointer; font-size:0.72rem;'>
      {copy_label}
    </button>
  </div>
  {lines_html}
</div>
"""
 # ---------------------------------------------------------------------------
 # UI update helpers
 # ---------------------------------------------------------------------------
         f"<p style='font-size:0.75rem; color:#6b7280; margin:4px 0 10px;'>{t['input_hint']}</p>"
     )
     return (
+        gr.update(label=t["img_label"], choices=[t["img_mode_standard"], t["img_mode_compare"]]),
+        gr.update(label=t["img_label_day1"]),
+        gr.update(label=t["img_label_dayx"]),
         gr.update(label=t["symptoms_label"], placeholder=t["symptoms_placeholder"]),
         gr.update(value=t["analyze_btn"]),
         gr.update(label=t["region_optional_label"], choices=new_choices, value=translated),
 def on_lang_change(lang_choice: str, image, symptoms: str, selected_regions):
     lang = _LANG_MAP.get(lang_choice, "en")
     t = _I18N[lang]
+    mode_upd, day1_upd, dayx_upd, sym_upd, btn_upd, region_upd, hint_upd = _ui_updates(
+        lang_choice, current_regions=selected_regions
+    )
     region = _regions_to_prompt(selected_regions)
     has_content = bool(image) or bool(symptoms and symptoms.strip())
     if has_content:
         try:
+            result = get_pipeline().process(image, None, (symptoms or "").strip(), lang=lang, region=region)
+            out_upd  = _build_result_html(result, lang)
+            soap_upd = _build_soap_html(result.get("soap_note", ""), lang)
         except Exception as exc:
+            out_upd  = _error_html(t, exc)
+            soap_upd = _empty_soap_html(lang)
     else:
+        out_upd  = _empty_output_html(lang)
+        soap_upd = _empty_soap_html(lang)
+    return mode_upd, day1_upd, dayx_upd, sym_upd, btn_upd, region_upd, hint_upd, out_upd, soap_upd, get_backend_status_html(lang)
 def on_load(request: gr.Request):
     lang_display = _detect_lang_from_header(
         request.headers.get("accept-language", "")
     )
+    mode_upd, day1_upd, dayx_upd, sym_upd, btn_upd, region_upd, hint_upd = _ui_updates(
+        lang_display, current_regions=[]
+    )
     lang = _LANG_MAP.get(lang_display, "en")
+    return (
+        lang_display,
+        mode_upd, day1_upd, dayx_upd,
+        sym_upd, btn_upd, region_upd, hint_upd,
+        _body_map_svg([], lang),
+        _empty_output_html(lang),
+        _empty_soap_html(lang),
+        get_backend_status_html(lang),
+    )
 # ---------------------------------------------------------------------------
 # Predict
 # ---------------------------------------------------------------------------
def predict(image_1, image_2, symptoms: str, lang_choice: str, selected_regions):
    """Run the analysis pipeline and render both output panels.

    Returns:
        ``(patient_html, soap_html, status_html)``. With no image and no
        non-blank symptom text the empty placeholders are returned without
        calling the pipeline; on any exception the patient panel shows the
        error and the SOAP panel is reset to its placeholder.
    """
    lang = _LANG_MAP.get(lang_choice, "en")
    t = _I18N[lang]

    if not (image_1 or image_2 or (symptoms or "").strip()):
        return _empty_output_html(lang), _empty_soap_html(lang), get_backend_status_html(lang)

    region = _regions_to_prompt(selected_regions)
    try:
        result = get_pipeline().process(
            image_1, image_2, (symptoms or "").strip(), lang=lang, region=region
        )
        panels = (
            _build_result_html(result, lang),
            _build_soap_html(result.get("soap_note", ""), lang),
            get_backend_status_html(lang),
        )
    except Exception as exc:
        return _error_html(t, exc), _empty_soap_html(lang), get_backend_status_html(lang)
    else:
        return panels
 # ---------------------------------------------------------------------------
     letter-spacing: 0.04em;
 }
 footer { display: none !important; }
+@keyframes redflash {
+  0%, 100% { opacity: 1; box-shadow: 0 0 12px rgba(239,68,68,0.6); }
+  50%       { opacity: 0.7; box-shadow: 0 0 24px rgba(239,68,68,0.9); }
+}
 ::-webkit-scrollbar { width: 6px; }
 ::-webkit-scrollbar-track { background: #111827; }
 ::-webkit-scrollbar-thumb { background: #374151; border-radius: 3px; }
     with gr.Row(equal_height=False):
         with gr.Column(scale=1, min_width=300):
+            img_mode = gr.Radio(
+                choices=[_I18N["en"]["img_mode_standard"], _I18N["en"]["img_mode_compare"]],
+                value=_I18N["en"]["img_mode_standard"],
+                label=_I18N["en"]["img_mode_label"],
+                elem_id="img-mode-radio",
             )
+            with gr.Row(equal_height=True):
+                input_img = gr.Image(
+                    type="filepath",
+                    label=_I18N["en"]["img_label_day1"],
+                    height=200,
+                )
+                input_img_2 = gr.Image(
+                    type="filepath",
+                    label=_I18N["en"]["img_label_dayx"],
+                    height=200,
+                    visible=False,
+                )
             symptoms_txt = gr.Textbox(
                 label="Symptoms Description",
                 placeholder="Describe what you feel — e.g. itchy red patch for 3 days...",
             )
         with gr.Column(scale=1, min_width=340):
+            with gr.Tabs(elem_id="output-tabs"):
+                with gr.TabItem(_I18N["en"]["tab_patient"], elem_id="tab-patient"):
+                    output_html = gr.HTML(value=_empty_output_html("en"))
+                with gr.TabItem(_I18N["en"]["tab_doctor"], elem_id="tab-doctor"):
+                    soap_html = gr.HTML(value=_empty_soap_html("en"))
     # ── Events ───────────────────────────────────────────────────────────────
+    # Image mode toggle: show/hide second image upload
+    img_mode.change(
+        fn=lambda m: gr.update(visible=_I18N["en"]["img_mode_compare"] in m),
+        inputs=[img_mode],
+        outputs=[input_img_2],
+    )
     # SVG click → toggle region in dropdown + re-render SVG
     svg_click_bridge.input(
         fn=on_svg_click,
     lang_radio.change(
         fn=on_lang_change,
         inputs=[lang_radio, input_img, symptoms_txt, region_selector],
+        outputs=[img_mode, input_img, input_img_2, symptoms_txt, submit_btn,
+                 region_selector, input_hint_html, output_html, soap_html, status_bar],
     )
     submit_btn.click(
         fn=predict,
+        inputs=[input_img, input_img_2, symptoms_txt, lang_radio, region_selector],
+        outputs=[output_html, soap_html, status_bar],
         api_name="analyze",
     )
     demo.load(
         fn=on_load,
         inputs=[],
+        outputs=[
+            lang_radio,
+            img_mode, input_img, input_img_2,
+            symptoms_txt, submit_btn, region_selector, input_hint_html,
+            body_map_html, output_html, soap_html, status_bar,
+        ],
     )
     gr.HTML(FOOTER_HTML)

src/agents.py ADDED Viewed

	@@ -0,0 +1,64 @@

+import json
+import re
+from src.model_loader import generate_response, generate_text
+from src.prompts import VISION_AGENT_SYSTEM, CLINICAL_AGENT_SYSTEM, FORMAT_AGENT_SYSTEM
+_LANG_NAMES = {
+    "en": "English",
+    "vn": "Vietnamese",
+    "zh": "Simplified Chinese",
+    "es": "Spanish",
+    "fr": "French",
+    "ja": "Japanese",
+}
def vision_agent(image_path_1, image_path_2, symptoms: str) -> tuple[str, dict]:
    """Step 1: ask the model for a strictly objective visual description.

    The prompt is the vision system text, an optional note announcing that
    two images (Day 1 and Day X) are attached, and the patient's symptom text.

    Returns:
        Whatever ``generate_response`` returns: ``(description_text, metrics)``.
    """
    sections = [VISION_AGENT_SYSTEM, "\n\n"]
    if image_path_2:
        sections.append(
            "TWO images are provided: the first image is Day 1, the second image is Day X.\n\n"
        )
    sections.append(f"Patient symptom text: {symptoms or '(none provided)'}")

    # Falsy paths (e.g. empty string) are normalized to None for the loader.
    return generate_response(
        "".join(sections),
        image_path=image_path_1 or None,
        image_path_2=image_path_2 or None,
    )
def clinical_agent(visual_description: str, symptoms: str) -> tuple[dict, dict]:
    """Step 2: clinical reasoning → strict JSON. Returns (parsed_dict, metrics).

    Args:
        visual_description: Objective description produced by the vision step.
        symptoms: Patient-provided symptom text; may be empty.

    Returns:
        ``(clinical, metrics)`` where ``clinical`` has the keys
        ``triage_level``, ``possible_conditions``, ``clinical_assessment`` and
        ``recommendation``.

    Raises:
        ValueError: if the model output contains no parseable JSON object.
    """
    prompt = (
        CLINICAL_AGENT_SYSTEM + "\n\n"
        f"VISUAL DESCRIPTION:\n{visual_description}\n\n"
        f"PATIENT SYMPTOMS:\n{symptoms or '(none provided)'}"
    )
    raw, metrics = generate_text(prompt)

    # Decode the object that starts at the first "{" and ignore whatever
    # follows it, so trailing commentary (even commentary containing braces)
    # no longer breaks parsing.
    start = raw.find("{")
    if start == -1:
        raise ValueError(f"Clinical agent did not return JSON: {raw[:300]}")
    try:
        data, _ = json.JSONDecoder().raw_decode(raw, start)
    except json.JSONDecodeError as exc:
        raise ValueError(f"Clinical agent did not return JSON: {raw[:300]}") from exc

    # The UI matches the triage level by exact string ("High" drives the
    # red-flag banner), so canonicalize case/whitespace variants. Values that
    # are not one of the three known levels are passed through unchanged.
    canonical_levels = {"high": "High", "medium": "Medium", "low": "Low"}
    triage = data.get("triage_level", "Low")
    if isinstance(triage, str):
        triage = canonical_levels.get(triage.strip().lower(), triage)

    # The UI iterates this value to draw one chip per condition; a bare string
    # would be split into characters, and null is treated as "no conditions".
    conditions = data.get("possible_conditions", [])
    if conditions is None:
        conditions = []
    elif isinstance(conditions, str):
        conditions = [conditions] if conditions.strip() else []

    return {
        "triage_level":        triage,
        "possible_conditions": conditions,
        "clinical_assessment": data.get("clinical_assessment", ""),
        "recommendation":      data.get("recommendation", ""),
    }, metrics
def format_agent(clinical_json: dict, visual_description: str,
                 symptoms: str, lang: str) -> tuple[str, str, dict]:
    """Step 3: produce the patient-facing message and the SOAP note.

    The model reply is split at the first ``===SOAP===`` marker: text before
    it is the patient message, text after it is the SOAP note. Without the
    marker the whole reply is the patient message and the SOAP note is empty.

    Returns:
        ``(patient_msg, soap_text, metrics)``, both texts stripped.
    """
    target_language = _LANG_NAMES.get(lang, "English")
    clinical_dump = json.dumps(clinical_json, ensure_ascii=False, indent=2)
    prompt = "\n\n".join([
        FORMAT_AGENT_SYSTEM,
        f"TARGET LANGUAGE: {target_language}",
        f"PATIENT ORIGINAL COMPLAINT: {symptoms or '(none)'}",
        f"VISUAL DESCRIPTION (Objective):\n{visual_description}",
        f"CLINICAL JSON:\n{clinical_dump}",
    ])

    raw, metrics = generate_text(prompt)
    # partition() yields ("<all>", "", "") when the marker is absent.
    patient_msg, _marker, soap = raw.partition("===SOAP===")
    return patient_msg.strip(), soap.strip(), metrics

src/inference.py CHANGED Viewed

@@ -1,18 +1,37 @@
-from src.agent import analyze_image_and_text
 class MediVisionPipeline:
-    def process(self, image_path, symptoms: str, lang: str = "en", region: str = "") -> dict:
         """
-        Run the full analysis pipeline.
-        Raises RuntimeError if the AMD Cloud backend is unreachable.
-        Returns:
-            dict with keys: diagnosis, severity, recommended_actions, confidence_score, _metrics
         """
-        return analyze_image_and_text(
-            image_path=image_path,
-            text_description=symptoms,
-            language=lang,
-            region=region,
-        )

+from src.agents import vision_agent, clinical_agent, format_agent
 class MediVisionPipeline:
+    def process(self, image_path_1, image_path_2, symptoms: str,
+                lang: str = "en", region: str = "") -> dict:
         """
+        Run the 3-step agentic pipeline:
+          Step 1 — Vision Agent: objective visual description
+          Step 2 — Clinical Agent: triage JSON
+          Step 3 — Format Agent: patient message + SOAP note
+        Returns dict with keys:
+            triage_level, possible_conditions, patient_message,
+            soap_note, visual_description, _metrics
         """
+        symptoms_full = f"{'Region: ' + region + '. ' if region else ''}{symptoms}"
+        visual_desc, m1 = vision_agent(image_path_1, image_path_2, symptoms_full)
+        clinical,    m2 = clinical_agent(visual_desc, symptoms_full)
+        patient_msg, soap, m3 = format_agent(clinical, visual_desc, symptoms_full, lang)
+        metrics = {
+            "latency_ms":    m1["latency_ms"] + m2["latency_ms"] + m3["latency_ms"],
+            "total_tokens":  m1["total_tokens"] + m2["total_tokens"] + m3["total_tokens"],
+            "tokens_per_sec": round(
+                (m1.get("tokens_per_sec", 0) + m2.get("tokens_per_sec", 0) + m3.get("tokens_per_sec", 0)) / 3, 1
+            ),
+        }
+        return {
+            "triage_level":        clinical["triage_level"],
+            "possible_conditions": clinical["possible_conditions"],
+            "patient_message":     patient_msg,
+            "soap_note":           soap,
+            "visual_description":  visual_desc,
+            "_metrics":            metrics,
+        }

src/model_loader.py CHANGED Viewed

@@ -62,9 +62,11 @@ def check_connection() -> tuple[bool, str]:
         return False, f"{type(exc).__name__}: {exc}"
-def generate_response(prompt: str, image_path: str = None) -> tuple[str, dict]:
     """
     Send a request to the vLLM endpoint and return (text_output, metrics).
     metrics keys:
         latency_ms  – wall-clock time for the API call in milliseconds
@@ -76,20 +78,18 @@ def generate_response(prompt: str, image_path: str = None) -> tuple[str, dict]:
     try:
         client = _get_client()
-        if image_path:
-            b64, mime = _encode_image(image_path)
-            messages = [
-                {
-                    "role": "user",
-                    "content": [
-                        {
-                            "type": "image_url",
-                            "image_url": {"url": f"data:{mime};base64,{b64}"},
-                        },
-                        {"type": "text", "text": prompt},
-                    ],
-                }
-            ]
         else:
             messages = [{"role": "user", "content": prompt}]
@@ -116,3 +116,8 @@ def generate_response(prompt: str, image_path: str = None) -> tuple[str, dict]:
     except Exception as exc:
         raise RuntimeError(f"AMD Cloud backend unreachable: {exc}") from exc

         return False, f"{type(exc).__name__}: {exc}"
+def generate_response(prompt: str, image_path: str = None,
+                      image_path_2: str = None) -> tuple[str, dict]:
     """
     Send a request to the vLLM endpoint and return (text_output, metrics).
+    Supports 0, 1, or 2 images (image_path_2 for A/B comparison).
     metrics keys:
         latency_ms  – wall-clock time for the API call in milliseconds
     try:
         client = _get_client()
+        if image_path or image_path_2:
+            content = []
+            if image_path:
+                b64, mime = _encode_image(image_path)
+                content.append({"type": "image_url",
+                                 "image_url": {"url": f"data:{mime};base64,{b64}"}})
+            if image_path_2:
+                b64, mime = _encode_image(image_path_2)
+                content.append({"type": "image_url",
+                                 "image_url": {"url": f"data:{mime};base64,{b64}"}})
+            content.append({"type": "text", "text": prompt})
+            messages = [{"role": "user", "content": content}]
         else:
             messages = [{"role": "user", "content": prompt}]
     except Exception as exc:
         raise RuntimeError(f"AMD Cloud backend unreachable: {exc}") from exc
+def generate_text(prompt: str) -> tuple[str, dict]:
+    """Run a prompt with no image attached.
+
+    Convenience wrapper: forwards to generate_response() with the image
+    argument explicitly unset and returns its (text_output, metrics) result
+    unchanged.
+    """
+    text_and_metrics = generate_response(prompt, image_path=None)
+    return text_and_metrics

src/prompts.py ADDED Viewed

	@@ -0,0 +1,53 @@

+# System prompt for step 1 (Vision Agent).  Restricts the model to an
+# objective description of the image(s): no diagnosis, no advice.  Covers
+# both the single-image case and the two-image "Day 1 vs Day X" comparison,
+# which must end with an IMPROVED / UNCHANGED / WORSENED verdict.  Output is
+# plain text, not JSON.
+# NOTE(review): presumably consumed by vision_agent in src/agents.py - confirm.
+VISION_AGENT_SYSTEM = """You are a medical imaging assistant performing STRICTLY OBJECTIVE visual analysis.
+Do NOT diagnose. Do NOT give medical advice. Do NOT speculate on conditions.
+Your ONLY job: describe exactly what you see in the image(s) using clinical descriptive language.
+If ONE image is provided, describe:
+- Lesion size (estimated), shape, border characteristics
+- Color(s), texture, surface features (scaling, crusting, ulceration, exudate)
+- Surrounding skin condition
+- Any signs of inflammation, swelling, or structural abnormality
+If TWO images are provided (Day 1 vs Day X), describe BOTH images separately, then compare:
+- Changes in size (larger / smaller / same)
+- Changes in color or border definition
+- Changes in surface features (scaling, crusting, exudate)
+- Overall progression verdict: IMPROVED / UNCHANGED / WORSENED
+Output: plain text only. No JSON. No diagnosis. No recommendations."""
+# System prompt for step 2 (Clinical Agent).  Input is the visual description
+# plus the patient's symptom text; output must be a bare JSON object with the
+# keys triage_level ("High" / "Medium" / "Low"), possible_conditions,
+# clinical_assessment and recommendation.  The wording is dermatology-specific.
+# NOTE(review): the model is told not to emit markdown fences, but a prompt
+# cannot guarantee that - the caller presumably has to parse defensively.
+CLINICAL_AGENT_SYSTEM = """You are a clinical reasoning engine for a dermatology triage system.
+You receive: (1) an objective visual description and (2) the patient's symptom text.
+You perform clinical reasoning and output ONLY a JSON object — no extra text, no markdown fences.
+JSON schema (strict):
+{
+  "triage_level": "High" | "Medium" | "Low",
+  "possible_conditions": ["condition 1", "condition 2"],
+  "clinical_assessment": "brief medical reasoning (2-3 sentences max)",
+  "recommendation": "immediate actions or home care advice (2-4 sentences)"
+}
+triage_level rules:
+- "High": suspected melanoma, necrosis, severe cellulitis, rapidly spreading infection, deep burn
+- "Medium": moderate infection signs, non-healing wound >2 weeks, significant inflammation
+- "Low": minor abrasion, mild rash, superficial wound with no infection signs
+Return ONLY the JSON object. No explanation before or after."""
+# System prompt for step 3 (Format Agent).  Asks for two sections split by the
+# literal delimiter line "===SOAP===": first a patient-facing message in the
+# target language, then a SOAP note (S/O/A/P lines) in English.
+# NOTE(review): the target language is not named in this prompt, so the caller
+# presumably supplies it in the user message - confirm in src/agents.py.
+FORMAT_AGENT_SYSTEM = """You are a medical communication specialist. You receive clinical data and
+format it into two outputs separated by the EXACT delimiter line: ===SOAP===
+Output structure (follow exactly):
+[PATIENT section — warm, empathetic, easy-to-understand message in the TARGET LANGUAGE]
+===SOAP===
+S (Subjective): [patient's original complaint, verbatim or close paraphrase]
+O (Objective): [1-2 sentence summary of the visual description]
+A (Assessment): [possible conditions and brief clinical reasoning]
+P (Plan): [recommended actions from clinical assessment]
+Rules:
+- Patient section: non-technical language, supportive tone, in the TARGET LANGUAGE specified
+- SOAP section: professional clinical English regardless of target language
+- Do NOT add any text outside this structure
+- Do NOT add a header or title line before the patient section"""